diff --git "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" --- "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" +++ "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0434, "train/learning_rate": 2.0605700712589072e-06, "train/epoch": 19.62, "train/global_step": 17500, "_runtime": 112316, "_timestamp": 1647706193, "_step": 17506, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 2.0, 15.0, 20.0, 54.0, 108.0, 165.0, 221.0, 212.0, 113.0, 59.0, 27.0, 11.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.312162399291992, -18.56810188293457, -15.824040412902832, -13.079978942871094, -10.335918426513672, -7.59185791015625, -4.847795486450195, -2.1037349700927734, 0.6403255462646484, 3.3843865394592285, 6.128447532653809, 8.872509002685547, 11.616569519042969, 14.36063003540039, 17.104692459106445, 19.848752975463867, 22.59281349182129, 25.33687400817871, 28.080936431884766, 30.824996948242188, 33.56905746459961, 36.31311798095703, 39.05718231201172, 41.801239013671875, 44.54530334472656, 47.289363861083984, 50.033424377441406, 52.777488708496094, 55.52154541015625, 58.26560974121094, 61.00967025756836, 63.75373077392578, 66.49778747558594, 69.24185180664062, 71.98590850830078, 74.72997283935547, 77.47402954101562, 80.21809387207031, 82.962158203125, 85.70621490478516, 88.45027160644531, 91.1943359375, 93.93839263916016, 96.68245697021484, 99.426513671875, 102.17057800292969, 104.91464233398438, 107.65869903564453, 110.40276336669922, 113.1468276977539, 115.89088439941406, 118.63494873046875, 121.3790054321289, 124.1230697631836, 126.86712646484375, 129.61119079589844, 132.35525512695312, 135.0993194580078, 137.8433837890625, 140.58743286132812, 143.3314971923828, 146.0755615234375, 148.8196258544922, 151.56369018554688, 154.3077392578125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 14.0, 14.0, 20.0, 32.0, 27.0, 33.0, 38.0, 56.0, 37.0, 37.0, 39.0, 66.0, 60.0, 56.0, 53.0, 51.0, 53.0, 37.0, 44.0, 36.0, 38.0, 28.0, 29.0, 22.0, 21.0, 8.0, 6.0, 8.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.62236022949219, -31.6335506439209, -30.644742965698242, -29.655933380126953, -28.667125701904297, -27.678316116333008, -26.68950653076172, -25.700698852539062, -24.711891174316406, -23.723081588745117, -22.73427391052246, -21.745464324951172, -20.756656646728516, -19.767847061157227, -18.779037475585938, -17.79022979736328, -16.801420211791992, -15.81261157989502, -14.823802947998047, -13.834993362426758, -12.846185684204102, -11.857376098632812, -10.86856746673584, -9.879758834838867, -8.890950202941895, -7.902141571044922, -6.913332939147949, -5.924523830413818, -4.935715198516846, -3.946906566619873, -2.958097457885742, -1.9692888259887695, -0.9804782867431641, 0.008330464363098145, 0.9971392154693604, 1.985948085784912, 2.9747567176818848, 3.9635653495788574, 4.952374458312988, 5.941183090209961, 6.929991722106934, 7.918800354003906, 8.907608985900879, 9.896417617797852, 10.88522720336914, 11.874034881591797, 12.862844467163086, 13.851653099060059, 14.840461730957031, 15.829270362854004, 16.818078994750977, 17.806888580322266, 18.795696258544922, 19.78450584411621, 20.7733154296875, 21.762123107910156, 22.750930786132812, 23.7397403717041, 24.728548049926758, 25.717357635498047, 26.706165313720703, 27.694974899291992, 28.68378448486328, 29.672592163085938, 30.661401748657227]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 5.0, 12.0, 13.0, 10.0, 13.0, 17.0, 27.0, 25.0, 38.0, 35.0, 34.0, 39.0, 45.0, 46.0, 58.0, 56.0, 54.0, 53.0, 48.0, 51.0, 60.0, 35.0, 45.0, 41.0, 35.0, 18.0, 26.0, 11.0, 18.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51953125, -2.441650390625, -2.36376953125, -2.285888671875, -2.2080078125, -2.130126953125, -2.05224609375, -1.974365234375, -1.896484375, -1.818603515625, -1.74072265625, -1.662841796875, -1.5849609375, -1.507080078125, -1.42919921875, -1.351318359375, -1.2734375, -1.195556640625, -1.11767578125, -1.039794921875, -0.9619140625, -0.884033203125, -0.80615234375, -0.728271484375, -0.650390625, -0.572509765625, -0.49462890625, -0.416748046875, -0.3388671875, -0.260986328125, -0.18310546875, -0.105224609375, -0.02734375, 0.050537109375, 0.12841796875, 0.206298828125, 0.2841796875, 0.362060546875, 0.43994140625, 0.517822265625, 0.595703125, 0.673583984375, 0.75146484375, 0.829345703125, 0.9072265625, 0.985107421875, 1.06298828125, 1.140869140625, 1.21875, 1.296630859375, 1.37451171875, 1.452392578125, 1.5302734375, 1.608154296875, 1.68603515625, 1.763916015625, 1.841796875, 1.919677734375, 1.99755859375, 2.075439453125, 2.1533203125, 2.231201171875, 2.30908203125, 2.386962890625, 2.46484375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 10.0, 16.0, 20.0, 23.0, 44.0, 64.0, 100.0, 115.0, 157.0, 249.0, 382.0, 695.0, 1842.0, 6802.0, 41142.0, 770747.0, 3282921.0, 74559.0, 10288.0, 2203.0, 790.0, 385.0, 236.0, 166.0, 95.0, 78.0, 53.0, 32.0, 19.0, 12.0, 6.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.015625, -27.240234375, -26.46484375, -25.689453125, -24.9140625, -24.138671875, -23.36328125, -22.587890625, -21.8125, -21.037109375, -20.26171875, -19.486328125, -18.7109375, -17.935546875, -17.16015625, -16.384765625, -15.609375, -14.833984375, -14.05859375, -13.283203125, -12.5078125, -11.732421875, -10.95703125, -10.181640625, -9.40625, -8.630859375, -7.85546875, -7.080078125, -6.3046875, -5.529296875, -4.75390625, -3.978515625, -3.203125, -2.427734375, -1.65234375, -0.876953125, -0.1015625, 0.673828125, 1.44921875, 2.224609375, 3.0, 3.775390625, 4.55078125, 5.326171875, 6.1015625, 6.876953125, 7.65234375, 8.427734375, 9.203125, 9.978515625, 10.75390625, 11.529296875, 12.3046875, 13.080078125, 13.85546875, 14.630859375, 15.40625, 16.181640625, 16.95703125, 17.732421875, 18.5078125, 19.283203125, 20.05859375, 20.833984375, 21.609375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 3.0, 6.0, 10.0, 13.0, 8.0, 9.0, 21.0, 24.0, 21.0, 41.0, 44.0, 57.0, 82.0, 82.0, 101.0, 127.0, 180.0, 251.0, 313.0, 533.0, 599.0, 379.0, 243.0, 211.0, 152.0, 119.0, 100.0, 64.0, 51.0, 47.0, 36.0, 37.0, 33.0, 18.0, 14.0, 7.0, 4.0, 7.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.8359375, -6.62957763671875, -6.4232177734375, -6.21685791015625, -6.010498046875, -5.80413818359375, -5.5977783203125, -5.39141845703125, -5.18505859375, -4.97869873046875, -4.7723388671875, -4.56597900390625, -4.359619140625, -4.15325927734375, -3.9468994140625, -3.74053955078125, -3.5341796875, -3.32781982421875, -3.1214599609375, -2.91510009765625, -2.708740234375, -2.50238037109375, -2.2960205078125, -2.08966064453125, -1.88330078125, -1.67694091796875, -1.4705810546875, -1.26422119140625, -1.057861328125, -0.85150146484375, -0.6451416015625, -0.43878173828125, -0.232421875, -0.02606201171875, 0.1802978515625, 0.38665771484375, 0.593017578125, 0.79937744140625, 1.0057373046875, 1.21209716796875, 1.41845703125, 1.62481689453125, 1.8311767578125, 2.03753662109375, 2.243896484375, 2.45025634765625, 2.6566162109375, 2.86297607421875, 3.0693359375, 3.27569580078125, 3.4820556640625, 3.68841552734375, 3.894775390625, 4.10113525390625, 4.3074951171875, 4.51385498046875, 4.72021484375, 4.92657470703125, 5.1329345703125, 5.33929443359375, 5.545654296875, 5.75201416015625, 5.9583740234375, 6.16473388671875, 6.37109375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 10.0, 8.0, 7.0, 13.0, 33.0, 36.0, 57.0, 81.0, 132.0, 195.0, 292.0, 527.0, 906.0, 1691.0, 3541.0, 7407.0, 20693.0, 68784.0, 287613.0, 2494006.0, 1070216.0, 167776.0, 44265.0, 14411.0, 5670.0, 2580.0, 1384.0, 794.0, 416.0, 314.0, 175.0, 104.0, 38.0, 35.0, 29.0, 17.0, 11.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0, -21.349609375, -20.69921875, -20.048828125, -19.3984375, -18.748046875, -18.09765625, -17.447265625, -16.796875, -16.146484375, -15.49609375, -14.845703125, -14.1953125, -13.544921875, -12.89453125, -12.244140625, -11.59375, -10.943359375, -10.29296875, -9.642578125, -8.9921875, -8.341796875, -7.69140625, -7.041015625, -6.390625, -5.740234375, -5.08984375, -4.439453125, -3.7890625, -3.138671875, -2.48828125, -1.837890625, -1.1875, -0.537109375, 0.11328125, 0.763671875, 1.4140625, 2.064453125, 2.71484375, 3.365234375, 4.015625, 4.666015625, 5.31640625, 5.966796875, 6.6171875, 7.267578125, 7.91796875, 8.568359375, 9.21875, 9.869140625, 10.51953125, 11.169921875, 11.8203125, 12.470703125, 13.12109375, 13.771484375, 14.421875, 15.072265625, 15.72265625, 16.373046875, 17.0234375, 17.673828125, 18.32421875, 18.974609375, 19.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 11.0, 21.0, 16.0, 34.0, 49.0, 50.0, 88.0, 104.0, 112.0, 127.0, 120.0, 85.0, 67.0, 42.0, 22.0, 16.0, 9.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-63.37506103515625, -61.9963493347168, -60.617637634277344, -59.23892593383789, -57.86021423339844, -56.48149871826172, -55.102787017822266, -53.72407531738281, -52.34536361694336, -50.966651916503906, -49.58794021606445, -48.209228515625, -46.83051300048828, -45.45180130004883, -44.073089599609375, -42.69437789916992, -41.31566619873047, -39.936954498291016, -38.55824279785156, -37.17953109741211, -35.800819396972656, -34.42210388183594, -33.043392181396484, -31.66468048095703, -30.285968780517578, -28.907257080078125, -27.528545379638672, -26.149831771850586, -24.771120071411133, -23.39240837097168, -22.013694763183594, -20.63498306274414, -19.256271362304688, -17.877559661865234, -16.49884796142578, -15.120134353637695, -13.741422653198242, -12.362710952758789, -10.98399829864502, -9.60528564453125, -8.226573944091797, -6.8478617668151855, -5.469149589538574, -4.090437412261963, -2.7117252349853516, -1.3330130577087402, 0.045699119567871094, 1.4244117736816406, 2.8031234741210938, 4.181835651397705, 5.560547828674316, 6.939260005950928, 8.317972183227539, 9.696683883666992, 11.075396537780762, 12.454109191894531, 13.832820892333984, 15.211532592773438, 16.59024429321289, 17.968957901000977, 19.34766960144043, 20.726381301879883, 22.10509490966797, 23.483806610107422, 24.862518310546875]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 10.0, 7.0, 15.0, 13.0, 14.0, 10.0, 25.0, 26.0, 24.0, 43.0, 21.0, 33.0, 29.0, 31.0, 24.0, 35.0, 45.0, 41.0, 41.0, 45.0, 43.0, 40.0, 42.0, 31.0, 34.0, 32.0, 32.0, 20.0, 21.0, 26.0, 24.0, 19.0, 17.0, 13.0, 14.0, 11.0, 9.0, 3.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.057994842529297, -22.260908126831055, -21.463821411132812, -20.666732788085938, -19.869646072387695, -19.072559356689453, -18.275470733642578, -17.478384017944336, -16.681297302246094, -15.884210586547852, -15.087122917175293, -14.290035247802734, -13.492948532104492, -12.69586181640625, -11.898774147033691, -11.101686477661133, -10.30459976196289, -9.507513046264648, -8.71042537689209, -7.9133381843566895, -7.116250991821289, -6.319163799285889, -5.522076606750488, -4.724989414215088, -3.9279022216796875, -3.130815029144287, -2.3337278366088867, -1.5366406440734863, -0.7395534515380859, 0.05753374099731445, 0.8546209335327148, 1.6517081260681152, 2.4487972259521484, 3.245884418487549, 4.042971611022949, 4.84005880355835, 5.63714599609375, 6.43423318862915, 7.231320381164551, 8.02840805053711, 8.825494766235352, 9.622581481933594, 10.419669151306152, 11.216756820678711, 12.013843536376953, 12.810930252075195, 13.608017921447754, 14.405105590820312, 15.202192306518555, 15.999279022216797, 16.796367645263672, 17.593454360961914, 18.390541076660156, 19.1876277923584, 19.98471450805664, 20.781803131103516, 21.578889846801758, 22.3759765625, 23.173065185546875, 23.970151901245117, 24.76723861694336, 25.5643253326416, 26.361412048339844, 27.15850067138672, 27.95558738708496]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 11.0, 6.0, 3.0, 12.0, 20.0, 22.0, 25.0, 25.0, 27.0, 37.0, 39.0, 45.0, 56.0, 63.0, 61.0, 69.0, 60.0, 64.0, 55.0, 53.0, 34.0, 48.0, 34.0, 29.0, 30.0, 20.0, 11.0, 17.0, 12.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.11492919921875, -3.0247802734375, -2.93463134765625, -2.844482421875, -2.75433349609375, -2.6641845703125, -2.57403564453125, -2.48388671875, -2.39373779296875, -2.3035888671875, -2.21343994140625, -2.123291015625, -2.03314208984375, -1.9429931640625, -1.85284423828125, -1.7626953125, -1.67254638671875, -1.5823974609375, -1.49224853515625, -1.402099609375, -1.31195068359375, -1.2218017578125, -1.13165283203125, -1.04150390625, -0.95135498046875, -0.8612060546875, -0.77105712890625, -0.680908203125, -0.59075927734375, -0.5006103515625, -0.41046142578125, -0.3203125, -0.23016357421875, -0.1400146484375, -0.04986572265625, 0.040283203125, 0.13043212890625, 0.2205810546875, 0.31072998046875, 0.40087890625, 0.49102783203125, 0.5811767578125, 0.67132568359375, 0.761474609375, 0.85162353515625, 0.9417724609375, 1.03192138671875, 1.1220703125, 1.21221923828125, 1.3023681640625, 1.39251708984375, 1.482666015625, 1.57281494140625, 1.6629638671875, 1.75311279296875, 1.84326171875, 1.93341064453125, 2.0235595703125, 2.11370849609375, 2.203857421875, 2.29400634765625, 2.3841552734375, 2.47430419921875, 2.564453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 14.0, 26.0, 37.0, 77.0, 150.0, 252.0, 510.0, 943.0, 1621.0, 3034.0, 5660.0, 11824.0, 31714.0, 477937.0, 459105.0, 31532.0, 11809.0, 5774.0, 2961.0, 1584.0, 898.0, 471.0, 276.0, 151.0, 74.0, 43.0, 24.0, 13.0, 11.0, 9.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1171875, -7.87841796875, -7.6396484375, -7.40087890625, -7.162109375, -6.92333984375, -6.6845703125, -6.44580078125, -6.20703125, -5.96826171875, -5.7294921875, -5.49072265625, -5.251953125, -5.01318359375, -4.7744140625, -4.53564453125, -4.296875, -4.05810546875, -3.8193359375, -3.58056640625, -3.341796875, -3.10302734375, -2.8642578125, -2.62548828125, -2.38671875, -2.14794921875, -1.9091796875, -1.67041015625, -1.431640625, -1.19287109375, -0.9541015625, -0.71533203125, -0.4765625, -0.23779296875, 0.0009765625, 0.23974609375, 0.478515625, 0.71728515625, 0.9560546875, 1.19482421875, 1.43359375, 1.67236328125, 1.9111328125, 2.14990234375, 2.388671875, 2.62744140625, 2.8662109375, 3.10498046875, 3.34375, 3.58251953125, 3.8212890625, 4.06005859375, 4.298828125, 4.53759765625, 4.7763671875, 5.01513671875, 5.25390625, 5.49267578125, 5.7314453125, 5.97021484375, 6.208984375, 6.44775390625, 6.6865234375, 6.92529296875, 7.1640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 10.0, 7.0, 9.0, 10.0, 9.0, 17.0, 20.0, 27.0, 39.0, 28.0, 28.0, 34.0, 33.0, 36.0, 41.0, 43.0, 43.0, 44.0, 1063.0, 36.0, 41.0, 44.0, 40.0, 46.0, 35.0, 34.0, 30.0, 22.0, 16.0, 24.0, 20.0, 17.0, 16.0, 10.0, 11.0, 9.0, 5.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.977447509765625, -1.91583251953125, -1.854217529296875, -1.7926025390625, -1.730987548828125, -1.66937255859375, -1.607757568359375, -1.546142578125, -1.484527587890625, -1.42291259765625, -1.361297607421875, -1.2996826171875, -1.238067626953125, -1.17645263671875, -1.114837646484375, -1.05322265625, -0.991607666015625, -0.92999267578125, -0.868377685546875, -0.8067626953125, -0.745147705078125, -0.68353271484375, -0.621917724609375, -0.560302734375, -0.498687744140625, -0.43707275390625, -0.375457763671875, -0.3138427734375, -0.252227783203125, -0.19061279296875, -0.128997802734375, -0.0673828125, -0.005767822265625, 0.05584716796875, 0.117462158203125, 0.1790771484375, 0.240692138671875, 0.30230712890625, 0.363922119140625, 0.425537109375, 0.487152099609375, 0.54876708984375, 0.610382080078125, 0.6719970703125, 0.733612060546875, 0.79522705078125, 0.856842041015625, 0.91845703125, 0.980072021484375, 1.04168701171875, 1.103302001953125, 1.1649169921875, 1.226531982421875, 1.28814697265625, 1.349761962890625, 1.411376953125, 1.472991943359375, 1.53460693359375, 1.596221923828125, 1.6578369140625, 1.719451904296875, 1.78106689453125, 1.842681884765625, 1.904296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 9.0, 14.0, 14.0, 23.0, 18.0, 23.0, 26.0, 58.0, 82.0, 108.0, 146.0, 206.0, 289.0, 458.0, 773.0, 1169.0, 1980.0, 3742.0, 6792.0, 14946.0, 39535.0, 236632.0, 1664000.0, 80129.0, 23781.0, 10080.0, 5088.0, 2712.0, 1567.0, 944.0, 552.0, 383.0, 230.0, 154.0, 125.0, 97.0, 65.0, 44.0, 29.0, 18.0, 31.0, 16.0, 8.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.93359375, -2.839752197265625, -2.74591064453125, -2.652069091796875, -2.5582275390625, -2.464385986328125, -2.37054443359375, -2.276702880859375, -2.182861328125, -2.089019775390625, -1.99517822265625, -1.901336669921875, -1.8074951171875, -1.713653564453125, -1.61981201171875, -1.525970458984375, -1.43212890625, -1.338287353515625, -1.24444580078125, -1.150604248046875, -1.0567626953125, -0.962921142578125, -0.86907958984375, -0.775238037109375, -0.681396484375, -0.587554931640625, -0.49371337890625, -0.399871826171875, -0.3060302734375, -0.212188720703125, -0.11834716796875, -0.024505615234375, 0.0693359375, 0.163177490234375, 0.25701904296875, 0.350860595703125, 0.4447021484375, 0.538543701171875, 0.63238525390625, 0.726226806640625, 0.820068359375, 0.913909912109375, 1.00775146484375, 1.101593017578125, 1.1954345703125, 1.289276123046875, 1.38311767578125, 1.476959228515625, 1.57080078125, 1.664642333984375, 1.75848388671875, 1.852325439453125, 1.9461669921875, 2.040008544921875, 2.13385009765625, 2.227691650390625, 2.321533203125, 2.415374755859375, 2.50921630859375, 2.603057861328125, 2.6968994140625, 2.790740966796875, 2.88458251953125, 2.978424072265625, 3.072265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 7.0, 5.0, 10.0, 7.0, 25.0, 27.0, 65.0, 136.0, 465.0, 92.0, 40.0, 27.0, 21.0, 10.0, 11.0, 5.0, 4.0, 6.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3097381591796875, -1.264984130859375, -1.2202301025390625, -1.17547607421875, -1.1307220458984375, -1.085968017578125, -1.0412139892578125, -0.9964599609375, -0.9517059326171875, -0.906951904296875, -0.8621978759765625, -0.81744384765625, -0.7726898193359375, -0.727935791015625, -0.6831817626953125, -0.638427734375, -0.5936737060546875, -0.548919677734375, -0.5041656494140625, -0.45941162109375, -0.4146575927734375, -0.369903564453125, -0.3251495361328125, -0.2803955078125, -0.2356414794921875, -0.190887451171875, -0.1461334228515625, -0.10137939453125, -0.0566253662109375, -0.011871337890625, 0.0328826904296875, 0.07763671875, 0.1223907470703125, 0.167144775390625, 0.2118988037109375, 0.25665283203125, 0.3014068603515625, 0.346160888671875, 0.3909149169921875, 0.4356689453125, 0.4804229736328125, 0.525177001953125, 0.5699310302734375, 0.61468505859375, 0.6594390869140625, 0.704193115234375, 0.7489471435546875, 0.793701171875, 0.8384552001953125, 0.883209228515625, 0.9279632568359375, 0.97271728515625, 1.0174713134765625, 1.062225341796875, 1.1069793701171875, 1.1517333984375, 1.1964874267578125, 1.241241455078125, 1.2859954833984375, 1.33074951171875, 1.3755035400390625, 1.420257568359375, 1.4650115966796875, 1.509765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 8.0, 4.0, 7.0, 13.0, 14.0, 22.0, 19.0, 23.0, 45.0, 69.0, 143.0, 1006.0, 37661.0, 1001599.0, 7176.0, 375.0, 112.0, 59.0, 36.0, 31.0, 24.0, 16.0, 15.0, 12.0, 14.0, 12.0, 6.0, 2.0, 0.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.140625, -20.465087890625, -19.78955078125, -19.114013671875, -18.4384765625, -17.762939453125, -17.08740234375, -16.411865234375, -15.736328125, -15.060791015625, -14.38525390625, -13.709716796875, -13.0341796875, -12.358642578125, -11.68310546875, -11.007568359375, -10.33203125, -9.656494140625, -8.98095703125, -8.305419921875, -7.6298828125, -6.954345703125, -6.27880859375, -5.603271484375, -4.927734375, -4.252197265625, -3.57666015625, -2.901123046875, -2.2255859375, -1.550048828125, -0.87451171875, -0.198974609375, 0.4765625, 1.152099609375, 1.82763671875, 2.503173828125, 3.1787109375, 3.854248046875, 4.52978515625, 5.205322265625, 5.880859375, 6.556396484375, 7.23193359375, 7.907470703125, 8.5830078125, 9.258544921875, 9.93408203125, 10.609619140625, 11.28515625, 11.960693359375, 12.63623046875, 13.311767578125, 13.9873046875, 14.662841796875, 15.33837890625, 16.013916015625, 16.689453125, 17.364990234375, 18.04052734375, 18.716064453125, 19.3916015625, 20.067138671875, 20.74267578125, 21.418212890625, 22.09375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 15.0, 26.0, 32.0, 43.0, 88.0, 107.0, 110.0, 140.0, 114.0, 97.0, 62.0, 58.0, 29.0, 22.0, 13.0, 12.0, 10.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.794527530670166, -1.7396577596664429, -1.6847881078720093, -1.6299183368682861, -1.5750486850738525, -1.5201789140701294, -1.4653091430664062, -1.4104394912719727, -1.355569839477539, -1.300700068473816, -1.2458304166793823, -1.1909606456756592, -1.1360909938812256, -1.0812212228775024, -1.0263514518737793, -0.9714818000793457, -0.9166120290756226, -0.8617423176765442, -0.8068726062774658, -0.7520028352737427, -0.6971331834793091, -0.6422634124755859, -0.5873937010765076, -0.5325239896774292, -0.47765427827835083, -0.42278456687927246, -0.3679148554801941, -0.31304511427879333, -0.25817540287971497, -0.2033056914806366, -0.14843595027923584, -0.09356623888015747, -0.0386965274810791, 0.016173191368579865, 0.07104291021823883, 0.1259126365184784, 0.18078234791755676, 0.23565205931663513, 0.2905218005180359, 0.34539151191711426, 0.4002612233161926, 0.455130934715271, 0.5100006461143494, 0.5648703575134277, 0.6197401285171509, 0.6746097803115845, 0.7294795513153076, 0.784349262714386, 0.8392189741134644, 0.8940886855125427, 0.9489583969116211, 1.0038281679153442, 1.0586978197097778, 1.113567590713501, 1.1684372425079346, 1.2233070135116577, 1.2781767845153809, 1.333046555519104, 1.3879162073135376, 1.4427859783172607, 1.4976556301116943, 1.5525254011154175, 1.6073951721191406, 1.6622648239135742, 1.7171344757080078]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 9.0, 8.0, 10.0, 10.0, 9.0, 13.0, 20.0, 17.0, 20.0, 29.0, 28.0, 39.0, 32.0, 30.0, 29.0, 39.0, 53.0, 48.0, 41.0, 54.0, 50.0, 52.0, 33.0, 42.0, 36.0, 38.0, 29.0, 23.0, 19.0, 24.0, 24.0, 17.0, 14.0, 7.0, 16.0, 4.0, 6.0, 9.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3937840461730957, -1.3491837978363037, -1.3045835494995117, -1.2599833011627197, -1.2153829336166382, -1.1707826852798462, -1.1261824369430542, -1.0815821886062622, -1.0369818210601807, -0.9923815727233887, -0.9477812647819519, -0.9031810164451599, -0.8585807085037231, -0.8139804601669312, -0.7693802118301392, -0.7247799634933472, -0.6801797151565552, -0.6355794668197632, -0.5909791588783264, -0.5463789105415344, -0.5017786026000977, -0.45717835426330566, -0.41257810592651367, -0.3679778277873993, -0.3233775496482849, -0.27877727150917053, -0.23417700827121735, -0.18957674503326416, -0.14497646689414978, -0.1003761887550354, -0.05577594041824341, -0.011175662279129028, 0.03342461585998535, 0.07802488654851913, 0.12262515723705292, 0.1672254204750061, 0.21182569861412048, 0.25642597675323486, 0.30102622509002686, 0.34562650322914124, 0.3902267813682556, 0.43482705950737, 0.4794273376464844, 0.5240275859832764, 0.5686278343200684, 0.6132281422615051, 0.6578283905982971, 0.7024286985397339, 0.7470289468765259, 0.7916291952133179, 0.8362295031547546, 0.8808297514915466, 0.9254300594329834, 0.9700303077697754, 1.0146305561065674, 1.0592308044433594, 1.1038310527801514, 1.1484313011169434, 1.1930315494537354, 1.2376317977905273, 1.2822321653366089, 1.3268324136734009, 1.3714326620101929, 1.4160329103469849, 1.4606332778930664]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 20.0, 12.0, 23.0, 22.0, 29.0, 33.0, 42.0, 49.0, 41.0, 57.0, 59.0, 65.0, 55.0, 58.0, 64.0, 48.0, 45.0, 49.0, 57.0, 31.0, 26.0, 28.0, 16.0, 20.0, 17.0, 10.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.049163818359375, -2.95574951171875, -2.862335205078125, -2.7689208984375, -2.675506591796875, -2.58209228515625, -2.488677978515625, -2.395263671875, -2.301849365234375, -2.20843505859375, -2.115020751953125, -2.0216064453125, -1.928192138671875, -1.83477783203125, -1.741363525390625, -1.64794921875, -1.554534912109375, -1.46112060546875, -1.367706298828125, -1.2742919921875, -1.180877685546875, -1.08746337890625, -0.994049072265625, -0.900634765625, -0.807220458984375, -0.71380615234375, -0.620391845703125, -0.5269775390625, -0.433563232421875, -0.34014892578125, -0.246734619140625, -0.1533203125, -0.059906005859375, 0.03350830078125, 0.126922607421875, 0.2203369140625, 0.313751220703125, 0.40716552734375, 0.500579833984375, 0.593994140625, 0.687408447265625, 0.78082275390625, 0.874237060546875, 0.9676513671875, 1.061065673828125, 1.15447998046875, 1.247894287109375, 1.34130859375, 1.434722900390625, 1.52813720703125, 1.621551513671875, 1.7149658203125, 1.808380126953125, 1.90179443359375, 1.995208740234375, 2.088623046875, 2.182037353515625, 2.27545166015625, 2.368865966796875, 2.4622802734375, 2.555694580078125, 2.64910888671875, 2.742523193359375, 2.8359375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 9.0, 9.0, 9.0, 12.0, 27.0, 28.0, 46.0, 57.0, 94.0, 146.0, 195.0, 353.0, 565.0, 1078.0, 1742.0, 3109.0, 5944.0, 11460.0, 22577.0, 46262.0, 94208.0, 179205.0, 263147.0, 201468.0, 108034.0, 53643.0, 26563.0, 13329.0, 6660.0, 3592.0, 2059.0, 1147.0, 678.0, 391.0, 250.0, 152.0, 92.0, 66.0, 51.0, 25.0, 22.0, 14.0, 6.0, 12.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.69140625, -4.54296875, -4.39453125, -4.24609375, -4.09765625, -3.94921875, -3.80078125, -3.65234375, -3.50390625, -3.35546875, -3.20703125, -3.05859375, -2.91015625, -2.76171875, -2.61328125, -2.46484375, -2.31640625, -2.16796875, -2.01953125, -1.87109375, -1.72265625, -1.57421875, -1.42578125, -1.27734375, -1.12890625, -0.98046875, -0.83203125, -0.68359375, -0.53515625, -0.38671875, -0.23828125, -0.08984375, 0.05859375, 0.20703125, 0.35546875, 0.50390625, 0.65234375, 0.80078125, 0.94921875, 1.09765625, 1.24609375, 1.39453125, 1.54296875, 1.69140625, 1.83984375, 1.98828125, 2.13671875, 2.28515625, 2.43359375, 2.58203125, 2.73046875, 2.87890625, 3.02734375, 3.17578125, 3.32421875, 3.47265625, 3.62109375, 3.76953125, 3.91796875, 4.06640625, 4.21484375, 4.36328125, 4.51171875, 4.66015625, 4.80859375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 8.0, 12.0, 16.0, 18.0, 15.0, 26.0, 25.0, 38.0, 31.0, 53.0, 77.0, 73.0, 125.0, 136.0, 184.0, 1300.0, 198.0, 137.0, 106.0, 83.0, 65.0, 48.0, 37.0, 28.0, 25.0, 25.0, 27.0, 17.0, 23.0, 13.0, 11.0, 7.0, 11.0, 7.0, 4.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.796875, -8.5343017578125, -8.271728515625, -8.0091552734375, -7.74658203125, -7.4840087890625, -7.221435546875, -6.9588623046875, -6.6962890625, -6.4337158203125, -6.171142578125, -5.9085693359375, -5.64599609375, -5.3834228515625, -5.120849609375, -4.8582763671875, -4.595703125, -4.3331298828125, -4.070556640625, -3.8079833984375, -3.54541015625, -3.2828369140625, -3.020263671875, -2.7576904296875, -2.4951171875, -2.2325439453125, -1.969970703125, -1.7073974609375, -1.44482421875, -1.1822509765625, -0.919677734375, -0.6571044921875, -0.39453125, -0.1319580078125, 0.130615234375, 0.3931884765625, 0.65576171875, 0.9183349609375, 1.180908203125, 1.4434814453125, 1.7060546875, 1.9686279296875, 2.231201171875, 2.4937744140625, 2.75634765625, 3.0189208984375, 3.281494140625, 3.5440673828125, 3.806640625, 4.0692138671875, 4.331787109375, 4.5943603515625, 4.85693359375, 5.1195068359375, 5.382080078125, 5.6446533203125, 5.9072265625, 6.1697998046875, 6.432373046875, 6.6949462890625, 6.95751953125, 7.2200927734375, 7.482666015625, 7.7452392578125, 8.0078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 13.0, 8.0, 11.0, 16.0, 22.0, 15.0, 25.0, 12.0, 32.0, 32.0, 72.0, 71.0, 157.0, 635.0, 5180.0, 168809.0, 2834157.0, 131087.0, 4277.0, 555.0, 158.0, 96.0, 59.0, 33.0, 29.0, 20.0, 20.0, 17.0, 17.0, 18.0, 6.0, 4.0, 2.0, 7.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.14208984375, -25.1904296875, -24.23876953125, -23.287109375, -22.33544921875, -21.3837890625, -20.43212890625, -19.48046875, -18.52880859375, -17.5771484375, -16.62548828125, -15.673828125, -14.72216796875, -13.7705078125, -12.81884765625, -11.8671875, -10.91552734375, -9.9638671875, -9.01220703125, -8.060546875, -7.10888671875, -6.1572265625, -5.20556640625, -4.25390625, -3.30224609375, -2.3505859375, -1.39892578125, -0.447265625, 0.50439453125, 1.4560546875, 2.40771484375, 3.359375, 4.31103515625, 5.2626953125, 6.21435546875, 7.166015625, 8.11767578125, 9.0693359375, 10.02099609375, 10.97265625, 11.92431640625, 12.8759765625, 13.82763671875, 14.779296875, 15.73095703125, 16.6826171875, 17.63427734375, 18.5859375, 19.53759765625, 20.4892578125, 21.44091796875, 22.392578125, 23.34423828125, 24.2958984375, 25.24755859375, 26.19921875, 27.15087890625, 28.1025390625, 29.05419921875, 30.005859375, 30.95751953125, 31.9091796875, 32.86083984375, 33.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 23.0, 119.0, 259.0, 356.0, 171.0, 63.0, 15.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.67247772216797, -87.32238006591797, -84.9722900390625, -82.6221923828125, -80.27210235595703, -77.92200469970703, -75.57191467285156, -73.22181701660156, -70.87171936035156, -68.52162170410156, -66.1715316772461, -63.821434020996094, -61.47134017944336, -59.121246337890625, -56.77115249633789, -54.421058654785156, -52.07096481323242, -49.72087097167969, -47.37077713012695, -45.02068328857422, -42.67058563232422, -40.320491790771484, -37.97039794921875, -35.62030029296875, -33.27021026611328, -30.920116424560547, -28.57002067565918, -26.219926834106445, -23.869831085205078, -21.519737243652344, -19.16964340209961, -16.819547653198242, -14.46945571899414, -12.11936092376709, -9.769266128540039, -7.419172286987305, -5.069077491760254, -2.718982696533203, -0.36888885498046875, 1.9812068939208984, 4.331300735473633, 6.681395530700684, 9.031490325927734, 11.381584167480469, 13.73167896270752, 16.08177375793457, 18.431867599487305, 20.781963348388672, 23.132057189941406, 25.48215103149414, 27.832246780395508, 30.182340621948242, 32.53243637084961, 34.882530212402344, 37.23262405395508, 39.58271789550781, 41.93281555175781, 44.28290939331055, 46.63300323486328, 48.98310089111328, 51.333194732666016, 53.68328857421875, 56.033382415771484, 58.38347625732422, 60.73357009887695]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 12.0, 10.0, 10.0, 13.0, 23.0, 18.0, 31.0, 19.0, 36.0, 32.0, 38.0, 38.0, 55.0, 46.0, 49.0, 47.0, 43.0, 48.0, 43.0, 54.0, 30.0, 44.0, 32.0, 39.0, 29.0, 37.0, 16.0, 16.0, 19.0, 15.0, 11.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.911903381347656, -30.872209548950195, -29.832515716552734, -28.792821884155273, -27.753128051757812, -26.71343421936035, -25.67374038696289, -24.63404655456543, -23.59435272216797, -22.554658889770508, -21.514965057373047, -20.475271224975586, -19.435577392578125, -18.395883560180664, -17.356189727783203, -16.316495895385742, -15.276802062988281, -14.23710823059082, -13.19741439819336, -12.157720565795898, -11.118026733398438, -10.078332901000977, -9.038639068603516, -7.998945236206055, -6.959251403808594, -5.919557571411133, -4.879863739013672, -3.840169906616211, -2.80047607421875, -1.760782241821289, -0.7210884094238281, 0.3186054229736328, 1.3582992553710938, 2.3979930877685547, 3.4376869201660156, 4.477380752563477, 5.5170745849609375, 6.556768417358398, 7.596462249755859, 8.63615608215332, 9.675849914550781, 10.715543746948242, 11.755237579345703, 12.794931411743164, 13.834625244140625, 14.874319076538086, 15.914012908935547, 16.953706741333008, 17.99340057373047, 19.03309440612793, 20.07278823852539, 21.11248207092285, 22.152175903320312, 23.191869735717773, 24.231563568115234, 25.271257400512695, 26.310951232910156, 27.350645065307617, 28.390338897705078, 29.43003273010254, 30.4697265625, 31.50942039489746, 32.54911422729492, 33.58880615234375, 34.628501892089844]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 10.0, 11.0, 11.0, 21.0, 25.0, 32.0, 45.0, 38.0, 32.0, 46.0, 55.0, 51.0, 56.0, 63.0, 66.0, 62.0, 56.0, 51.0, 48.0, 34.0, 39.0, 29.0, 31.0, 14.0, 19.0, 11.0, 10.0, 12.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.363525390625, -3.26025390625, -3.156982421875, -3.0537109375, -2.950439453125, -2.84716796875, -2.743896484375, -2.640625, -2.537353515625, -2.43408203125, -2.330810546875, -2.2275390625, -2.124267578125, -2.02099609375, -1.917724609375, -1.814453125, -1.711181640625, -1.60791015625, -1.504638671875, -1.4013671875, -1.298095703125, -1.19482421875, -1.091552734375, -0.98828125, -0.885009765625, -0.78173828125, -0.678466796875, -0.5751953125, -0.471923828125, -0.36865234375, -0.265380859375, -0.162109375, -0.058837890625, 0.04443359375, 0.147705078125, 0.2509765625, 0.354248046875, 0.45751953125, 0.560791015625, 0.6640625, 0.767333984375, 0.87060546875, 0.973876953125, 1.0771484375, 1.180419921875, 1.28369140625, 1.386962890625, 1.490234375, 1.593505859375, 1.69677734375, 1.800048828125, 1.9033203125, 2.006591796875, 2.10986328125, 2.213134765625, 2.31640625, 2.419677734375, 2.52294921875, 2.626220703125, 2.7294921875, 2.832763671875, 2.93603515625, 3.039306640625, 3.142578125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 14.0, 22.0, 39.0, 57.0, 79.0, 126.0, 224.0, 407.0, 848.0, 2481.0, 8497.0, 41327.0, 360125.0, 3523367.0, 217913.0, 29869.0, 6150.0, 1579.0, 579.0, 277.0, 116.0, 79.0, 51.0, 20.0, 9.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.515625, -18.007080078125, -17.49853515625, -16.989990234375, -16.4814453125, -15.972900390625, -15.46435546875, -14.955810546875, -14.447265625, -13.938720703125, -13.43017578125, -12.921630859375, -12.4130859375, -11.904541015625, -11.39599609375, -10.887451171875, -10.37890625, -9.870361328125, -9.36181640625, -8.853271484375, -8.3447265625, -7.836181640625, -7.32763671875, -6.819091796875, -6.310546875, -5.802001953125, -5.29345703125, -4.784912109375, -4.2763671875, -3.767822265625, -3.25927734375, -2.750732421875, -2.2421875, -1.733642578125, -1.22509765625, -0.716552734375, -0.2080078125, 0.300537109375, 0.80908203125, 1.317626953125, 1.826171875, 2.334716796875, 2.84326171875, 3.351806640625, 3.8603515625, 4.368896484375, 4.87744140625, 5.385986328125, 5.89453125, 6.403076171875, 6.91162109375, 7.420166015625, 7.9287109375, 8.437255859375, 8.94580078125, 9.454345703125, 9.962890625, 10.471435546875, 10.97998046875, 11.488525390625, 11.9970703125, 12.505615234375, 13.01416015625, 13.522705078125, 14.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 13.0, 10.0, 27.0, 30.0, 51.0, 69.0, 99.0, 157.0, 218.0, 346.0, 515.0, 790.0, 588.0, 397.0, 228.0, 168.0, 104.0, 96.0, 48.0, 45.0, 22.0, 15.0, 13.0, 4.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.3968505859375, -11.035888671875, -10.6749267578125, -10.31396484375, -9.9530029296875, -9.592041015625, -9.2310791015625, -8.8701171875, -8.5091552734375, -8.148193359375, -7.7872314453125, -7.42626953125, -7.0653076171875, -6.704345703125, -6.3433837890625, -5.982421875, -5.6214599609375, -5.260498046875, -4.8995361328125, -4.53857421875, -4.1776123046875, -3.816650390625, -3.4556884765625, -3.0947265625, -2.7337646484375, -2.372802734375, -2.0118408203125, -1.65087890625, -1.2899169921875, -0.928955078125, -0.5679931640625, -0.20703125, 0.1539306640625, 0.514892578125, 0.8758544921875, 1.23681640625, 1.5977783203125, 1.958740234375, 2.3197021484375, 2.6806640625, 3.0416259765625, 3.402587890625, 3.7635498046875, 4.12451171875, 4.4854736328125, 4.846435546875, 5.2073974609375, 5.568359375, 5.9293212890625, 6.290283203125, 6.6512451171875, 7.01220703125, 7.3731689453125, 7.734130859375, 8.0950927734375, 8.4560546875, 8.8170166015625, 9.177978515625, 9.5389404296875, 9.89990234375, 10.2608642578125, 10.621826171875, 10.9827880859375, 11.34375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 13.0, 14.0, 19.0, 23.0, 38.0, 62.0, 59.0, 136.0, 229.0, 362.0, 729.0, 1406.0, 2931.0, 6920.0, 18481.0, 55811.0, 213457.0, 1425724.0, 2076714.0, 284205.0, 69689.0, 21922.0, 8389.0, 3396.0, 1653.0, 826.0, 420.0, 232.0, 162.0, 80.0, 65.0, 43.0, 18.0, 14.0, 14.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.0694580078125, -13.568603515625, -13.0677490234375, -12.56689453125, -12.0660400390625, -11.565185546875, -11.0643310546875, -10.5634765625, -10.0626220703125, -9.561767578125, -9.0609130859375, -8.56005859375, -8.0592041015625, -7.558349609375, -7.0574951171875, -6.556640625, -6.0557861328125, -5.554931640625, -5.0540771484375, -4.55322265625, -4.0523681640625, -3.551513671875, -3.0506591796875, -2.5498046875, -2.0489501953125, -1.548095703125, -1.0472412109375, -0.54638671875, -0.0455322265625, 0.455322265625, 0.9561767578125, 1.45703125, 1.9578857421875, 2.458740234375, 2.9595947265625, 3.46044921875, 3.9613037109375, 4.462158203125, 4.9630126953125, 5.4638671875, 5.9647216796875, 6.465576171875, 6.9664306640625, 7.46728515625, 7.9681396484375, 8.468994140625, 8.9698486328125, 9.470703125, 9.9715576171875, 10.472412109375, 10.9732666015625, 11.47412109375, 11.9749755859375, 12.475830078125, 12.9766845703125, 13.4775390625, 13.9783935546875, 14.479248046875, 14.9801025390625, 15.48095703125, 15.9818115234375, 16.482666015625, 16.9835205078125, 17.484375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 13.0, 28.0, 61.0, 144.0, 211.0, 242.0, 168.0, 81.0, 39.0, 13.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.35580825805664, -60.49708938598633, -57.63837432861328, -54.77965545654297, -51.92094039916992, -49.06222152709961, -46.20350646972656, -43.34478759765625, -40.48606872558594, -37.627349853515625, -34.76863479614258, -31.909915924072266, -29.05120086669922, -26.192481994628906, -23.333765029907227, -20.475048065185547, -17.6163330078125, -14.75761604309082, -11.89889907836914, -9.040181159973145, -6.181464195251465, -3.322747230529785, -0.46402931213378906, 2.3946876525878906, 5.25340461730957, 8.11212158203125, 10.97083854675293, 13.829556465148926, 16.688274383544922, 19.54698944091797, 22.40570831298828, 25.26442527770996, 28.123146057128906, 30.981863021850586, 33.840579986572266, 36.69929885864258, 39.558013916015625, 42.41673278808594, 45.27545166015625, 48.1341667175293, 50.992881774902344, 53.851600646972656, 56.7103157043457, 59.569034576416016, 62.42774963378906, 65.28646850585938, 68.14518737792969, 71.00390625, 73.86262512207031, 76.72134399414062, 79.58006286621094, 82.43877410888672, 85.29749298095703, 88.15621185302734, 91.01493072509766, 93.87364196777344, 96.73236083984375, 99.59107971191406, 102.44979858398438, 105.30850982666016, 108.16722869873047, 111.02594757080078, 113.8846664428711, 116.74337768554688, 119.60209655761719]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 3.0, 5.0, 15.0, 12.0, 17.0, 16.0, 16.0, 30.0, 28.0, 26.0, 30.0, 35.0, 35.0, 36.0, 36.0, 51.0, 47.0, 41.0, 49.0, 44.0, 29.0, 45.0, 38.0, 44.0, 43.0, 39.0, 23.0, 24.0, 31.0, 13.0, 19.0, 17.0, 17.0, 12.0, 5.0, 9.0, 4.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-33.95026779174805, -32.974952697753906, -31.9996395111084, -31.02432632446289, -30.04901123046875, -29.073698043823242, -28.098384857177734, -27.123069763183594, -26.147754669189453, -25.172441482543945, -24.197126388549805, -23.221813201904297, -22.246498107910156, -21.27118492126465, -20.29587173461914, -19.320556640625, -18.345243453979492, -17.369930267333984, -16.394615173339844, -15.419301986694336, -14.443986892700195, -13.468673706054688, -12.493359565734863, -11.518045425415039, -10.542731285095215, -9.56741714477539, -8.592103004455566, -7.6167893409729, -6.641475200653076, -5.666161060333252, -4.690847396850586, -3.7155332565307617, -2.7402210235595703, -1.7649070024490356, -0.789592981338501, 0.18572092056274414, 1.1610350608825684, 2.1363492012023926, 3.1116628646850586, 4.086977005004883, 5.062291145324707, 6.037605285644531, 7.0129194259643555, 7.9882330894470215, 8.963546752929688, 9.938861846923828, 10.914175033569336, 11.88948917388916, 12.864803314208984, 13.840117454528809, 14.815431594848633, 15.79074478149414, 16.76605987548828, 17.74137306213379, 18.716686248779297, 19.692001342773438, 20.667316436767578, 21.642629623413086, 22.617944717407227, 23.593257904052734, 24.568572998046875, 25.543886184692383, 26.51919937133789, 27.49451446533203, 28.46982765197754]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 18.0, 11.0, 18.0, 20.0, 26.0, 25.0, 29.0, 43.0, 33.0, 43.0, 43.0, 52.0, 68.0, 63.0, 51.0, 60.0, 36.0, 48.0, 34.0, 46.0, 39.0, 30.0, 25.0, 22.0, 17.0, 23.0, 17.0, 13.0, 7.0, 4.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.099609375, -3.0047607421875, -2.909912109375, -2.8150634765625, -2.72021484375, -2.6253662109375, -2.530517578125, -2.4356689453125, -2.3408203125, -2.2459716796875, -2.151123046875, -2.0562744140625, -1.96142578125, -1.8665771484375, -1.771728515625, -1.6768798828125, -1.58203125, -1.4871826171875, -1.392333984375, -1.2974853515625, -1.20263671875, -1.1077880859375, -1.012939453125, -0.9180908203125, -0.8232421875, -0.7283935546875, -0.633544921875, -0.5386962890625, -0.44384765625, -0.3489990234375, -0.254150390625, -0.1593017578125, -0.064453125, 0.0303955078125, 0.125244140625, 0.2200927734375, 0.31494140625, 0.4097900390625, 0.504638671875, 0.5994873046875, 0.6943359375, 0.7891845703125, 0.884033203125, 0.9788818359375, 1.07373046875, 1.1685791015625, 1.263427734375, 1.3582763671875, 1.453125, 1.5479736328125, 1.642822265625, 1.7376708984375, 1.83251953125, 1.9273681640625, 2.022216796875, 2.1170654296875, 2.2119140625, 2.3067626953125, 2.401611328125, 2.4964599609375, 2.59130859375, 2.6861572265625, 2.781005859375, 2.8758544921875, 2.970703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 32.0, 57.0, 74.0, 128.0, 197.0, 413.0, 717.0, 1265.0, 2224.0, 4202.0, 8247.0, 18704.0, 63547.0, 623958.0, 258419.0, 38580.0, 13794.0, 6439.0, 3430.0, 1877.0, 968.0, 534.0, 295.0, 156.0, 106.0, 72.0, 31.0, 21.0, 14.0, 15.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.279052734375, -8.93310546875, -8.587158203125, -8.2412109375, -7.895263671875, -7.54931640625, -7.203369140625, -6.857421875, -6.511474609375, -6.16552734375, -5.819580078125, -5.4736328125, -5.127685546875, -4.78173828125, -4.435791015625, -4.08984375, -3.743896484375, -3.39794921875, -3.052001953125, -2.7060546875, -2.360107421875, -2.01416015625, -1.668212890625, -1.322265625, -0.976318359375, -0.63037109375, -0.284423828125, 0.0615234375, 0.407470703125, 0.75341796875, 1.099365234375, 1.4453125, 1.791259765625, 2.13720703125, 2.483154296875, 2.8291015625, 3.175048828125, 3.52099609375, 3.866943359375, 4.212890625, 4.558837890625, 4.90478515625, 5.250732421875, 5.5966796875, 5.942626953125, 6.28857421875, 6.634521484375, 6.98046875, 7.326416015625, 7.67236328125, 8.018310546875, 8.3642578125, 8.710205078125, 9.05615234375, 9.402099609375, 9.748046875, 10.093994140625, 10.43994140625, 10.785888671875, 11.1318359375, 11.477783203125, 11.82373046875, 12.169677734375, 12.515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 10.0, 9.0, 9.0, 22.0, 14.0, 13.0, 19.0, 26.0, 26.0, 27.0, 31.0, 33.0, 29.0, 35.0, 43.0, 29.0, 48.0, 44.0, 1057.0, 36.0, 49.0, 40.0, 36.0, 41.0, 32.0, 37.0, 22.0, 39.0, 17.0, 18.0, 19.0, 19.0, 18.0, 11.0, 12.0, 8.0, 7.0, 8.0, 5.0, 1.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9697265625, -1.8999786376953125, -1.830230712890625, -1.7604827880859375, -1.69073486328125, -1.6209869384765625, -1.551239013671875, -1.4814910888671875, -1.4117431640625, -1.3419952392578125, -1.272247314453125, -1.2024993896484375, -1.13275146484375, -1.0630035400390625, -0.993255615234375, -0.9235076904296875, -0.853759765625, -0.7840118408203125, -0.714263916015625, -0.6445159912109375, -0.57476806640625, -0.5050201416015625, -0.435272216796875, -0.3655242919921875, -0.2957763671875, -0.2260284423828125, -0.156280517578125, -0.0865325927734375, -0.01678466796875, 0.0529632568359375, 0.122711181640625, 0.1924591064453125, 0.26220703125, 0.3319549560546875, 0.401702880859375, 0.4714508056640625, 0.54119873046875, 0.6109466552734375, 0.680694580078125, 0.7504425048828125, 0.8201904296875, 0.8899383544921875, 0.959686279296875, 1.0294342041015625, 1.09918212890625, 1.1689300537109375, 1.238677978515625, 1.3084259033203125, 1.378173828125, 1.4479217529296875, 1.517669677734375, 1.5874176025390625, 1.65716552734375, 1.7269134521484375, 1.796661376953125, 1.8664093017578125, 1.9361572265625, 2.0059051513671875, 2.075653076171875, 2.1454010009765625, 2.21514892578125, 2.2848968505859375, 2.354644775390625, 2.4243927001953125, 2.494140625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 11.0, 6.0, 20.0, 24.0, 32.0, 55.0, 58.0, 95.0, 127.0, 191.0, 285.0, 380.0, 527.0, 782.0, 1154.0, 1702.0, 2716.0, 4268.0, 7634.0, 14969.0, 35009.0, 123499.0, 1402762.0, 384011.0, 66258.0, 23636.0, 10983.0, 5867.0, 3451.0, 2119.0, 1441.0, 905.0, 646.0, 407.0, 295.0, 210.0, 139.0, 113.0, 89.0, 72.0, 56.0, 33.0, 26.0, 14.0, 16.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.42578125, -4.290771484375, -4.15576171875, -4.020751953125, -3.8857421875, -3.750732421875, -3.61572265625, -3.480712890625, -3.345703125, -3.210693359375, -3.07568359375, -2.940673828125, -2.8056640625, -2.670654296875, -2.53564453125, -2.400634765625, -2.265625, -2.130615234375, -1.99560546875, -1.860595703125, -1.7255859375, -1.590576171875, -1.45556640625, -1.320556640625, -1.185546875, -1.050537109375, -0.91552734375, -0.780517578125, -0.6455078125, -0.510498046875, -0.37548828125, -0.240478515625, -0.10546875, 0.029541015625, 0.16455078125, 0.299560546875, 0.4345703125, 0.569580078125, 0.70458984375, 0.839599609375, 0.974609375, 1.109619140625, 1.24462890625, 1.379638671875, 1.5146484375, 1.649658203125, 1.78466796875, 1.919677734375, 2.0546875, 2.189697265625, 2.32470703125, 2.459716796875, 2.5947265625, 2.729736328125, 2.86474609375, 2.999755859375, 3.134765625, 3.269775390625, 3.40478515625, 3.539794921875, 3.6748046875, 3.809814453125, 3.94482421875, 4.079833984375, 4.21484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 7.0, 4.0, 4.0, 14.0, 16.0, 24.0, 38.0, 56.0, 181.0, 447.0, 81.0, 44.0, 30.0, 16.0, 14.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.383758544921875, -2.29290771484375, -2.202056884765625, -2.1112060546875, -2.020355224609375, -1.92950439453125, -1.838653564453125, -1.747802734375, -1.656951904296875, -1.56610107421875, -1.475250244140625, -1.3843994140625, -1.293548583984375, -1.20269775390625, -1.111846923828125, -1.02099609375, -0.930145263671875, -0.83929443359375, -0.748443603515625, -0.6575927734375, -0.566741943359375, -0.47589111328125, -0.385040283203125, -0.294189453125, -0.203338623046875, -0.11248779296875, -0.021636962890625, 0.0692138671875, 0.160064697265625, 0.25091552734375, 0.341766357421875, 0.4326171875, 0.523468017578125, 0.61431884765625, 0.705169677734375, 0.7960205078125, 0.886871337890625, 0.97772216796875, 1.068572998046875, 1.159423828125, 1.250274658203125, 1.34112548828125, 1.431976318359375, 1.5228271484375, 1.613677978515625, 1.70452880859375, 1.795379638671875, 1.88623046875, 1.977081298828125, 2.06793212890625, 2.158782958984375, 2.2496337890625, 2.340484619140625, 2.43133544921875, 2.522186279296875, 2.613037109375, 2.703887939453125, 2.79473876953125, 2.885589599609375, 2.9764404296875, 3.067291259765625, 3.15814208984375, 3.248992919921875, 3.33984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 0.0, 0.0, 4.0, 8.0, 7.0, 13.0, 17.0, 23.0, 48.0, 75.0, 116.0, 404.0, 5001.0, 1035705.0, 6368.0, 433.0, 112.0, 69.0, 49.0, 23.0, 20.0, 8.0, 9.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.6875, -42.2080078125, -40.728515625, -39.2490234375, -37.76953125, -36.2900390625, -34.810546875, -33.3310546875, -31.8515625, -30.3720703125, -28.892578125, -27.4130859375, -25.93359375, -24.4541015625, -22.974609375, -21.4951171875, -20.015625, -18.5361328125, -17.056640625, -15.5771484375, -14.09765625, -12.6181640625, -11.138671875, -9.6591796875, -8.1796875, -6.7001953125, -5.220703125, -3.7412109375, -2.26171875, -0.7822265625, 0.697265625, 2.1767578125, 3.65625, 5.1357421875, 6.615234375, 8.0947265625, 9.57421875, 11.0537109375, 12.533203125, 14.0126953125, 15.4921875, 16.9716796875, 18.451171875, 19.9306640625, 21.41015625, 22.8896484375, 24.369140625, 25.8486328125, 27.328125, 28.8076171875, 30.287109375, 31.7666015625, 33.24609375, 34.7255859375, 36.205078125, 37.6845703125, 39.1640625, 40.6435546875, 42.123046875, 43.6025390625, 45.08203125, 46.5615234375, 48.041015625, 49.5205078125, 51.0]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 18.0, 35.0, 191.0, 392.0, 271.0, 77.0, 22.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.16488265991211, -9.91533088684082, -9.665778160095215, -9.416226387023926, -9.16667366027832, -8.917121887207031, -8.667570114135742, -8.418017387390137, -8.168465614318848, -7.9189133644104, -7.669361114501953, -7.419809341430664, -7.170257091522217, -6.9207048416137695, -6.671152591705322, -6.421600341796875, -6.172048091888428, -5.9224958419799805, -5.672943592071533, -5.423391342163086, -5.173839569091797, -4.92428731918335, -4.674735069274902, -4.425182819366455, -4.175630569458008, -3.9260783195495605, -3.6765263080596924, -3.426974058151245, -3.177422046661377, -2.9278697967529297, -2.6783175468444824, -2.428765296936035, -2.179213523864746, -1.9296613931655884, -1.6801092624664307, -1.4305570125579834, -1.1810048818588257, -0.931452751159668, -0.6819005012512207, -0.432348370552063, -0.18279623985290527, 0.06675592064857483, 0.31630808115005493, 0.5658602714538574, 0.8154124021530151, 1.0649645328521729, 1.3145167827606201, 1.5640689134597778, 1.8136210441589355, 2.063173294067383, 2.312725305557251, 2.5622775554656982, 2.8118295669555664, 3.0613818168640137, 3.310934066772461, 3.560486316680908, 3.8100383281707764, 4.0595903396606445, 4.309142589569092, 4.558694839477539, 4.808247089385986, 5.057799339294434, 5.307351112365723, 5.55690336227417, 5.806455612182617]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 8.0, 9.0, 8.0, 12.0, 10.0, 18.0, 21.0, 24.0, 19.0, 18.0, 33.0, 29.0, 33.0, 41.0, 29.0, 44.0, 39.0, 38.0, 40.0, 38.0, 46.0, 35.0, 50.0, 37.0, 42.0, 37.0, 38.0, 34.0, 18.0, 24.0, 18.0, 19.0, 18.0, 14.0, 8.0, 11.0, 10.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5163404941558838, -1.465317726135254, -1.4142950773239136, -1.3632723093032837, -1.3122496604919434, -1.2612268924713135, -1.2102041244506836, -1.1591814756393433, -1.108158826828003, -1.057136058807373, -1.0061134099960327, -0.9550906419754028, -0.9040679931640625, -0.8530452251434326, -0.8020225167274475, -0.7509998083114624, -0.6999770402908325, -0.6489543318748474, -0.5979316234588623, -0.5469088554382324, -0.4958861768245697, -0.4448634684085846, -0.3938407301902771, -0.342818021774292, -0.2917953133583069, -0.24077260494232178, -0.18974988162517548, -0.13872715830802917, -0.08770444989204407, -0.03668174147605896, 0.014340996742248535, 0.06536370515823364, 0.11638641357421875, 0.16740912199020386, 0.21843184530735016, 0.26945456862449646, 0.32047727704048157, 0.3714999854564667, 0.42252272367477417, 0.4735454320907593, 0.5245681405067444, 0.5755908489227295, 0.6266135573387146, 0.6776362657546997, 0.7286590337753296, 0.7796816825866699, 0.8307044506072998, 0.8817271590232849, 0.93274986743927, 0.9837725758552551, 1.0347952842712402, 1.0858180522918701, 1.1368407011032104, 1.1878634691238403, 1.2388861179351807, 1.2899088859558105, 1.3409316539764404, 1.3919544219970703, 1.4429770708084106, 1.4939998388290405, 1.5450224876403809, 1.5960452556610107, 1.6470680236816406, 1.698090672492981, 1.7491133213043213]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 13.0, 8.0, 8.0, 9.0, 11.0, 15.0, 7.0, 21.0, 24.0, 19.0, 22.0, 28.0, 25.0, 36.0, 56.0, 39.0, 38.0, 44.0, 53.0, 50.0, 44.0, 52.0, 57.0, 39.0, 25.0, 40.0, 27.0, 31.0, 24.0, 16.0, 15.0, 18.0, 24.0, 14.0, 13.0, 10.0, 7.0, 2.0, 3.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.611328125, -2.5301513671875, -2.448974609375, -2.3677978515625, -2.28662109375, -2.2054443359375, -2.124267578125, -2.0430908203125, -1.9619140625, -1.8807373046875, -1.799560546875, -1.7183837890625, -1.63720703125, -1.5560302734375, -1.474853515625, -1.3936767578125, -1.3125, -1.2313232421875, -1.150146484375, -1.0689697265625, -0.98779296875, -0.9066162109375, -0.825439453125, -0.7442626953125, -0.6630859375, -0.5819091796875, -0.500732421875, -0.4195556640625, -0.33837890625, -0.2572021484375, -0.176025390625, -0.0948486328125, -0.013671875, 0.0675048828125, 0.148681640625, 0.2298583984375, 0.31103515625, 0.3922119140625, 0.473388671875, 0.5545654296875, 0.6357421875, 0.7169189453125, 0.798095703125, 0.8792724609375, 0.96044921875, 1.0416259765625, 1.122802734375, 1.2039794921875, 1.28515625, 1.3663330078125, 1.447509765625, 1.5286865234375, 1.60986328125, 1.6910400390625, 1.772216796875, 1.8533935546875, 1.9345703125, 2.0157470703125, 2.096923828125, 2.1781005859375, 2.25927734375, 2.3404541015625, 2.421630859375, 2.5028076171875, 2.583984375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 8.0, 7.0, 7.0, 9.0, 13.0, 15.0, 25.0, 43.0, 41.0, 76.0, 128.0, 198.0, 293.0, 493.0, 813.0, 1500.0, 2522.0, 4930.0, 9852.0, 22603.0, 56741.0, 153830.0, 350894.0, 270696.0, 102198.0, 38496.0, 15924.0, 7511.0, 3644.0, 2104.0, 1138.0, 690.0, 413.0, 246.0, 161.0, 91.0, 61.0, 48.0, 26.0, 19.0, 22.0, 12.0, 4.0, 6.0, 5.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.26953125, -5.11810302734375, -4.9666748046875, -4.81524658203125, -4.663818359375, -4.51239013671875, -4.3609619140625, -4.20953369140625, -4.05810546875, -3.90667724609375, -3.7552490234375, -3.60382080078125, -3.452392578125, -3.30096435546875, -3.1495361328125, -2.99810791015625, -2.8466796875, -2.69525146484375, -2.5438232421875, -2.39239501953125, -2.240966796875, -2.08953857421875, -1.9381103515625, -1.78668212890625, -1.63525390625, -1.48382568359375, -1.3323974609375, -1.18096923828125, -1.029541015625, -0.87811279296875, -0.7266845703125, -0.57525634765625, -0.423828125, -0.27239990234375, -0.1209716796875, 0.03045654296875, 0.181884765625, 0.33331298828125, 0.4847412109375, 0.63616943359375, 0.78759765625, 0.93902587890625, 1.0904541015625, 1.24188232421875, 1.393310546875, 1.54473876953125, 1.6961669921875, 1.84759521484375, 1.9990234375, 2.15045166015625, 2.3018798828125, 2.45330810546875, 2.604736328125, 2.75616455078125, 2.9075927734375, 3.05902099609375, 3.21044921875, 3.36187744140625, 3.5133056640625, 3.66473388671875, 3.816162109375, 3.96759033203125, 4.1190185546875, 4.27044677734375, 4.421875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 7.0, 14.0, 4.0, 9.0, 18.0, 14.0, 14.0, 16.0, 15.0, 30.0, 13.0, 18.0, 35.0, 27.0, 47.0, 75.0, 72.0, 89.0, 140.0, 205.0, 1250.0, 218.0, 157.0, 85.0, 69.0, 48.0, 40.0, 50.0, 41.0, 36.0, 28.0, 33.0, 22.0, 19.0, 10.0, 13.0, 13.0, 11.0, 6.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-8.875, -8.6102294921875, -8.345458984375, -8.0806884765625, -7.81591796875, -7.5511474609375, -7.286376953125, -7.0216064453125, -6.7568359375, -6.4920654296875, -6.227294921875, -5.9625244140625, -5.69775390625, -5.4329833984375, -5.168212890625, -4.9034423828125, -4.638671875, -4.3739013671875, -4.109130859375, -3.8443603515625, -3.57958984375, -3.3148193359375, -3.050048828125, -2.7852783203125, -2.5205078125, -2.2557373046875, -1.990966796875, -1.7261962890625, -1.46142578125, -1.1966552734375, -0.931884765625, -0.6671142578125, -0.40234375, -0.1375732421875, 0.127197265625, 0.3919677734375, 0.65673828125, 0.9215087890625, 1.186279296875, 1.4510498046875, 1.7158203125, 1.9805908203125, 2.245361328125, 2.5101318359375, 2.77490234375, 3.0396728515625, 3.304443359375, 3.5692138671875, 3.833984375, 4.0987548828125, 4.363525390625, 4.6282958984375, 4.89306640625, 5.1578369140625, 5.422607421875, 5.6873779296875, 5.9521484375, 6.2169189453125, 6.481689453125, 6.7464599609375, 7.01123046875, 7.2760009765625, 7.540771484375, 7.8055419921875, 8.0703125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 7.0, 11.0, 21.0, 20.0, 22.0, 32.0, 44.0, 81.0, 87.0, 158.0, 338.0, 649.0, 1432.0, 3834.0, 11772.0, 48233.0, 314328.0, 2022866.0, 634693.0, 80750.0, 17423.0, 5224.0, 1906.0, 778.0, 400.0, 179.0, 108.0, 68.0, 49.0, 39.0, 38.0, 31.0, 21.0, 10.0, 2.0, 15.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.098876953125, -10.73681640625, -10.374755859375, -10.0126953125, -9.650634765625, -9.28857421875, -8.926513671875, -8.564453125, -8.202392578125, -7.84033203125, -7.478271484375, -7.1162109375, -6.754150390625, -6.39208984375, -6.030029296875, -5.66796875, -5.305908203125, -4.94384765625, -4.581787109375, -4.2197265625, -3.857666015625, -3.49560546875, -3.133544921875, -2.771484375, -2.409423828125, -2.04736328125, -1.685302734375, -1.3232421875, -0.961181640625, -0.59912109375, -0.237060546875, 0.125, 0.487060546875, 0.84912109375, 1.211181640625, 1.5732421875, 1.935302734375, 2.29736328125, 2.659423828125, 3.021484375, 3.383544921875, 3.74560546875, 4.107666015625, 4.4697265625, 4.831787109375, 5.19384765625, 5.555908203125, 5.91796875, 6.280029296875, 6.64208984375, 7.004150390625, 7.3662109375, 7.728271484375, 8.09033203125, 8.452392578125, 8.814453125, 9.176513671875, 9.53857421875, 9.900634765625, 10.2626953125, 10.624755859375, 10.98681640625, 11.348876953125, 11.7109375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 53.0, 192.0, 372.0, 280.0, 80.0, 25.0, 9.0], "bins": [-131.65765380859375, -129.45008850097656, -127.24251556396484, -125.03495025634766, -122.82737731933594, -120.61981201171875, -118.41224670410156, -116.20467376708984, -113.99710845947266, -111.78954315185547, -109.58197021484375, -107.37440490722656, -105.16683197021484, -102.95926666259766, -100.75169372558594, -98.54412841796875, -96.33656311035156, -94.12899780273438, -91.92142486572266, -89.71385955810547, -87.50628662109375, -85.29872131347656, -83.09115600585938, -80.88358306884766, -78.67601013183594, -76.46844482421875, -74.26087188720703, -72.05330657958984, -69.84573364257812, -67.63816833496094, -65.43060302734375, -63.22303009033203, -61.01546096801758, -58.807891845703125, -56.60032272338867, -54.39275360107422, -52.18518829345703, -49.97761917114258, -47.770050048828125, -45.56248092651367, -43.35491180419922, -41.147342681884766, -38.93977355957031, -36.732208251953125, -34.52463912963867, -32.31707000732422, -30.109500885009766, -27.901931762695312, -25.694366455078125, -23.486797332763672, -21.27923011779785, -19.0716609954834, -16.864093780517578, -14.656524658203125, -12.448955535888672, -10.241387367248535, -8.033819198608398, -5.826251029968262, -3.618682384490967, -1.4111137390136719, 0.7964544296264648, 3.0040225982666016, 5.211591720581055, 7.419159889221191, 9.626728057861328]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 10.0, 6.0, 9.0, 16.0, 11.0, 12.0, 15.0, 13.0, 21.0, 22.0, 29.0, 33.0, 46.0, 35.0, 19.0, 47.0, 32.0, 33.0, 46.0, 40.0, 43.0, 51.0, 41.0, 30.0, 35.0, 42.0, 30.0, 26.0, 16.0, 33.0, 28.0, 22.0, 20.0, 10.0, 17.0, 13.0, 10.0, 10.0, 8.0, 5.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.84212875366211, -30.879226684570312, -29.91632652282715, -28.95342445373535, -27.990522384643555, -27.02762222290039, -26.064720153808594, -25.101818084716797, -24.138916015625, -23.176013946533203, -22.21311378479004, -21.250211715698242, -20.287309646606445, -19.32440948486328, -18.361507415771484, -17.398605346679688, -16.435705184936523, -15.472804069519043, -14.509902000427246, -13.547000885009766, -12.584098815917969, -11.621197700500488, -10.658296585083008, -9.695394515991211, -8.73249340057373, -7.769591808319092, -6.806690216064453, -5.843789100646973, -4.880887508392334, -3.9179859161376953, -2.955084800720215, -1.9921832084655762, -1.0292816162109375, -0.06638014316558838, 0.8965213298797607, 1.8594226837158203, 2.822324275970459, 3.7852258682250977, 4.748126983642578, 5.711028575897217, 6.6739301681518555, 7.636831760406494, 8.599733352661133, 9.562634468078613, 10.525535583496094, 11.48843765258789, 12.451338768005371, 13.414239883422852, 14.377141952514648, 15.340043067932129, 16.30294418334961, 17.265846252441406, 18.228748321533203, 19.191650390625, 20.154550552368164, 21.11745262145996, 22.080352783203125, 23.043254852294922, 24.006155014038086, 24.969057083129883, 25.93195915222168, 26.894859313964844, 27.85776138305664, 28.820663452148438, 29.783565521240234]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 7.0, 6.0, 12.0, 18.0, 18.0, 12.0, 24.0, 27.0, 24.0, 33.0, 39.0, 30.0, 45.0, 49.0, 42.0, 55.0, 50.0, 64.0, 42.0, 54.0, 42.0, 40.0, 44.0, 33.0, 32.0, 21.0, 21.0, 19.0, 19.0, 17.0, 11.0, 12.0, 11.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.680145263671875, -2.58685302734375, -2.493560791015625, -2.4002685546875, -2.306976318359375, -2.21368408203125, -2.120391845703125, -2.027099609375, -1.933807373046875, -1.84051513671875, -1.747222900390625, -1.6539306640625, -1.560638427734375, -1.46734619140625, -1.374053955078125, -1.28076171875, -1.187469482421875, -1.09417724609375, -1.000885009765625, -0.9075927734375, -0.814300537109375, -0.72100830078125, -0.627716064453125, -0.534423828125, -0.441131591796875, -0.34783935546875, -0.254547119140625, -0.1612548828125, -0.067962646484375, 0.02532958984375, 0.118621826171875, 0.2119140625, 0.305206298828125, 0.39849853515625, 0.491790771484375, 0.5850830078125, 0.678375244140625, 0.77166748046875, 0.864959716796875, 0.958251953125, 1.051544189453125, 1.14483642578125, 1.238128662109375, 1.3314208984375, 1.424713134765625, 1.51800537109375, 1.611297607421875, 1.70458984375, 1.797882080078125, 1.89117431640625, 1.984466552734375, 2.0777587890625, 2.171051025390625, 2.26434326171875, 2.357635498046875, 2.450927734375, 2.544219970703125, 2.63751220703125, 2.730804443359375, 2.8240966796875, 2.917388916015625, 3.01068115234375, 3.103973388671875, 3.197265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 10.0, 10.0, 6.0, 26.0, 26.0, 34.0, 57.0, 72.0, 89.0, 142.0, 206.0, 438.0, 1059.0, 2825.0, 9880.0, 41382.0, 243513.0, 3151226.0, 644660.0, 75120.0, 16697.0, 4313.0, 1391.0, 489.0, 208.0, 117.0, 79.0, 48.0, 46.0, 22.0, 21.0, 23.0, 11.0, 6.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.5963134765625, -13.192626953125, -12.7889404296875, -12.38525390625, -11.9815673828125, -11.577880859375, -11.1741943359375, -10.7705078125, -10.3668212890625, -9.963134765625, -9.5594482421875, -9.15576171875, -8.7520751953125, -8.348388671875, -7.9447021484375, -7.541015625, -7.1373291015625, -6.733642578125, -6.3299560546875, -5.92626953125, -5.5225830078125, -5.118896484375, -4.7152099609375, -4.3115234375, -3.9078369140625, -3.504150390625, -3.1004638671875, -2.69677734375, -2.2930908203125, -1.889404296875, -1.4857177734375, -1.08203125, -0.6783447265625, -0.274658203125, 0.1290283203125, 0.53271484375, 0.9364013671875, 1.340087890625, 1.7437744140625, 2.1474609375, 2.5511474609375, 2.954833984375, 3.3585205078125, 3.76220703125, 4.1658935546875, 4.569580078125, 4.9732666015625, 5.376953125, 5.7806396484375, 6.184326171875, 6.5880126953125, 6.99169921875, 7.3953857421875, 7.799072265625, 8.2027587890625, 8.6064453125, 9.0101318359375, 9.413818359375, 9.8175048828125, 10.22119140625, 10.6248779296875, 11.028564453125, 11.4322509765625, 11.8359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 3.0, 5.0, 10.0, 16.0, 19.0, 17.0, 32.0, 57.0, 56.0, 78.0, 109.0, 111.0, 193.0, 203.0, 344.0, 428.0, 523.0, 505.0, 347.0, 253.0, 186.0, 142.0, 113.0, 81.0, 61.0, 39.0, 35.0, 30.0, 20.0, 12.0, 8.0, 8.0, 10.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98046875, -7.71063232421875, -7.4407958984375, -7.17095947265625, -6.901123046875, -6.63128662109375, -6.3614501953125, -6.09161376953125, -5.82177734375, -5.55194091796875, -5.2821044921875, -5.01226806640625, -4.742431640625, -4.47259521484375, -4.2027587890625, -3.93292236328125, -3.6630859375, -3.39324951171875, -3.1234130859375, -2.85357666015625, -2.583740234375, -2.31390380859375, -2.0440673828125, -1.77423095703125, -1.50439453125, -1.23455810546875, -0.9647216796875, -0.69488525390625, -0.425048828125, -0.15521240234375, 0.1146240234375, 0.38446044921875, 0.654296875, 0.92413330078125, 1.1939697265625, 1.46380615234375, 1.733642578125, 2.00347900390625, 2.2733154296875, 2.54315185546875, 2.81298828125, 3.08282470703125, 3.3526611328125, 3.62249755859375, 3.892333984375, 4.16217041015625, 4.4320068359375, 4.70184326171875, 4.9716796875, 5.24151611328125, 5.5113525390625, 5.78118896484375, 6.051025390625, 6.32086181640625, 6.5906982421875, 6.86053466796875, 7.13037109375, 7.40020751953125, 7.6700439453125, 7.93988037109375, 8.209716796875, 8.47955322265625, 8.7493896484375, 9.01922607421875, 9.2890625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 14.0, 24.0, 29.0, 40.0, 52.0, 110.0, 165.0, 276.0, 413.0, 751.0, 1260.0, 2470.0, 4960.0, 9999.0, 22222.0, 52464.0, 135039.0, 416021.0, 1786240.0, 1271605.0, 307139.0, 105190.0, 42283.0, 18230.0, 8369.0, 4086.0, 2051.0, 1140.0, 589.0, 365.0, 220.0, 156.0, 86.0, 70.0, 39.0, 30.0, 20.0, 14.0, 8.0, 5.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.7230224609375, -10.375732421875, -10.0284423828125, -9.68115234375, -9.3338623046875, -8.986572265625, -8.6392822265625, -8.2919921875, -7.9447021484375, -7.597412109375, -7.2501220703125, -6.90283203125, -6.5555419921875, -6.208251953125, -5.8609619140625, -5.513671875, -5.1663818359375, -4.819091796875, -4.4718017578125, -4.12451171875, -3.7772216796875, -3.429931640625, -3.0826416015625, -2.7353515625, -2.3880615234375, -2.040771484375, -1.6934814453125, -1.34619140625, -0.9989013671875, -0.651611328125, -0.3043212890625, 0.04296875, 0.3902587890625, 0.737548828125, 1.0848388671875, 1.43212890625, 1.7794189453125, 2.126708984375, 2.4739990234375, 2.8212890625, 3.1685791015625, 3.515869140625, 3.8631591796875, 4.21044921875, 4.5577392578125, 4.905029296875, 5.2523193359375, 5.599609375, 5.9468994140625, 6.294189453125, 6.6414794921875, 6.98876953125, 7.3360595703125, 7.683349609375, 8.0306396484375, 8.3779296875, 8.7252197265625, 9.072509765625, 9.4197998046875, 9.76708984375, 10.1143798828125, 10.461669921875, 10.8089599609375, 11.15625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 12.0, 18.0, 31.0, 42.0, 72.0, 104.0, 106.0, 118.0, 119.0, 97.0, 76.0, 70.0, 46.0, 32.0, 21.0, 11.0, 10.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.48310089111328, -31.801393508911133, -30.11968421936035, -28.437976837158203, -26.756269454956055, -25.074562072753906, -23.392852783203125, -21.711145401000977, -20.029438018798828, -18.34773063659668, -16.6660213470459, -14.98431396484375, -13.302606582641602, -11.620898246765137, -9.939189910888672, -8.257482528686523, -6.575773239135742, -4.8940653800964355, -3.21235728263855, -1.530649185180664, 0.15105867385864258, 1.8327665328979492, 3.514474868774414, 5.1961822509765625, 6.877890586853027, 8.559598922729492, 10.24130630493164, 11.923014640808105, 13.60472297668457, 15.286430358886719, 16.9681396484375, 18.649845123291016, 20.331554412841797, 22.013261795043945, 23.694971084594727, 25.376678466796875, 27.058385848999023, 28.740093231201172, 30.421802520751953, 32.10350799560547, 33.78521728515625, 35.46692657470703, 37.14863204956055, 38.83034133911133, 40.51205062866211, 42.193756103515625, 43.875465393066406, 45.55717468261719, 47.23888397216797, 48.92059326171875, 50.602298736572266, 52.28400802612305, 53.96571731567383, 55.647422790527344, 57.329132080078125, 59.010841369628906, 60.69254684448242, 62.3742561340332, 64.05596160888672, 65.7376708984375, 67.41938018798828, 69.10108947753906, 70.78279113769531, 72.4645004272461, 74.14620971679688]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 5.0, 6.0, 12.0, 7.0, 19.0, 14.0, 25.0, 19.0, 19.0, 32.0, 25.0, 27.0, 31.0, 29.0, 31.0, 23.0, 37.0, 44.0, 40.0, 43.0, 31.0, 35.0, 30.0, 36.0, 28.0, 41.0, 25.0, 24.0, 29.0, 26.0, 23.0, 26.0, 21.0, 21.0, 12.0, 9.0, 8.0, 14.0, 11.0, 5.0, 10.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-23.457971572875977, -22.67638397216797, -21.894798278808594, -21.113210678100586, -20.331623077392578, -19.550037384033203, -18.768449783325195, -17.986862182617188, -17.205276489257812, -16.423688888549805, -15.642102241516113, -14.860515594482422, -14.078927993774414, -13.297341346740723, -12.515754699707031, -11.734167098999023, -10.952579498291016, -10.170992851257324, -9.389405250549316, -8.607818603515625, -7.826231479644775, -7.044644355773926, -6.263057708740234, -5.481470584869385, -4.699883460998535, -3.9182963371276855, -3.136709451675415, -2.3551225662231445, -1.573535442352295, -0.7919483184814453, -0.010361671447753906, 0.7712254524230957, 1.5528106689453125, 2.334397792816162, 3.1159846782684326, 3.897571563720703, 4.679158687591553, 5.460745811462402, 6.242332458496094, 7.023919582366943, 7.805506706237793, 8.587093353271484, 9.368680953979492, 10.150267601013184, 10.931854248046875, 11.713441848754883, 12.495028495788574, 13.276615142822266, 14.058202743530273, 14.839789390563965, 15.621376991271973, 16.402963638305664, 17.184551239013672, 17.966136932373047, 18.747724533081055, 19.529312133789062, 20.310897827148438, 21.092485427856445, 21.87407112121582, 22.655658721923828, 23.437246322631836, 24.218833923339844, 25.00041961669922, 25.782007217407227, 26.563594818115234]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 7.0, 7.0, 8.0, 9.0, 14.0, 11.0, 20.0, 27.0, 25.0, 25.0, 22.0, 22.0, 43.0, 46.0, 32.0, 40.0, 53.0, 54.0, 41.0, 40.0, 55.0, 45.0, 40.0, 33.0, 36.0, 28.0, 25.0, 30.0, 27.0, 20.0, 22.0, 24.0, 13.0, 8.0, 8.0, 5.0, 5.0, 7.0, 1.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-3.205078125, -3.119659423828125, -3.03424072265625, -2.948822021484375, -2.8634033203125, -2.777984619140625, -2.69256591796875, -2.607147216796875, -2.521728515625, -2.436309814453125, -2.35089111328125, -2.265472412109375, -2.1800537109375, -2.094635009765625, -2.00921630859375, -1.923797607421875, -1.83837890625, -1.752960205078125, -1.66754150390625, -1.582122802734375, -1.4967041015625, -1.411285400390625, -1.32586669921875, -1.240447998046875, -1.155029296875, -1.069610595703125, -0.98419189453125, -0.898773193359375, -0.8133544921875, -0.727935791015625, -0.64251708984375, -0.557098388671875, -0.4716796875, -0.386260986328125, -0.30084228515625, -0.215423583984375, -0.1300048828125, -0.044586181640625, 0.04083251953125, 0.126251220703125, 0.211669921875, 0.297088623046875, 0.38250732421875, 0.467926025390625, 0.5533447265625, 0.638763427734375, 0.72418212890625, 0.809600830078125, 0.89501953125, 0.980438232421875, 1.06585693359375, 1.151275634765625, 1.2366943359375, 1.322113037109375, 1.40753173828125, 1.492950439453125, 1.578369140625, 1.663787841796875, 1.74920654296875, 1.834625244140625, 1.9200439453125, 2.005462646484375, 2.09088134765625, 2.176300048828125, 2.26171875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 18.0, 16.0, 30.0, 42.0, 48.0, 84.0, 151.0, 243.0, 411.0, 696.0, 1106.0, 2007.0, 3663.0, 6465.0, 11642.0, 20738.0, 36624.0, 63697.0, 108125.0, 169672.0, 210704.0, 165801.0, 103977.0, 61419.0, 35484.0, 19879.0, 11132.0, 6247.0, 3622.0, 2001.0, 1140.0, 622.0, 415.0, 223.0, 147.0, 81.0, 56.0, 30.0, 35.0, 19.0, 13.0, 5.0, 7.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.822021484375, -8.55029296875, -8.278564453125, -8.0068359375, -7.735107421875, -7.46337890625, -7.191650390625, -6.919921875, -6.648193359375, -6.37646484375, -6.104736328125, -5.8330078125, -5.561279296875, -5.28955078125, -5.017822265625, -4.74609375, -4.474365234375, -4.20263671875, -3.930908203125, -3.6591796875, -3.387451171875, -3.11572265625, -2.843994140625, -2.572265625, -2.300537109375, -2.02880859375, -1.757080078125, -1.4853515625, -1.213623046875, -0.94189453125, -0.670166015625, -0.3984375, -0.126708984375, 0.14501953125, 0.416748046875, 0.6884765625, 0.960205078125, 1.23193359375, 1.503662109375, 1.775390625, 2.047119140625, 2.31884765625, 2.590576171875, 2.8623046875, 3.134033203125, 3.40576171875, 3.677490234375, 3.94921875, 4.220947265625, 4.49267578125, 4.764404296875, 5.0361328125, 5.307861328125, 5.57958984375, 5.851318359375, 6.123046875, 6.394775390625, 6.66650390625, 6.938232421875, 7.2099609375, 7.481689453125, 7.75341796875, 8.025146484375, 8.296875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 6.0, 13.0, 10.0, 11.0, 21.0, 11.0, 27.0, 24.0, 34.0, 38.0, 37.0, 45.0, 42.0, 26.0, 39.0, 45.0, 1065.0, 44.0, 26.0, 40.0, 50.0, 48.0, 36.0, 33.0, 29.0, 29.0, 29.0, 30.0, 21.0, 21.0, 10.0, 14.0, 13.0, 10.0, 7.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0], "bins": [-3.095703125, -3.013916015625, -2.93212890625, -2.850341796875, -2.7685546875, -2.686767578125, -2.60498046875, -2.523193359375, -2.44140625, -2.359619140625, -2.27783203125, -2.196044921875, -2.1142578125, -2.032470703125, -1.95068359375, -1.868896484375, -1.787109375, -1.705322265625, -1.62353515625, -1.541748046875, -1.4599609375, -1.378173828125, -1.29638671875, -1.214599609375, -1.1328125, -1.051025390625, -0.96923828125, -0.887451171875, -0.8056640625, -0.723876953125, -0.64208984375, -0.560302734375, -0.478515625, -0.396728515625, -0.31494140625, -0.233154296875, -0.1513671875, -0.069580078125, 0.01220703125, 0.093994140625, 0.17578125, 0.257568359375, 0.33935546875, 0.421142578125, 0.5029296875, 0.584716796875, 0.66650390625, 0.748291015625, 0.830078125, 0.911865234375, 0.99365234375, 1.075439453125, 1.1572265625, 1.239013671875, 1.32080078125, 1.402587890625, 1.484375, 1.566162109375, 1.64794921875, 1.729736328125, 1.8115234375, 1.893310546875, 1.97509765625, 2.056884765625, 2.138671875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 18.0, 13.0, 26.0, 48.0, 58.0, 82.0, 132.0, 173.0, 269.0, 325.0, 527.0, 865.0, 1259.0, 1950.0, 2870.0, 4819.0, 7792.0, 12962.0, 22089.0, 39442.0, 76980.0, 165527.0, 460942.0, 786702.0, 270316.0, 112549.0, 54791.0, 29724.0, 16845.0, 9934.0, 6027.0, 3904.0, 2373.0, 1622.0, 1008.0, 706.0, 446.0, 324.0, 235.0, 141.0, 99.0, 70.0, 41.0, 34.0, 24.0, 12.0, 10.0, 7.0, 9.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.54296875, -4.39764404296875, -4.2523193359375, -4.10699462890625, -3.961669921875, -3.81634521484375, -3.6710205078125, -3.52569580078125, -3.38037109375, -3.23504638671875, -3.0897216796875, -2.94439697265625, -2.799072265625, -2.65374755859375, -2.5084228515625, -2.36309814453125, -2.2177734375, -2.07244873046875, -1.9271240234375, -1.78179931640625, -1.636474609375, -1.49114990234375, -1.3458251953125, -1.20050048828125, -1.05517578125, -0.90985107421875, -0.7645263671875, -0.61920166015625, -0.473876953125, -0.32855224609375, -0.1832275390625, -0.03790283203125, 0.107421875, 0.25274658203125, 0.3980712890625, 0.54339599609375, 0.688720703125, 0.83404541015625, 0.9793701171875, 1.12469482421875, 1.27001953125, 1.41534423828125, 1.5606689453125, 1.70599365234375, 1.851318359375, 1.99664306640625, 2.1419677734375, 2.28729248046875, 2.4326171875, 2.57794189453125, 2.7232666015625, 2.86859130859375, 3.013916015625, 3.15924072265625, 3.3045654296875, 3.44989013671875, 3.59521484375, 3.74053955078125, 3.8858642578125, 4.03118896484375, 4.176513671875, 4.32183837890625, 4.4671630859375, 4.61248779296875, 4.7578125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 1.0, 5.0, 5.0, 4.0, 8.0, 16.0, 21.0, 32.0, 44.0, 45.0, 58.0, 112.0, 137.0, 130.0, 99.0, 78.0, 59.0, 38.0, 37.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.617462158203125, -2.53375244140625, -2.450042724609375, -2.3663330078125, -2.282623291015625, -2.19891357421875, -2.115203857421875, -2.031494140625, -1.947784423828125, -1.86407470703125, -1.780364990234375, -1.6966552734375, -1.612945556640625, -1.52923583984375, -1.445526123046875, -1.36181640625, -1.278106689453125, -1.19439697265625, -1.110687255859375, -1.0269775390625, -0.943267822265625, -0.85955810546875, -0.775848388671875, -0.692138671875, -0.608428955078125, -0.52471923828125, -0.441009521484375, -0.3572998046875, -0.273590087890625, -0.18988037109375, -0.106170654296875, -0.0224609375, 0.061248779296875, 0.14495849609375, 0.228668212890625, 0.3123779296875, 0.396087646484375, 0.47979736328125, 0.563507080078125, 0.647216796875, 0.730926513671875, 0.81463623046875, 0.898345947265625, 0.9820556640625, 1.065765380859375, 1.14947509765625, 1.233184814453125, 1.31689453125, 1.400604248046875, 1.48431396484375, 1.568023681640625, 1.6517333984375, 1.735443115234375, 1.81915283203125, 1.902862548828125, 1.986572265625, 2.070281982421875, 2.15399169921875, 2.237701416015625, 2.3214111328125, 2.405120849609375, 2.48883056640625, 2.572540283203125, 2.65625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 11.0, 3.0, 7.0, 12.0, 15.0, 19.0, 24.0, 38.0, 78.0, 99.0, 177.0, 323.0, 793.0, 2892.0, 21694.0, 991743.0, 25888.0, 3040.0, 910.0, 301.0, 172.0, 99.0, 61.0, 40.0, 28.0, 13.0, 9.0, 17.0, 6.0, 9.0, 7.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.90625, -34.80224609375, -33.6982421875, -32.59423828125, -31.490234375, -30.38623046875, -29.2822265625, -28.17822265625, -27.07421875, -25.97021484375, -24.8662109375, -23.76220703125, -22.658203125, -21.55419921875, -20.4501953125, -19.34619140625, -18.2421875, -17.13818359375, -16.0341796875, -14.93017578125, -13.826171875, -12.72216796875, -11.6181640625, -10.51416015625, -9.41015625, -8.30615234375, -7.2021484375, -6.09814453125, -4.994140625, -3.89013671875, -2.7861328125, -1.68212890625, -0.578125, 0.52587890625, 1.6298828125, 2.73388671875, 3.837890625, 4.94189453125, 6.0458984375, 7.14990234375, 8.25390625, 9.35791015625, 10.4619140625, 11.56591796875, 12.669921875, 13.77392578125, 14.8779296875, 15.98193359375, 17.0859375, 18.18994140625, 19.2939453125, 20.39794921875, 21.501953125, 22.60595703125, 23.7099609375, 24.81396484375, 25.91796875, 27.02197265625, 28.1259765625, 29.22998046875, 30.333984375, 31.43798828125, 32.5419921875, 33.64599609375, 34.75]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 15.0, 40.0, 74.0, 179.0, 277.0, 234.0, 117.0, 35.0, 19.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.985456705093384, -2.708726644515991, -2.4319965839385986, -2.155266523361206, -1.8785364627838135, -1.601806402206421, -1.3250763416290283, -1.0483462810516357, -0.7716162204742432, -0.4948861598968506, -0.218156099319458, 0.05857396125793457, 0.33530402183532715, 0.6120340824127197, 0.8887641429901123, 1.1654942035675049, 1.4422242641448975, 1.71895432472229, 1.9956843852996826, 2.272414445877075, 2.5491445064544678, 2.8258745670318604, 3.102604627609253, 3.3793346881866455, 3.656064748764038, 3.9327948093414307, 4.209525108337402, 4.486254692077637, 4.7629852294921875, 5.039714813232422, 5.316445350646973, 5.593174934387207, 5.869905471801758, 6.14663553237915, 6.423365592956543, 6.7000956535339355, 6.976825714111328, 7.253555774688721, 7.530285835266113, 7.807015895843506, 8.083745956420898, 8.360475540161133, 8.637206077575684, 8.913936614990234, 9.190666198730469, 9.467395782470703, 9.744126319885254, 10.020856857299805, 10.297586441040039, 10.574316024780273, 10.851046562194824, 11.127777099609375, 11.40450668334961, 11.681236267089844, 11.957966804504395, 12.234697341918945, 12.51142692565918, 12.788156509399414, 13.064887046813965, 13.341617584228516, 13.61834716796875, 13.895076751708984, 14.171807289123535, 14.448537826538086, 14.72526741027832]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 4.0, 13.0, 10.0, 11.0, 16.0, 19.0, 19.0, 18.0, 29.0, 14.0, 30.0, 37.0, 38.0, 32.0, 47.0, 26.0, 32.0, 40.0, 42.0, 33.0, 45.0, 47.0, 44.0, 38.0, 41.0, 36.0, 26.0, 37.0, 25.0, 19.0, 10.0, 22.0, 14.0, 13.0, 12.0, 6.0, 18.0, 6.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.1520514488220215, -2.0776078701019287, -2.003164529800415, -1.9287210702896118, -1.8542776107788086, -1.7798341512680054, -1.7053906917572021, -1.6309471130371094, -1.5565037727355957, -1.4820603132247925, -1.4076168537139893, -1.333173394203186, -1.2587299346923828, -1.1842864751815796, -1.1098430156707764, -1.0353994369506836, -0.9609559774398804, -0.8865125179290771, -0.8120690584182739, -0.7376255989074707, -0.6631821393966675, -0.5887386798858643, -0.5142951607704163, -0.43985170125961304, -0.3654082417488098, -0.2909647822380066, -0.21652130782604218, -0.14207783341407776, -0.06763437390327454, 0.0068090856075286865, 0.0812525749206543, 0.15569603443145752, 0.23013949394226074, 0.30458295345306396, 0.3790264129638672, 0.4534699022769928, 0.5279133319854736, 0.6023567914962769, 0.6768003106117249, 0.7512437701225281, 0.8256872296333313, 0.9001306891441345, 0.9745741486549377, 1.0490176677703857, 1.123461127281189, 1.1979045867919922, 1.2723480463027954, 1.3467915058135986, 1.4212349653244019, 1.495678424835205, 1.5701218843460083, 1.6445653438568115, 1.7190088033676147, 1.793452262878418, 1.8678958415985107, 1.9423391819000244, 2.016782760620117, 2.09122633934021, 2.1656696796417236, 2.2401132583618164, 2.31455659866333, 2.389000177383423, 2.4634435176849365, 2.5378870964050293, 2.612330436706543]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 10.0, 10.0, 9.0, 13.0, 23.0, 26.0, 26.0, 25.0, 23.0, 30.0, 29.0, 36.0, 34.0, 29.0, 47.0, 49.0, 51.0, 49.0, 52.0, 48.0, 38.0, 49.0, 28.0, 34.0, 31.0, 29.0, 25.0, 29.0, 20.0, 18.0, 14.0, 11.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.595703125, -2.5093994140625, -2.423095703125, -2.3367919921875, -2.25048828125, -2.1641845703125, -2.077880859375, -1.9915771484375, -1.9052734375, -1.8189697265625, -1.732666015625, -1.6463623046875, -1.56005859375, -1.4737548828125, -1.387451171875, -1.3011474609375, -1.21484375, -1.1285400390625, -1.042236328125, -0.9559326171875, -0.86962890625, -0.7833251953125, -0.697021484375, -0.6107177734375, -0.5244140625, -0.4381103515625, -0.351806640625, -0.2655029296875, -0.17919921875, -0.0928955078125, -0.006591796875, 0.0797119140625, 0.166015625, 0.2523193359375, 0.338623046875, 0.4249267578125, 0.51123046875, 0.5975341796875, 0.683837890625, 0.7701416015625, 0.8564453125, 0.9427490234375, 1.029052734375, 1.1153564453125, 1.20166015625, 1.2879638671875, 1.374267578125, 1.4605712890625, 1.546875, 1.6331787109375, 1.719482421875, 1.8057861328125, 1.89208984375, 1.9783935546875, 2.064697265625, 2.1510009765625, 2.2373046875, 2.3236083984375, 2.409912109375, 2.4962158203125, 2.58251953125, 2.6688232421875, 2.755126953125, 2.8414306640625, 2.927734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 8.0, 9.0, 9.0, 14.0, 20.0, 36.0, 38.0, 53.0, 62.0, 100.0, 131.0, 139.0, 217.0, 217.0, 350.0, 481.0, 669.0, 833.0, 1282.0, 1838.0, 2900.0, 5092.0, 10417.0, 29727.0, 124476.0, 515108.0, 265023.0, 54863.0, 16194.0, 6824.0, 3697.0, 2326.0, 1524.0, 1013.0, 757.0, 518.0, 388.0, 309.0, 208.0, 160.0, 123.0, 88.0, 90.0, 57.0, 37.0, 41.0, 25.0, 23.0, 15.0, 10.0, 4.0, 5.0, 6.0, 2.0, 4.0, 3.0], "bins": [-6.8203125, -6.61810302734375, -6.4158935546875, -6.21368408203125, -6.011474609375, -5.80926513671875, -5.6070556640625, -5.40484619140625, -5.20263671875, -5.00042724609375, -4.7982177734375, -4.59600830078125, -4.393798828125, -4.19158935546875, -3.9893798828125, -3.78717041015625, -3.5849609375, -3.38275146484375, -3.1805419921875, -2.97833251953125, -2.776123046875, -2.57391357421875, -2.3717041015625, -2.16949462890625, -1.96728515625, -1.76507568359375, -1.5628662109375, -1.36065673828125, -1.158447265625, -0.95623779296875, -0.7540283203125, -0.55181884765625, -0.349609375, -0.14739990234375, 0.0548095703125, 0.25701904296875, 0.459228515625, 0.66143798828125, 0.8636474609375, 1.06585693359375, 1.26806640625, 1.47027587890625, 1.6724853515625, 1.87469482421875, 2.076904296875, 2.27911376953125, 2.4813232421875, 2.68353271484375, 2.8857421875, 3.08795166015625, 3.2901611328125, 3.49237060546875, 3.694580078125, 3.89678955078125, 4.0989990234375, 4.30120849609375, 4.50341796875, 4.70562744140625, 4.9078369140625, 5.11004638671875, 5.312255859375, 5.51446533203125, 5.7166748046875, 5.91888427734375, 6.12109375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 7.0, 5.0, 11.0, 2.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 16.0, 32.0, 41.0, 35.0, 56.0, 44.0, 70.0, 106.0, 131.0, 1436.0, 325.0, 143.0, 88.0, 50.0, 45.0, 46.0, 31.0, 39.0, 28.0, 20.0, 27.0, 23.0, 15.0, 14.0, 11.0, 10.0, 7.0, 8.0, 10.0, 8.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.4737548828125, -10.135009765625, -9.7962646484375, -9.45751953125, -9.1187744140625, -8.780029296875, -8.4412841796875, -8.1025390625, -7.7637939453125, -7.425048828125, -7.0863037109375, -6.74755859375, -6.4088134765625, -6.070068359375, -5.7313232421875, -5.392578125, -5.0538330078125, -4.715087890625, -4.3763427734375, -4.03759765625, -3.6988525390625, -3.360107421875, -3.0213623046875, -2.6826171875, -2.3438720703125, -2.005126953125, -1.6663818359375, -1.32763671875, -0.9888916015625, -0.650146484375, -0.3114013671875, 0.02734375, 0.3660888671875, 0.704833984375, 1.0435791015625, 1.38232421875, 1.7210693359375, 2.059814453125, 2.3985595703125, 2.7373046875, 3.0760498046875, 3.414794921875, 3.7535400390625, 4.09228515625, 4.4310302734375, 4.769775390625, 5.1085205078125, 5.447265625, 5.7860107421875, 6.124755859375, 6.4635009765625, 6.80224609375, 7.1409912109375, 7.479736328125, 7.8184814453125, 8.1572265625, 8.4959716796875, 8.834716796875, 9.1734619140625, 9.51220703125, 9.8509521484375, 10.189697265625, 10.5284423828125, 10.8671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 7.0, 10.0, 11.0, 15.0, 11.0, 11.0, 19.0, 21.0, 34.0, 53.0, 60.0, 88.0, 166.0, 304.0, 674.0, 1735.0, 4694.0, 15175.0, 68103.0, 1128803.0, 1811984.0, 86848.0, 17988.0, 5406.0, 1920.0, 725.0, 320.0, 166.0, 102.0, 60.0, 40.0, 40.0, 20.0, 23.0, 16.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.796875, -13.3526611328125, -12.908447265625, -12.4642333984375, -12.02001953125, -11.5758056640625, -11.131591796875, -10.6873779296875, -10.2431640625, -9.7989501953125, -9.354736328125, -8.9105224609375, -8.46630859375, -8.0220947265625, -7.577880859375, -7.1336669921875, -6.689453125, -6.2452392578125, -5.801025390625, -5.3568115234375, -4.91259765625, -4.4683837890625, -4.024169921875, -3.5799560546875, -3.1357421875, -2.6915283203125, -2.247314453125, -1.8031005859375, -1.35888671875, -0.9146728515625, -0.470458984375, -0.0262451171875, 0.41796875, 0.8621826171875, 1.306396484375, 1.7506103515625, 2.19482421875, 2.6390380859375, 3.083251953125, 3.5274658203125, 3.9716796875, 4.4158935546875, 4.860107421875, 5.3043212890625, 5.74853515625, 6.1927490234375, 6.636962890625, 7.0811767578125, 7.525390625, 7.9696044921875, 8.413818359375, 8.8580322265625, 9.30224609375, 9.7464599609375, 10.190673828125, 10.6348876953125, 11.0791015625, 11.5233154296875, 11.967529296875, 12.4117431640625, 12.85595703125, 13.3001708984375, 13.744384765625, 14.1885986328125, 14.6328125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 18.0, 102.0, 255.0, 362.0, 195.0, 69.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.799560546875, -82.53303527832031, -80.26651763916016, -77.99999237060547, -75.73346710205078, -73.4669418334961, -71.20042419433594, -68.93389892578125, -66.66737365722656, -64.40084838867188, -62.13432693481445, -59.86780548095703, -57.601280212402344, -55.33475875854492, -53.0682373046875, -50.80171203613281, -48.53519058227539, -46.26866912841797, -44.00214385986328, -41.73562240600586, -39.46909713745117, -37.20257568359375, -34.93605041503906, -32.66952896118164, -30.403005599975586, -28.13648223876953, -25.869958877563477, -23.603435516357422, -21.3369140625, -19.070388793945312, -16.80386734008789, -14.537343978881836, -12.270820617675781, -10.004297256469727, -7.73777437210083, -5.471251487731934, -3.204728126525879, -0.9382047653198242, 1.328317642211914, 3.5948410034179688, 5.861364364624023, 8.127887725830078, 10.394411087036133, 12.660933494567871, 14.927456855773926, 17.193981170654297, 19.46050262451172, 21.727025985717773, 23.993549346923828, 26.260072708129883, 28.526596069335938, 30.79311752319336, 33.05964279174805, 35.32616424560547, 37.592689514160156, 39.85921096801758, 42.125732421875, 44.39225387573242, 46.65877914428711, 48.92530059814453, 51.19182586669922, 53.45834732055664, 55.72486877441406, 57.99139404296875, 60.25791931152344]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 15.0, 6.0, 17.0, 15.0, 10.0, 17.0, 19.0, 23.0, 23.0, 31.0, 28.0, 24.0, 32.0, 40.0, 45.0, 43.0, 45.0, 49.0, 31.0, 49.0, 35.0, 41.0, 39.0, 31.0, 32.0, 30.0, 34.0, 23.0, 21.0, 15.0, 26.0, 14.0, 15.0, 13.0, 10.0, 6.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0], "bins": [-38.788143157958984, -37.717044830322266, -36.64594650268555, -35.57484817504883, -34.50374984741211, -33.43265151977539, -32.36155319213867, -31.290454864501953, -30.219356536865234, -29.148258209228516, -28.077159881591797, -27.006061553955078, -25.93496322631836, -24.86386489868164, -23.792766571044922, -22.721668243408203, -21.65056800842285, -20.579469680786133, -19.508371353149414, -18.437273025512695, -17.366174697875977, -16.295076370239258, -15.223977088928223, -14.152878761291504, -13.081780433654785, -12.010682106018066, -10.939583778381348, -9.868484497070312, -8.797386169433594, -7.726288318634033, -6.655189514160156, -5.5840911865234375, -4.512994766235352, -3.441896438598633, -2.370797872543335, -1.299699306488037, -0.22860097885131836, 0.8424973487854004, 1.9135961532592773, 2.984694480895996, 4.055792808532715, 5.126891136169434, 6.197989463806152, 7.269088268280029, 8.340187072753906, 9.411285400390625, 10.482383728027344, 11.553482055664062, 12.624580383300781, 13.6956787109375, 14.766777038574219, 15.837875366210938, 16.908973693847656, 17.980072021484375, 19.051170349121094, 20.122268676757812, 21.19336700439453, 22.26446533203125, 23.33556365966797, 24.406661987304688, 25.477760314941406, 26.548858642578125, 27.619956970214844, 28.691055297851562, 29.762155532836914]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 3.0, 6.0, 7.0, 8.0, 15.0, 8.0, 17.0, 13.0, 10.0, 24.0, 18.0, 34.0, 32.0, 37.0, 32.0, 32.0, 40.0, 40.0, 43.0, 60.0, 47.0, 39.0, 37.0, 42.0, 57.0, 34.0, 43.0, 27.0, 34.0, 21.0, 22.0, 27.0, 14.0, 24.0, 15.0, 7.0, 7.0, 2.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.865234375, -2.7734375, -2.681640625, -2.58984375, -2.498046875, -2.40625, -2.314453125, -2.22265625, -2.130859375, -2.0390625, -1.947265625, -1.85546875, -1.763671875, -1.671875, -1.580078125, -1.48828125, -1.396484375, -1.3046875, -1.212890625, -1.12109375, -1.029296875, -0.9375, -0.845703125, -0.75390625, -0.662109375, -0.5703125, -0.478515625, -0.38671875, -0.294921875, -0.203125, -0.111328125, -0.01953125, 0.072265625, 0.1640625, 0.255859375, 0.34765625, 0.439453125, 0.53125, 0.623046875, 0.71484375, 0.806640625, 0.8984375, 0.990234375, 1.08203125, 1.173828125, 1.265625, 1.357421875, 1.44921875, 1.541015625, 1.6328125, 1.724609375, 1.81640625, 1.908203125, 2.0, 2.091796875, 2.18359375, 2.275390625, 2.3671875, 2.458984375, 2.55078125, 2.642578125, 2.734375, 2.826171875, 2.91796875, 3.009765625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 10.0, 4.0, 21.0, 22.0, 23.0, 39.0, 48.0, 75.0, 89.0, 162.0, 275.0, 487.0, 845.0, 1720.0, 3655.0, 8357.0, 21014.0, 59518.0, 233208.0, 2135934.0, 1473490.0, 172676.0, 49698.0, 18272.0, 7450.0, 3444.0, 1720.0, 839.0, 406.0, 288.0, 150.0, 105.0, 66.0, 42.0, 30.0, 21.0, 17.0, 16.0, 12.0, 8.0, 5.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8306884765625, -7.559814453125, -7.2889404296875, -7.01806640625, -6.7471923828125, -6.476318359375, -6.2054443359375, -5.9345703125, -5.6636962890625, -5.392822265625, -5.1219482421875, -4.85107421875, -4.5802001953125, -4.309326171875, -4.0384521484375, -3.767578125, -3.4967041015625, -3.225830078125, -2.9549560546875, -2.68408203125, -2.4132080078125, -2.142333984375, -1.8714599609375, -1.6005859375, -1.3297119140625, -1.058837890625, -0.7879638671875, -0.51708984375, -0.2462158203125, 0.024658203125, 0.2955322265625, 0.56640625, 0.8372802734375, 1.108154296875, 1.3790283203125, 1.64990234375, 1.9207763671875, 2.191650390625, 2.4625244140625, 2.7333984375, 3.0042724609375, 3.275146484375, 3.5460205078125, 3.81689453125, 4.0877685546875, 4.358642578125, 4.6295166015625, 4.900390625, 5.1712646484375, 5.442138671875, 5.7130126953125, 5.98388671875, 6.2547607421875, 6.525634765625, 6.7965087890625, 7.0673828125, 7.3382568359375, 7.609130859375, 7.8800048828125, 8.15087890625, 8.4217529296875, 8.692626953125, 8.9635009765625, 9.234375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 15.0, 9.0, 17.0, 21.0, 39.0, 34.0, 53.0, 65.0, 84.0, 106.0, 99.0, 166.0, 212.0, 293.0, 413.0, 499.0, 438.0, 355.0, 274.0, 202.0, 131.0, 97.0, 85.0, 72.0, 45.0, 39.0, 27.0, 33.0, 28.0, 22.0, 19.0, 13.0, 7.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.933349609375, -6.71435546875, -6.495361328125, -6.2763671875, -6.057373046875, -5.83837890625, -5.619384765625, -5.400390625, -5.181396484375, -4.96240234375, -4.743408203125, -4.5244140625, -4.305419921875, -4.08642578125, -3.867431640625, -3.6484375, -3.429443359375, -3.21044921875, -2.991455078125, -2.7724609375, -2.553466796875, -2.33447265625, -2.115478515625, -1.896484375, -1.677490234375, -1.45849609375, -1.239501953125, -1.0205078125, -0.801513671875, -0.58251953125, -0.363525390625, -0.14453125, 0.074462890625, 0.29345703125, 0.512451171875, 0.7314453125, 0.950439453125, 1.16943359375, 1.388427734375, 1.607421875, 1.826416015625, 2.04541015625, 2.264404296875, 2.4833984375, 2.702392578125, 2.92138671875, 3.140380859375, 3.359375, 3.578369140625, 3.79736328125, 4.016357421875, 4.2353515625, 4.454345703125, 4.67333984375, 4.892333984375, 5.111328125, 5.330322265625, 5.54931640625, 5.768310546875, 5.9873046875, 6.206298828125, 6.42529296875, 6.644287109375, 6.86328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 11.0, 8.0, 18.0, 20.0, 43.0, 59.0, 103.0, 162.0, 244.0, 478.0, 907.0, 1743.0, 3582.0, 7651.0, 17187.0, 42960.0, 117006.0, 397122.0, 1949928.0, 1247151.0, 265127.0, 85117.0, 32281.0, 13383.0, 6012.0, 2813.0, 1405.0, 766.0, 353.0, 247.0, 150.0, 92.0, 47.0, 24.0, 20.0, 12.0, 13.0, 9.0, 3.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.40625, -10.0576171875, -9.708984375, -9.3603515625, -9.01171875, -8.6630859375, -8.314453125, -7.9658203125, -7.6171875, -7.2685546875, -6.919921875, -6.5712890625, -6.22265625, -5.8740234375, -5.525390625, -5.1767578125, -4.828125, -4.4794921875, -4.130859375, -3.7822265625, -3.43359375, -3.0849609375, -2.736328125, -2.3876953125, -2.0390625, -1.6904296875, -1.341796875, -0.9931640625, -0.64453125, -0.2958984375, 0.052734375, 0.4013671875, 0.75, 1.0986328125, 1.447265625, 1.7958984375, 2.14453125, 2.4931640625, 2.841796875, 3.1904296875, 3.5390625, 3.8876953125, 4.236328125, 4.5849609375, 4.93359375, 5.2822265625, 5.630859375, 5.9794921875, 6.328125, 6.6767578125, 7.025390625, 7.3740234375, 7.72265625, 8.0712890625, 8.419921875, 8.7685546875, 9.1171875, 9.4658203125, 9.814453125, 10.1630859375, 10.51171875, 10.8603515625, 11.208984375, 11.5576171875, 11.90625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 11.0, 24.0, 50.0, 121.0, 213.0, 229.0, 179.0, 106.0, 44.0, 26.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.73938751220703, -82.72002410888672, -79.70066833496094, -76.68130493164062, -73.66194152832031, -70.642578125, -67.62322235107422, -64.6038589477539, -61.58449935913086, -58.56513977050781, -55.5457763671875, -52.52641677856445, -49.507057189941406, -46.487693786621094, -43.46833419799805, -40.448974609375, -37.42961120605469, -34.41025161743164, -31.390888214111328, -28.37152862548828, -25.3521671295166, -22.332805633544922, -19.313446044921875, -16.294084548950195, -13.274723052978516, -10.255361557006836, -7.236001014709473, -4.216640472412109, -1.1972789764404297, 1.82208251953125, 4.841442108154297, 7.860803604125977, 10.880165100097656, 13.899526596069336, 16.918888092041016, 19.938247680664062, 22.957609176635742, 25.976970672607422, 28.99633026123047, 32.01569366455078, 35.03505325317383, 38.054412841796875, 41.07377624511719, 44.093135833740234, 47.11249542236328, 50.131858825683594, 53.15121841430664, 56.17057800292969, 59.18994140625, 62.20930099487305, 65.2286605834961, 68.2480239868164, 71.26738739013672, 74.2867431640625, 77.30610656738281, 80.32546997070312, 83.34483337402344, 86.36419677734375, 89.38355255126953, 92.40291595458984, 95.42227935791016, 98.44163513183594, 101.46099853515625, 104.48036193847656, 107.49971771240234]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 8.0, 16.0, 18.0, 5.0, 15.0, 22.0, 23.0, 33.0, 28.0, 20.0, 25.0, 34.0, 30.0, 34.0, 33.0, 36.0, 41.0, 41.0, 46.0, 40.0, 39.0, 33.0, 45.0, 35.0, 32.0, 29.0, 33.0, 25.0, 24.0, 18.0, 19.0, 15.0, 16.0, 15.0, 16.0, 4.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-24.272066116333008, -23.5133056640625, -22.754545211791992, -21.995784759521484, -21.237024307250977, -20.47826385498047, -19.719505310058594, -18.960742950439453, -18.201984405517578, -17.44322395324707, -16.684463500976562, -15.925703048706055, -15.166942596435547, -14.408182144165039, -13.649422645568848, -12.89066219329834, -12.131900787353516, -11.373140335083008, -10.6143798828125, -9.855619430541992, -9.096858978271484, -8.338098526000977, -7.579339027404785, -6.820578575134277, -6.0618181228637695, -5.303057670593262, -4.544297218322754, -3.7855372428894043, -3.0267767906188965, -2.2680163383483887, -1.509256362915039, -0.7504959106445312, 0.00826263427734375, 0.767022967338562, 1.5257833003997803, 2.284543514251709, 3.043303966522217, 3.8020644187927246, 4.560824394226074, 5.319584846496582, 6.07834529876709, 6.837105751037598, 7.5958662033081055, 8.354625701904297, 9.113386154174805, 9.872146606445312, 10.63090705871582, 11.389667510986328, 12.148427963256836, 12.907188415527344, 13.665948867797852, 14.42470932006836, 15.183469772338867, 15.942230224609375, 16.70098876953125, 17.45975112915039, 18.218509674072266, 18.977270126342773, 19.73603057861328, 20.49479103088379, 21.253551483154297, 22.012311935424805, 22.771072387695312, 23.529830932617188, 24.288593292236328]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 11.0, 14.0, 9.0, 15.0, 18.0, 19.0, 9.0, 22.0, 32.0, 37.0, 25.0, 44.0, 47.0, 32.0, 54.0, 66.0, 56.0, 51.0, 38.0, 40.0, 45.0, 36.0, 39.0, 33.0, 30.0, 28.0, 22.0, 28.0, 16.0, 18.0, 10.0, 9.0, 16.0, 4.0, 5.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.750823974609375, -2.65203857421875, -2.553253173828125, -2.4544677734375, -2.355682373046875, -2.25689697265625, -2.158111572265625, -2.059326171875, -1.960540771484375, -1.86175537109375, -1.762969970703125, -1.6641845703125, -1.565399169921875, -1.46661376953125, -1.367828369140625, -1.26904296875, -1.170257568359375, -1.07147216796875, -0.972686767578125, -0.8739013671875, -0.775115966796875, -0.67633056640625, -0.577545166015625, -0.478759765625, -0.379974365234375, -0.28118896484375, -0.182403564453125, -0.0836181640625, 0.015167236328125, 0.11395263671875, 0.212738037109375, 0.3115234375, 0.410308837890625, 0.50909423828125, 0.607879638671875, 0.7066650390625, 0.805450439453125, 0.90423583984375, 1.003021240234375, 1.101806640625, 1.200592041015625, 1.29937744140625, 1.398162841796875, 1.4969482421875, 1.595733642578125, 1.69451904296875, 1.793304443359375, 1.89208984375, 1.990875244140625, 2.08966064453125, 2.188446044921875, 2.2872314453125, 2.386016845703125, 2.48480224609375, 2.583587646484375, 2.682373046875, 2.781158447265625, 2.87994384765625, 2.978729248046875, 3.0775146484375, 3.176300048828125, 3.27508544921875, 3.373870849609375, 3.47265625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 11.0, 17.0, 20.0, 25.0, 56.0, 70.0, 123.0, 205.0, 308.0, 515.0, 764.0, 1243.0, 2109.0, 3350.0, 5792.0, 9677.0, 15658.0, 25828.0, 41987.0, 66963.0, 104375.0, 165425.0, 223594.0, 140407.0, 90590.0, 57704.0, 35775.0, 22019.0, 13255.0, 8056.0, 4875.0, 3011.0, 1830.0, 1124.0, 665.0, 404.0, 262.0, 176.0, 96.0, 66.0, 43.0, 19.0, 20.0, 16.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.625, -8.3582763671875, -8.091552734375, -7.8248291015625, -7.55810546875, -7.2913818359375, -7.024658203125, -6.7579345703125, -6.4912109375, -6.2244873046875, -5.957763671875, -5.6910400390625, -5.42431640625, -5.1575927734375, -4.890869140625, -4.6241455078125, -4.357421875, -4.0906982421875, -3.823974609375, -3.5572509765625, -3.29052734375, -3.0238037109375, -2.757080078125, -2.4903564453125, -2.2236328125, -1.9569091796875, -1.690185546875, -1.4234619140625, -1.15673828125, -0.8900146484375, -0.623291015625, -0.3565673828125, -0.08984375, 0.1768798828125, 0.443603515625, 0.7103271484375, 0.97705078125, 1.2437744140625, 1.510498046875, 1.7772216796875, 2.0439453125, 2.3106689453125, 2.577392578125, 2.8441162109375, 3.11083984375, 3.3775634765625, 3.644287109375, 3.9110107421875, 4.177734375, 4.4444580078125, 4.711181640625, 4.9779052734375, 5.24462890625, 5.5113525390625, 5.778076171875, 6.0447998046875, 6.3115234375, 6.5782470703125, 6.844970703125, 7.1116943359375, 7.37841796875, 7.6451416015625, 7.911865234375, 8.1785888671875, 8.4453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 4.0, 3.0, 4.0, 7.0, 4.0, 14.0, 16.0, 17.0, 13.0, 22.0, 15.0, 34.0, 30.0, 32.0, 35.0, 41.0, 34.0, 39.0, 43.0, 44.0, 1065.0, 39.0, 35.0, 30.0, 51.0, 42.0, 32.0, 39.0, 30.0, 25.0, 30.0, 16.0, 18.0, 22.0, 19.0, 19.0, 15.0, 7.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.638580322265625, -2.55059814453125, -2.462615966796875, -2.3746337890625, -2.286651611328125, -2.19866943359375, -2.110687255859375, -2.022705078125, -1.934722900390625, -1.84674072265625, -1.758758544921875, -1.6707763671875, -1.582794189453125, -1.49481201171875, -1.406829833984375, -1.31884765625, -1.230865478515625, -1.14288330078125, -1.054901123046875, -0.9669189453125, -0.878936767578125, -0.79095458984375, -0.702972412109375, -0.614990234375, -0.527008056640625, -0.43902587890625, -0.351043701171875, -0.2630615234375, -0.175079345703125, -0.08709716796875, 0.000885009765625, 0.0888671875, 0.176849365234375, 0.26483154296875, 0.352813720703125, 0.4407958984375, 0.528778076171875, 0.61676025390625, 0.704742431640625, 0.792724609375, 0.880706787109375, 0.96868896484375, 1.056671142578125, 1.1446533203125, 1.232635498046875, 1.32061767578125, 1.408599853515625, 1.49658203125, 1.584564208984375, 1.67254638671875, 1.760528564453125, 1.8485107421875, 1.936492919921875, 2.02447509765625, 2.112457275390625, 2.200439453125, 2.288421630859375, 2.37640380859375, 2.464385986328125, 2.5523681640625, 2.640350341796875, 2.72833251953125, 2.816314697265625, 2.904296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 14.0, 16.0, 26.0, 39.0, 45.0, 61.0, 112.0, 150.0, 180.0, 262.0, 369.0, 537.0, 759.0, 1024.0, 1591.0, 2188.0, 3304.0, 5010.0, 7429.0, 11715.0, 18800.0, 31026.0, 53240.0, 98597.0, 207736.0, 680460.0, 566181.0, 186296.0, 91029.0, 49457.0, 28884.0, 17623.0, 11161.0, 7106.0, 4539.0, 3100.0, 2089.0, 1443.0, 1061.0, 706.0, 509.0, 354.0, 256.0, 170.0, 147.0, 100.0, 74.0, 55.0, 25.0, 20.0, 17.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.84765625, -4.69586181640625, -4.5440673828125, -4.39227294921875, -4.240478515625, -4.08868408203125, -3.9368896484375, -3.78509521484375, -3.63330078125, -3.48150634765625, -3.3297119140625, -3.17791748046875, -3.026123046875, -2.87432861328125, -2.7225341796875, -2.57073974609375, -2.4189453125, -2.26715087890625, -2.1153564453125, -1.96356201171875, -1.811767578125, -1.65997314453125, -1.5081787109375, -1.35638427734375, -1.20458984375, -1.05279541015625, -0.9010009765625, -0.74920654296875, -0.597412109375, -0.44561767578125, -0.2938232421875, -0.14202880859375, 0.009765625, 0.16156005859375, 0.3133544921875, 0.46514892578125, 0.616943359375, 0.76873779296875, 0.9205322265625, 1.07232666015625, 1.22412109375, 1.37591552734375, 1.5277099609375, 1.67950439453125, 1.831298828125, 1.98309326171875, 2.1348876953125, 2.28668212890625, 2.4384765625, 2.59027099609375, 2.7420654296875, 2.89385986328125, 3.045654296875, 3.19744873046875, 3.3492431640625, 3.50103759765625, 3.65283203125, 3.80462646484375, 3.9564208984375, 4.10821533203125, 4.260009765625, 4.41180419921875, 4.5635986328125, 4.71539306640625, 4.8671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 8.0, 5.0, 6.0, 9.0, 16.0, 3.0, 15.0, 18.0, 30.0, 32.0, 42.0, 52.0, 57.0, 103.0, 92.0, 105.0, 70.0, 75.0, 54.0, 44.0, 35.0, 26.0, 22.0, 14.0, 17.0, 17.0, 8.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.452545166015625, -2.37774658203125, -2.302947998046875, -2.2281494140625, -2.153350830078125, -2.07855224609375, -2.003753662109375, -1.928955078125, -1.854156494140625, -1.77935791015625, -1.704559326171875, -1.6297607421875, -1.554962158203125, -1.48016357421875, -1.405364990234375, -1.33056640625, -1.255767822265625, -1.18096923828125, -1.106170654296875, -1.0313720703125, -0.956573486328125, -0.88177490234375, -0.806976318359375, -0.732177734375, -0.657379150390625, -0.58258056640625, -0.507781982421875, -0.4329833984375, -0.358184814453125, -0.28338623046875, -0.208587646484375, -0.1337890625, -0.058990478515625, 0.01580810546875, 0.090606689453125, 0.1654052734375, 0.240203857421875, 0.31500244140625, 0.389801025390625, 0.464599609375, 0.539398193359375, 0.61419677734375, 0.688995361328125, 0.7637939453125, 0.838592529296875, 0.91339111328125, 0.988189697265625, 1.06298828125, 1.137786865234375, 1.21258544921875, 1.287384033203125, 1.3621826171875, 1.436981201171875, 1.51177978515625, 1.586578369140625, 1.661376953125, 1.736175537109375, 1.81097412109375, 1.885772705078125, 1.9605712890625, 2.035369873046875, 2.11016845703125, 2.184967041015625, 2.259765625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 12.0, 12.0, 9.0, 14.0, 32.0, 30.0, 39.0, 49.0, 64.0, 75.0, 106.0, 183.0, 232.0, 576.0, 2911.0, 86224.0, 926432.0, 28494.0, 1681.0, 492.0, 285.0, 152.0, 109.0, 77.0, 59.0, 48.0, 40.0, 19.0, 20.0, 17.0, 11.0, 4.0, 7.0, 6.0, 7.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.5, -27.5615234375, -26.623046875, -25.6845703125, -24.74609375, -23.8076171875, -22.869140625, -21.9306640625, -20.9921875, -20.0537109375, -19.115234375, -18.1767578125, -17.23828125, -16.2998046875, -15.361328125, -14.4228515625, -13.484375, -12.5458984375, -11.607421875, -10.6689453125, -9.73046875, -8.7919921875, -7.853515625, -6.9150390625, -5.9765625, -5.0380859375, -4.099609375, -3.1611328125, -2.22265625, -1.2841796875, -0.345703125, 0.5927734375, 1.53125, 2.4697265625, 3.408203125, 4.3466796875, 5.28515625, 6.2236328125, 7.162109375, 8.1005859375, 9.0390625, 9.9775390625, 10.916015625, 11.8544921875, 12.79296875, 13.7314453125, 14.669921875, 15.6083984375, 16.546875, 17.4853515625, 18.423828125, 19.3623046875, 20.30078125, 21.2392578125, 22.177734375, 23.1162109375, 24.0546875, 24.9931640625, 25.931640625, 26.8701171875, 27.80859375, 28.7470703125, 29.685546875, 30.6240234375, 31.5625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 71.0, 531.0, 370.0, 36.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.049037456512451, -6.25663948059082, -5.464241981506348, -4.671844005584717, -3.879446029663086, -3.087048053741455, -2.2946505546569824, -1.5022525787353516, -0.7098546028137207, 0.0825432538986206, 0.8749411106109619, 1.6673388481140137, 2.4597368240356445, 3.2521347999572754, 4.044532299041748, 4.836930274963379, 5.62932825088501, 6.421726226806641, 7.214123725891113, 8.006521224975586, 8.798919677734375, 9.591318130493164, 10.38371467590332, 11.17611312866211, 11.968511581420898, 12.760909080505371, 13.55330753326416, 14.345705032348633, 15.138103485107422, 15.930500984191895, 16.722898483276367, 17.515296936035156, 18.307693481445312, 19.1000919342041, 19.892488479614258, 20.684886932373047, 21.477285385131836, 22.269683837890625, 23.06208038330078, 23.85447883605957, 24.64687728881836, 25.43927574157715, 26.231672286987305, 27.024070739746094, 27.816469192504883, 28.608867645263672, 29.401264190673828, 30.193662643432617, 30.986059188842773, 31.778457641601562, 32.57085418701172, 33.363250732421875, 34.1556510925293, 34.94804763793945, 35.740447998046875, 36.53284454345703, 37.32524108886719, 38.117637634277344, 38.910037994384766, 39.70243453979492, 40.49483108520508, 41.2872314453125, 42.079627990722656, 42.87202453613281, 43.664424896240234]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 8.0, 10.0, 26.0, 16.0, 28.0, 26.0, 28.0, 25.0, 43.0, 42.0, 50.0, 50.0, 40.0, 56.0, 48.0, 57.0, 60.0, 56.0, 46.0, 51.0, 50.0, 30.0, 25.0, 23.0, 19.0, 17.0, 17.0, 8.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.715695858001709, -4.592813014984131, -4.469930648803711, -4.347047805786133, -4.224165439605713, -4.101282596588135, -3.9783999919891357, -3.8555173873901367, -3.7326345443725586, -3.6097519397735596, -3.4868693351745605, -3.3639864921569824, -3.2411038875579834, -3.1182212829589844, -2.9953386783599854, -2.8724560737609863, -2.7495734691619873, -2.6266908645629883, -2.5038082599639893, -2.3809256553649902, -2.258042812347412, -2.135160207748413, -2.012277603149414, -1.889394998550415, -1.7665122747421265, -1.6436296701431274, -1.5207469463348389, -1.3978643417358398, -1.2749817371368408, -1.1520990133285522, -1.0292164087295532, -0.9063337445259094, -0.7834513187408447, -0.6605686545372009, -0.5376859903335571, -0.4148033857345581, -0.2919207215309143, -0.1690380573272705, -0.046155452728271484, 0.07672721147537231, 0.1996098756790161, 0.3224925398826599, 0.4453751742839813, 0.5682578086853027, 0.6911404728889465, 0.8140231370925903, 0.9369057416915894, 1.059788465499878, 1.182671070098877, 1.305553674697876, 1.4284363985061646, 1.5513190031051636, 1.6742017269134521, 1.7970843315124512, 1.9199669361114502, 2.042849540710449, 2.1657323837280273, 2.2886149883270264, 2.4114975929260254, 2.5343804359436035, 2.6572630405426025, 2.7801456451416016, 2.9030282497406006, 3.0259108543395996, 3.1487934589385986]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 4.0, 4.0, 18.0, 15.0, 13.0, 24.0, 15.0, 28.0, 22.0, 30.0, 42.0, 41.0, 41.0, 48.0, 45.0, 46.0, 58.0, 37.0, 52.0, 45.0, 46.0, 37.0, 36.0, 48.0, 34.0, 33.0, 24.0, 27.0, 17.0, 11.0, 14.0, 5.0, 10.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.130859375, -3.030059814453125, -2.92926025390625, -2.828460693359375, -2.7276611328125, -2.626861572265625, -2.52606201171875, -2.425262451171875, -2.324462890625, -2.223663330078125, -2.12286376953125, -2.022064208984375, -1.9212646484375, -1.820465087890625, -1.71966552734375, -1.618865966796875, -1.51806640625, -1.417266845703125, -1.31646728515625, -1.215667724609375, -1.1148681640625, -1.014068603515625, -0.91326904296875, -0.812469482421875, -0.711669921875, -0.610870361328125, -0.51007080078125, -0.409271240234375, -0.3084716796875, -0.207672119140625, -0.10687255859375, -0.006072998046875, 0.0947265625, 0.195526123046875, 0.29632568359375, 0.397125244140625, 0.4979248046875, 0.598724365234375, 0.69952392578125, 0.800323486328125, 0.901123046875, 1.001922607421875, 1.10272216796875, 1.203521728515625, 1.3043212890625, 1.405120849609375, 1.50592041015625, 1.606719970703125, 1.70751953125, 1.808319091796875, 1.90911865234375, 2.009918212890625, 2.1107177734375, 2.211517333984375, 2.31231689453125, 2.413116455078125, 2.513916015625, 2.614715576171875, 2.71551513671875, 2.816314697265625, 2.9171142578125, 3.017913818359375, 3.11871337890625, 3.219512939453125, 3.3203125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 10.0, 12.0, 9.0, 7.0, 15.0, 21.0, 34.0, 44.0, 69.0, 80.0, 194.0, 246.0, 443.0, 717.0, 1210.0, 2063.0, 3530.0, 6463.0, 11394.0, 21964.0, 44275.0, 102210.0, 258662.0, 330251.0, 144422.0, 59153.0, 27877.0, 14544.0, 7911.0, 4400.0, 2554.0, 1483.0, 841.0, 527.0, 314.0, 210.0, 122.0, 72.0, 53.0, 38.0, 24.0, 17.0, 19.0, 22.0, 10.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.43359375, -4.29583740234375, -4.1580810546875, -4.02032470703125, -3.882568359375, -3.74481201171875, -3.6070556640625, -3.46929931640625, -3.33154296875, -3.19378662109375, -3.0560302734375, -2.91827392578125, -2.780517578125, -2.64276123046875, -2.5050048828125, -2.36724853515625, -2.2294921875, -2.09173583984375, -1.9539794921875, -1.81622314453125, -1.678466796875, -1.54071044921875, -1.4029541015625, -1.26519775390625, -1.12744140625, -0.98968505859375, -0.8519287109375, -0.71417236328125, -0.576416015625, -0.43865966796875, -0.3009033203125, -0.16314697265625, -0.025390625, 0.11236572265625, 0.2501220703125, 0.38787841796875, 0.525634765625, 0.66339111328125, 0.8011474609375, 0.93890380859375, 1.07666015625, 1.21441650390625, 1.3521728515625, 1.48992919921875, 1.627685546875, 1.76544189453125, 1.9031982421875, 2.04095458984375, 2.1787109375, 2.31646728515625, 2.4542236328125, 2.59197998046875, 2.729736328125, 2.86749267578125, 3.0052490234375, 3.14300537109375, 3.28076171875, 3.41851806640625, 3.5562744140625, 3.69403076171875, 3.831787109375, 3.96954345703125, 4.1072998046875, 4.24505615234375, 4.3828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 10.0, 15.0, 20.0, 25.0, 22.0, 24.0, 27.0, 18.0, 39.0, 41.0, 39.0, 49.0, 71.0, 93.0, 154.0, 264.0, 1367.0, 232.0, 105.0, 60.0, 58.0, 44.0, 32.0, 37.0, 29.0, 23.0, 23.0, 16.0, 15.0, 14.0, 11.0, 11.0, 8.0, 7.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.5234375, -12.158203125, -11.79296875, -11.427734375, -11.0625, -10.697265625, -10.33203125, -9.966796875, -9.6015625, -9.236328125, -8.87109375, -8.505859375, -8.140625, -7.775390625, -7.41015625, -7.044921875, -6.6796875, -6.314453125, -5.94921875, -5.583984375, -5.21875, -4.853515625, -4.48828125, -4.123046875, -3.7578125, -3.392578125, -3.02734375, -2.662109375, -2.296875, -1.931640625, -1.56640625, -1.201171875, -0.8359375, -0.470703125, -0.10546875, 0.259765625, 0.625, 0.990234375, 1.35546875, 1.720703125, 2.0859375, 2.451171875, 2.81640625, 3.181640625, 3.546875, 3.912109375, 4.27734375, 4.642578125, 5.0078125, 5.373046875, 5.73828125, 6.103515625, 6.46875, 6.833984375, 7.19921875, 7.564453125, 7.9296875, 8.294921875, 8.66015625, 9.025390625, 9.390625, 9.755859375, 10.12109375, 10.486328125, 10.8515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 10.0, 11.0, 14.0, 17.0, 16.0, 25.0, 44.0, 61.0, 93.0, 163.0, 310.0, 670.0, 1613.0, 4652.0, 17052.0, 90428.0, 1067516.0, 1785827.0, 143553.0, 23634.0, 6167.0, 2079.0, 810.0, 349.0, 181.0, 127.0, 72.0, 53.0, 38.0, 31.0, 18.0, 18.0, 19.0, 7.0, 7.0, 3.0, 1.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.3023681640625, -11.893798828125, -11.4852294921875, -11.07666015625, -10.6680908203125, -10.259521484375, -9.8509521484375, -9.4423828125, -9.0338134765625, -8.625244140625, -8.2166748046875, -7.80810546875, -7.3995361328125, -6.990966796875, -6.5823974609375, -6.173828125, -5.7652587890625, -5.356689453125, -4.9481201171875, -4.53955078125, -4.1309814453125, -3.722412109375, -3.3138427734375, -2.9052734375, -2.4967041015625, -2.088134765625, -1.6795654296875, -1.27099609375, -0.8624267578125, -0.453857421875, -0.0452880859375, 0.36328125, 0.7718505859375, 1.180419921875, 1.5889892578125, 1.99755859375, 2.4061279296875, 2.814697265625, 3.2232666015625, 3.6318359375, 4.0404052734375, 4.448974609375, 4.8575439453125, 5.26611328125, 5.6746826171875, 6.083251953125, 6.4918212890625, 6.900390625, 7.3089599609375, 7.717529296875, 8.1260986328125, 8.53466796875, 8.9432373046875, 9.351806640625, 9.7603759765625, 10.1689453125, 10.5775146484375, 10.986083984375, 11.3946533203125, 11.80322265625, 12.2117919921875, 12.620361328125, 13.0289306640625, 13.4375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 14.0, 30.0, 87.0, 196.0, 260.0, 249.0, 117.0, 46.0, 12.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.437591552734375, -18.315786361694336, -16.193981170654297, -14.072175979614258, -11.950370788574219, -9.82856559753418, -7.706760406494141, -5.584955215454102, -3.4631500244140625, -1.3413448333740234, 0.7804603576660156, 2.9022655487060547, 5.024070739746094, 7.145875930786133, 9.267681121826172, 11.389486312866211, 13.51129150390625, 15.633096694946289, 17.754901885986328, 19.876707077026367, 21.998512268066406, 24.120317459106445, 26.242122650146484, 28.363927841186523, 30.485733032226562, 32.60753631591797, 34.72934341430664, 36.85115051269531, 38.97295379638672, 41.094757080078125, 43.2165641784668, 45.33837127685547, 47.460166931152344, 49.58197021484375, 51.70377731323242, 53.825584411621094, 55.9473876953125, 58.069190979003906, 60.19099807739258, 62.31280517578125, 64.43460845947266, 66.55641174316406, 68.67822265625, 70.8000259399414, 72.92182922363281, 75.04363250732422, 77.16543579101562, 79.28724670410156, 81.40904998779297, 83.53085327148438, 85.65266418457031, 87.77446746826172, 89.89627075195312, 92.01807403564453, 94.13987731933594, 96.26168823242188, 98.38349151611328, 100.50529479980469, 102.62710571289062, 104.74890899658203, 106.87071228027344, 108.99251556396484, 111.11431884765625, 113.23612976074219, 115.3579330444336]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 3.0, 8.0, 5.0, 5.0, 7.0, 13.0, 12.0, 30.0, 20.0, 27.0, 19.0, 26.0, 28.0, 27.0, 32.0, 30.0, 39.0, 35.0, 42.0, 36.0, 42.0, 50.0, 42.0, 29.0, 25.0, 38.0, 28.0, 38.0, 41.0, 23.0, 24.0, 32.0, 16.0, 22.0, 20.0, 14.0, 11.0, 16.0, 15.0, 5.0, 11.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.983036041259766, -32.884639739990234, -31.786243438720703, -30.687847137451172, -29.58945083618164, -28.49105453491211, -27.39266014099121, -26.29426383972168, -25.19586753845215, -24.097471237182617, -22.999074935913086, -21.900678634643555, -20.802284240722656, -19.703887939453125, -18.605491638183594, -17.507095336914062, -16.40869903564453, -15.310302734375, -14.211906433105469, -13.113511085510254, -12.015114784240723, -10.916718482971191, -9.818323135375977, -8.719926834106445, -7.621530532836914, -6.523134231567383, -5.42473840713501, -4.326342582702637, -3.2279462814331055, -2.129549980163574, -1.0311541557312012, 0.06724166870117188, 1.1656341552734375, 2.2640302181243896, 3.362426280975342, 4.460822105407715, 5.559218406677246, 6.657614707946777, 7.75601053237915, 8.854406356811523, 9.952802658081055, 11.051198959350586, 12.149595260620117, 13.247990608215332, 14.346386909484863, 15.444783210754395, 16.54317855834961, 17.64157485961914, 18.739971160888672, 19.838367462158203, 20.936763763427734, 22.035160064697266, 23.133556365966797, 24.231952667236328, 25.330347061157227, 26.428743362426758, 27.52713966369629, 28.62553596496582, 29.72393226623535, 30.822328567504883, 31.92072296142578, 33.01911926269531, 34.117515563964844, 35.215911865234375, 36.314308166503906]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 13.0, 10.0, 16.0, 17.0, 20.0, 23.0, 24.0, 32.0, 23.0, 31.0, 32.0, 33.0, 47.0, 43.0, 41.0, 46.0, 43.0, 43.0, 48.0, 38.0, 52.0, 30.0, 28.0, 31.0, 32.0, 38.0, 17.0, 23.0, 18.0, 14.0, 12.0, 9.0, 12.0, 7.0, 5.0, 4.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.11328125, -3.02008056640625, -2.9268798828125, -2.83367919921875, -2.740478515625, -2.64727783203125, -2.5540771484375, -2.46087646484375, -2.36767578125, -2.27447509765625, -2.1812744140625, -2.08807373046875, -1.994873046875, -1.90167236328125, -1.8084716796875, -1.71527099609375, -1.6220703125, -1.52886962890625, -1.4356689453125, -1.34246826171875, -1.249267578125, -1.15606689453125, -1.0628662109375, -0.96966552734375, -0.87646484375, -0.78326416015625, -0.6900634765625, -0.59686279296875, -0.503662109375, -0.41046142578125, -0.3172607421875, -0.22406005859375, -0.130859375, -0.03765869140625, 0.0555419921875, 0.14874267578125, 0.241943359375, 0.33514404296875, 0.4283447265625, 0.52154541015625, 0.61474609375, 0.70794677734375, 0.8011474609375, 0.89434814453125, 0.987548828125, 1.08074951171875, 1.1739501953125, 1.26715087890625, 1.3603515625, 1.45355224609375, 1.5467529296875, 1.63995361328125, 1.733154296875, 1.82635498046875, 1.9195556640625, 2.01275634765625, 2.10595703125, 2.19915771484375, 2.2923583984375, 2.38555908203125, 2.478759765625, 2.57196044921875, 2.6651611328125, 2.75836181640625, 2.8515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 10.0, 11.0, 23.0, 19.0, 25.0, 38.0, 50.0, 78.0, 113.0, 183.0, 300.0, 434.0, 790.0, 1338.0, 2259.0, 4067.0, 7610.0, 14572.0, 30216.0, 68113.0, 188925.0, 902507.0, 2156379.0, 569452.0, 137882.0, 54628.0, 25512.0, 12986.0, 6859.0, 3766.0, 2024.0, 1228.0, 716.0, 433.0, 238.0, 162.0, 100.0, 79.0, 49.0, 25.0, 24.0, 23.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.31640625, -6.13262939453125, -5.9488525390625, -5.76507568359375, -5.581298828125, -5.39752197265625, -5.2137451171875, -5.02996826171875, -4.84619140625, -4.66241455078125, -4.4786376953125, -4.29486083984375, -4.111083984375, -3.92730712890625, -3.7435302734375, -3.55975341796875, -3.3759765625, -3.19219970703125, -3.0084228515625, -2.82464599609375, -2.640869140625, -2.45709228515625, -2.2733154296875, -2.08953857421875, -1.90576171875, -1.72198486328125, -1.5382080078125, -1.35443115234375, -1.170654296875, -0.98687744140625, -0.8031005859375, -0.61932373046875, -0.435546875, -0.25177001953125, -0.0679931640625, 0.11578369140625, 0.299560546875, 0.48333740234375, 0.6671142578125, 0.85089111328125, 1.03466796875, 1.21844482421875, 1.4022216796875, 1.58599853515625, 1.769775390625, 1.95355224609375, 2.1373291015625, 2.32110595703125, 2.5048828125, 2.68865966796875, 2.8724365234375, 3.05621337890625, 3.239990234375, 3.42376708984375, 3.6075439453125, 3.79132080078125, 3.97509765625, 4.15887451171875, 4.3426513671875, 4.52642822265625, 4.710205078125, 4.89398193359375, 5.0777587890625, 5.26153564453125, 5.4453125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 9.0, 21.0, 19.0, 30.0, 31.0, 51.0, 72.0, 112.0, 144.0, 230.0, 300.0, 436.0, 629.0, 606.0, 425.0, 281.0, 187.0, 128.0, 89.0, 63.0, 43.0, 41.0, 29.0, 26.0, 10.0, 11.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.9256591796875, -9.632568359375, -9.3394775390625, -9.04638671875, -8.7532958984375, -8.460205078125, -8.1671142578125, -7.8740234375, -7.5809326171875, -7.287841796875, -6.9947509765625, -6.70166015625, -6.4085693359375, -6.115478515625, -5.8223876953125, -5.529296875, -5.2362060546875, -4.943115234375, -4.6500244140625, -4.35693359375, -4.0638427734375, -3.770751953125, -3.4776611328125, -3.1845703125, -2.8914794921875, -2.598388671875, -2.3052978515625, -2.01220703125, -1.7191162109375, -1.426025390625, -1.1329345703125, -0.83984375, -0.5467529296875, -0.253662109375, 0.0394287109375, 0.33251953125, 0.6256103515625, 0.918701171875, 1.2117919921875, 1.5048828125, 1.7979736328125, 2.091064453125, 2.3841552734375, 2.67724609375, 2.9703369140625, 3.263427734375, 3.5565185546875, 3.849609375, 4.1427001953125, 4.435791015625, 4.7288818359375, 5.02197265625, 5.3150634765625, 5.608154296875, 5.9012451171875, 6.1943359375, 6.4874267578125, 6.780517578125, 7.0736083984375, 7.36669921875, 7.6597900390625, 7.952880859375, 8.2459716796875, 8.5390625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 12.0, 10.0, 19.0, 15.0, 29.0, 40.0, 49.0, 81.0, 120.0, 156.0, 256.0, 432.0, 714.0, 1251.0, 2293.0, 4483.0, 9227.0, 20490.0, 50328.0, 140840.0, 536635.0, 2225155.0, 882601.0, 202152.0, 66888.0, 26325.0, 11594.0, 5496.0, 2838.0, 1520.0, 839.0, 516.0, 266.0, 180.0, 143.0, 79.0, 53.0, 42.0, 27.0, 18.0, 22.0, 14.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.802490234375, -8.47216796875, -8.141845703125, -7.8115234375, -7.481201171875, -7.15087890625, -6.820556640625, -6.490234375, -6.159912109375, -5.82958984375, -5.499267578125, -5.1689453125, -4.838623046875, -4.50830078125, -4.177978515625, -3.84765625, -3.517333984375, -3.18701171875, -2.856689453125, -2.5263671875, -2.196044921875, -1.86572265625, -1.535400390625, -1.205078125, -0.874755859375, -0.54443359375, -0.214111328125, 0.1162109375, 0.446533203125, 0.77685546875, 1.107177734375, 1.4375, 1.767822265625, 2.09814453125, 2.428466796875, 2.7587890625, 3.089111328125, 3.41943359375, 3.749755859375, 4.080078125, 4.410400390625, 4.74072265625, 5.071044921875, 5.4013671875, 5.731689453125, 6.06201171875, 6.392333984375, 6.72265625, 7.052978515625, 7.38330078125, 7.713623046875, 8.0439453125, 8.374267578125, 8.70458984375, 9.034912109375, 9.365234375, 9.695556640625, 10.02587890625, 10.356201171875, 10.6865234375, 11.016845703125, 11.34716796875, 11.677490234375, 12.0078125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 4.0, 29.0, 88.0, 191.0, 285.0, 207.0, 133.0, 47.0, 18.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.6121826171875, -140.6797332763672, -136.74728393554688, -132.81483459472656, -128.88238525390625, -124.94993591308594, -121.01748657226562, -117.08503723144531, -113.152587890625, -109.22013854980469, -105.28768920898438, -101.35523986816406, -97.42279052734375, -93.49034118652344, -89.55789184570312, -85.62544250488281, -81.6929931640625, -77.76054382324219, -73.82809448242188, -69.89564514160156, -65.96319580078125, -62.03074645996094, -58.098297119140625, -54.16584777832031, -50.23340606689453, -46.30095672607422, -42.368507385253906, -38.436058044433594, -34.50360870361328, -30.5711612701416, -26.63871192932129, -22.706262588500977, -18.77381134033203, -14.841361999511719, -10.908912658691406, -6.97646427154541, -3.0440149307250977, 0.8884334564208984, 4.820882797241211, 8.753332138061523, 12.685781478881836, 16.61823081970215, 20.55068016052246, 24.48312759399414, 28.415576934814453, 32.348026275634766, 36.28047561645508, 40.21292495727539, 44.1453742980957, 48.077823638916016, 52.01027297973633, 55.94272232055664, 59.87517166137695, 63.8076171875, 67.74006652832031, 71.67251586914062, 75.60496520996094, 79.53741455078125, 83.46986389160156, 87.40231323242188, 91.33476257324219, 95.2672119140625, 99.19966125488281, 103.13211059570312, 107.06455993652344]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 10.0, 10.0, 15.0, 21.0, 14.0, 21.0, 10.0, 27.0, 22.0, 27.0, 24.0, 29.0, 34.0, 31.0, 33.0, 47.0, 35.0, 39.0, 41.0, 32.0, 40.0, 29.0, 39.0, 40.0, 26.0, 28.0, 20.0, 31.0, 28.0, 32.0, 18.0, 18.0, 22.0, 12.0, 15.0, 10.0, 18.0, 10.0, 10.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-26.393157958984375, -25.594867706298828, -24.79657745361328, -23.998289108276367, -23.19999885559082, -22.401708602905273, -21.60342025756836, -20.805130004882812, -20.006839752197266, -19.20854949951172, -18.410259246826172, -17.611970901489258, -16.81368064880371, -16.015390396118164, -15.217101097106934, -14.418811798095703, -13.620521545410156, -12.82223129272461, -12.023941993713379, -11.225652694702148, -10.427362442016602, -9.629072189331055, -8.830782890319824, -8.032493591308594, -7.234203338623047, -6.435913562774658, -5.6376237869262695, -4.839334011077881, -4.041044235229492, -3.2427544593811035, -2.444464683532715, -1.6461749076843262, -0.8478851318359375, -0.04959535598754883, 0.7486944198608398, 1.5469841957092285, 2.345273971557617, 3.143563747406006, 3.9418535232543945, 4.740143299102783, 5.538433074951172, 6.3367228507995605, 7.135012626647949, 7.933302402496338, 8.731592178344727, 9.529882431030273, 10.328171730041504, 11.126461029052734, 11.924751281738281, 12.723041534423828, 13.521330833435059, 14.319620132446289, 15.117910385131836, 15.916200637817383, 16.714488983154297, 17.512779235839844, 18.31106948852539, 19.109359741210938, 19.907649993896484, 20.7059383392334, 21.504228591918945, 22.302518844604492, 23.100807189941406, 23.899097442626953, 24.6973876953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 4.0, 7.0, 11.0, 14.0, 15.0, 10.0, 27.0, 16.0, 10.0, 16.0, 18.0, 24.0, 23.0, 26.0, 32.0, 30.0, 31.0, 49.0, 39.0, 37.0, 46.0, 41.0, 28.0, 43.0, 47.0, 34.0, 47.0, 23.0, 17.0, 22.0, 30.0, 24.0, 26.0, 20.0, 21.0, 18.0, 9.0, 14.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.623046875, -2.5338134765625, -2.444580078125, -2.3553466796875, -2.26611328125, -2.1768798828125, -2.087646484375, -1.9984130859375, -1.9091796875, -1.8199462890625, -1.730712890625, -1.6414794921875, -1.55224609375, -1.4630126953125, -1.373779296875, -1.2845458984375, -1.1953125, -1.1060791015625, -1.016845703125, -0.9276123046875, -0.83837890625, -0.7491455078125, -0.659912109375, -0.5706787109375, -0.4814453125, -0.3922119140625, -0.302978515625, -0.2137451171875, -0.12451171875, -0.0352783203125, 0.053955078125, 0.1431884765625, 0.232421875, 0.3216552734375, 0.410888671875, 0.5001220703125, 0.58935546875, 0.6785888671875, 0.767822265625, 0.8570556640625, 0.9462890625, 1.0355224609375, 1.124755859375, 1.2139892578125, 1.30322265625, 1.3924560546875, 1.481689453125, 1.5709228515625, 1.66015625, 1.7493896484375, 1.838623046875, 1.9278564453125, 2.01708984375, 2.1063232421875, 2.195556640625, 2.2847900390625, 2.3740234375, 2.4632568359375, 2.552490234375, 2.6417236328125, 2.73095703125, 2.8201904296875, 2.909423828125, 2.9986572265625, 3.087890625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 6.0, 11.0, 27.0, 26.0, 50.0, 60.0, 127.0, 201.0, 313.0, 516.0, 801.0, 1301.0, 2126.0, 3409.0, 6006.0, 10235.0, 17469.0, 30943.0, 54355.0, 91485.0, 142296.0, 186793.0, 178527.0, 128980.0, 80939.0, 47089.0, 26803.0, 15513.0, 9034.0, 5162.0, 3089.0, 1791.0, 1102.0, 737.0, 438.0, 251.0, 196.0, 112.0, 79.0, 62.0, 36.0, 22.0, 12.0, 9.0, 1.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-8.6796875, -8.4234619140625, -8.167236328125, -7.9110107421875, -7.65478515625, -7.3985595703125, -7.142333984375, -6.8861083984375, -6.6298828125, -6.3736572265625, -6.117431640625, -5.8612060546875, -5.60498046875, -5.3487548828125, -5.092529296875, -4.8363037109375, -4.580078125, -4.3238525390625, -4.067626953125, -3.8114013671875, -3.55517578125, -3.2989501953125, -3.042724609375, -2.7864990234375, -2.5302734375, -2.2740478515625, -2.017822265625, -1.7615966796875, -1.50537109375, -1.2491455078125, -0.992919921875, -0.7366943359375, -0.48046875, -0.2242431640625, 0.031982421875, 0.2882080078125, 0.54443359375, 0.8006591796875, 1.056884765625, 1.3131103515625, 1.5693359375, 1.8255615234375, 2.081787109375, 2.3380126953125, 2.59423828125, 2.8504638671875, 3.106689453125, 3.3629150390625, 3.619140625, 3.8753662109375, 4.131591796875, 4.3878173828125, 4.64404296875, 4.9002685546875, 5.156494140625, 5.4127197265625, 5.6689453125, 5.9251708984375, 6.181396484375, 6.4376220703125, 6.69384765625, 6.9500732421875, 7.206298828125, 7.4625244140625, 7.71875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 3.0, 10.0, 8.0, 12.0, 11.0, 9.0, 9.0, 13.0, 13.0, 17.0, 18.0, 30.0, 24.0, 26.0, 26.0, 47.0, 29.0, 41.0, 48.0, 30.0, 38.0, 894.0, 201.0, 38.0, 32.0, 39.0, 38.0, 26.0, 29.0, 27.0, 33.0, 30.0, 21.0, 30.0, 17.0, 19.0, 14.0, 16.0, 8.0, 10.0, 6.0, 11.0, 6.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.625, -2.54779052734375, -2.4705810546875, -2.39337158203125, -2.316162109375, -2.23895263671875, -2.1617431640625, -2.08453369140625, -2.00732421875, -1.93011474609375, -1.8529052734375, -1.77569580078125, -1.698486328125, -1.62127685546875, -1.5440673828125, -1.46685791015625, -1.3896484375, -1.31243896484375, -1.2352294921875, -1.15802001953125, -1.080810546875, -1.00360107421875, -0.9263916015625, -0.84918212890625, -0.77197265625, -0.69476318359375, -0.6175537109375, -0.54034423828125, -0.463134765625, -0.38592529296875, -0.3087158203125, -0.23150634765625, -0.154296875, -0.07708740234375, 0.0001220703125, 0.07733154296875, 0.154541015625, 0.23175048828125, 0.3089599609375, 0.38616943359375, 0.46337890625, 0.54058837890625, 0.6177978515625, 0.69500732421875, 0.772216796875, 0.84942626953125, 0.9266357421875, 1.00384521484375, 1.0810546875, 1.15826416015625, 1.2354736328125, 1.31268310546875, 1.389892578125, 1.46710205078125, 1.5443115234375, 1.62152099609375, 1.69873046875, 1.77593994140625, 1.8531494140625, 1.93035888671875, 2.007568359375, 2.08477783203125, 2.1619873046875, 2.23919677734375, 2.31640625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 12.0, 19.0, 18.0, 37.0, 57.0, 84.0, 124.0, 139.0, 214.0, 309.0, 498.0, 765.0, 1101.0, 1699.0, 2667.0, 4225.0, 7206.0, 12189.0, 21968.0, 40414.0, 78441.0, 169929.0, 439834.0, 760370.0, 295123.0, 124186.0, 60523.0, 31568.0, 17451.0, 10052.0, 5874.0, 3548.0, 2258.0, 1337.0, 936.0, 615.0, 403.0, 263.0, 199.0, 140.0, 81.0, 66.0, 43.0, 37.0, 32.0, 18.0, 17.0, 13.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.10699462890625, -4.9327392578125, -4.75848388671875, -4.584228515625, -4.40997314453125, -4.2357177734375, -4.06146240234375, -3.88720703125, -3.71295166015625, -3.5386962890625, -3.36444091796875, -3.190185546875, -3.01593017578125, -2.8416748046875, -2.66741943359375, -2.4931640625, -2.31890869140625, -2.1446533203125, -1.97039794921875, -1.796142578125, -1.62188720703125, -1.4476318359375, -1.27337646484375, -1.09912109375, -0.92486572265625, -0.7506103515625, -0.57635498046875, -0.402099609375, -0.22784423828125, -0.0535888671875, 0.12066650390625, 0.294921875, 0.46917724609375, 0.6434326171875, 0.81768798828125, 0.991943359375, 1.16619873046875, 1.3404541015625, 1.51470947265625, 1.68896484375, 1.86322021484375, 2.0374755859375, 2.21173095703125, 2.385986328125, 2.56024169921875, 2.7344970703125, 2.90875244140625, 3.0830078125, 3.25726318359375, 3.4315185546875, 3.60577392578125, 3.780029296875, 3.95428466796875, 4.1285400390625, 4.30279541015625, 4.47705078125, 4.65130615234375, 4.8255615234375, 4.99981689453125, 5.174072265625, 5.34832763671875, 5.5225830078125, 5.69683837890625, 5.87109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 9.0, 9.0, 17.0, 10.0, 17.0, 21.0, 31.0, 49.0, 51.0, 52.0, 79.0, 89.0, 100.0, 83.0, 57.0, 75.0, 43.0, 37.0, 39.0, 24.0, 21.0, 11.0, 10.0, 9.0, 9.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.500701904296875, -2.42327880859375, -2.345855712890625, -2.2684326171875, -2.191009521484375, -2.11358642578125, -2.036163330078125, -1.958740234375, -1.881317138671875, -1.80389404296875, -1.726470947265625, -1.6490478515625, -1.571624755859375, -1.49420166015625, -1.416778564453125, -1.33935546875, -1.261932373046875, -1.18450927734375, -1.107086181640625, -1.0296630859375, -0.952239990234375, -0.87481689453125, -0.797393798828125, -0.719970703125, -0.642547607421875, -0.56512451171875, -0.487701416015625, -0.4102783203125, -0.332855224609375, -0.25543212890625, -0.178009033203125, -0.1005859375, -0.023162841796875, 0.05426025390625, 0.131683349609375, 0.2091064453125, 0.286529541015625, 0.36395263671875, 0.441375732421875, 0.518798828125, 0.596221923828125, 0.67364501953125, 0.751068115234375, 0.8284912109375, 0.905914306640625, 0.98333740234375, 1.060760498046875, 1.13818359375, 1.215606689453125, 1.29302978515625, 1.370452880859375, 1.4478759765625, 1.525299072265625, 1.60272216796875, 1.680145263671875, 1.757568359375, 1.834991455078125, 1.91241455078125, 1.989837646484375, 2.0672607421875, 2.144683837890625, 2.22210693359375, 2.299530029296875, 2.376953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 8.0, 30.0, 27.0, 18.0, 36.0, 46.0, 67.0, 110.0, 130.0, 222.0, 404.0, 1269.0, 9154.0, 410643.0, 611623.0, 12026.0, 1482.0, 470.0, 226.0, 129.0, 100.0, 88.0, 56.0, 39.0, 36.0, 13.0, 17.0, 12.0, 10.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.890625, -30.829345703125, -29.76806640625, -28.706787109375, -27.6455078125, -26.584228515625, -25.52294921875, -24.461669921875, -23.400390625, -22.339111328125, -21.27783203125, -20.216552734375, -19.1552734375, -18.093994140625, -17.03271484375, -15.971435546875, -14.91015625, -13.848876953125, -12.78759765625, -11.726318359375, -10.6650390625, -9.603759765625, -8.54248046875, -7.481201171875, -6.419921875, -5.358642578125, -4.29736328125, -3.236083984375, -2.1748046875, -1.113525390625, -0.05224609375, 1.009033203125, 2.0703125, 3.131591796875, 4.19287109375, 5.254150390625, 6.3154296875, 7.376708984375, 8.43798828125, 9.499267578125, 10.560546875, 11.621826171875, 12.68310546875, 13.744384765625, 14.8056640625, 15.866943359375, 16.92822265625, 17.989501953125, 19.05078125, 20.112060546875, 21.17333984375, 22.234619140625, 23.2958984375, 24.357177734375, 25.41845703125, 26.479736328125, 27.541015625, 28.602294921875, 29.66357421875, 30.724853515625, 31.7861328125, 32.847412109375, 33.90869140625, 34.969970703125, 36.03125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 5.0, 7.0, 9.0, 17.0, 19.0, 31.0, 25.0, 57.0, 89.0, 91.0, 92.0, 119.0, 116.0, 84.0, 68.0, 44.0, 36.0, 25.0, 23.0, 12.0, 8.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.301427841186523, -4.159679412841797, -4.01793098449707, -3.8761823177337646, -3.734433889389038, -3.5926852226257324, -3.450936794281006, -3.3091883659362793, -3.1674399375915527, -3.025691509246826, -2.8839428424835205, -2.742194414138794, -2.6004459857940674, -2.4586973190307617, -2.316948890686035, -2.1752004623413086, -2.033451795578003, -1.8917032480239868, -1.7499548196792603, -1.6082062721252441, -1.4664578437805176, -1.3247092962265015, -1.1829607486724854, -1.0412123203277588, -0.8994637727737427, -0.7577152848243713, -0.615966796875, -0.4742182493209839, -0.33246976137161255, -0.1907212734222412, -0.0489727258682251, 0.09277576208114624, 0.23452425003051758, 0.3762727379798889, 0.5180212259292603, 0.6597697734832764, 0.8015182614326477, 0.943266749382019, 1.0850152969360352, 1.2267637252807617, 1.3685122728347778, 1.510260820388794, 1.6520092487335205, 1.7937577962875366, 1.9355063438415527, 2.0772547721862793, 2.219003200531006, 2.3607518672943115, 2.502500295639038, 2.6442487239837646, 2.7859973907470703, 2.927745819091797, 3.0694942474365234, 3.21124267578125, 3.3529913425445557, 3.4947397708892822, 3.636488437652588, 3.7782368659973145, 3.91998553276062, 4.061734199523926, 4.203482627868652, 4.345231056213379, 4.4869794845581055, 4.628727912902832, 4.770476341247559]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 4.0, 6.0, 8.0, 14.0, 14.0, 27.0, 21.0, 19.0, 25.0, 22.0, 28.0, 29.0, 30.0, 30.0, 48.0, 49.0, 42.0, 33.0, 46.0, 48.0, 41.0, 51.0, 50.0, 25.0, 32.0, 36.0, 33.0, 33.0, 28.0, 27.0, 21.0, 12.0, 13.0, 10.0, 7.0, 9.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.653494358062744, -3.54390549659729, -3.434316396713257, -3.3247275352478027, -3.2151384353637695, -3.1055495738983154, -2.9959607124328613, -2.886371612548828, -2.776782512664795, -2.667193651199341, -2.5576045513153076, -2.4480156898498535, -2.3384265899658203, -2.228837728500366, -2.119248867034912, -2.009659767150879, -1.9000709056854248, -1.7904819250106812, -1.6808929443359375, -1.5713040828704834, -1.4617149829864502, -1.352126121520996, -1.2425371408462524, -1.1329481601715088, -1.0233591794967651, -0.9137701988220215, -0.8041812181472778, -0.694592297077179, -0.5850033164024353, -0.47541433572769165, -0.3658254146575928, -0.2562364339828491, -0.14664721488952637, -0.03705824911594391, 0.07253071665763855, 0.18211966753005981, 0.29170864820480347, 0.4012976288795471, 0.510886549949646, 0.6204755306243896, 0.7300645112991333, 0.839653491973877, 0.9492424726486206, 1.0588314533233643, 1.1684203147888184, 1.2780094146728516, 1.3875982761383057, 1.4971872568130493, 1.606776237487793, 1.7163652181625366, 1.8259541988372803, 1.9355430603027344, 2.0451321601867676, 2.1547210216522217, 2.264309883117676, 2.373898983001709, 2.483488082885742, 2.5930769443511963, 2.7026660442352295, 2.8122549057006836, 2.921844005584717, 3.031432867050171, 3.141021728515625, 3.250610828399658, 3.3601996898651123]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 11.0, 19.0, 15.0, 16.0, 8.0, 14.0, 25.0, 18.0, 25.0, 18.0, 27.0, 28.0, 33.0, 36.0, 36.0, 29.0, 39.0, 49.0, 40.0, 29.0, 43.0, 33.0, 40.0, 41.0, 28.0, 28.0, 40.0, 33.0, 16.0, 29.0, 23.0, 17.0, 14.0, 7.0, 12.0, 12.0, 10.0, 9.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.74609375, -2.656829833984375, -2.56756591796875, -2.478302001953125, -2.3890380859375, -2.299774169921875, -2.21051025390625, -2.121246337890625, -2.031982421875, -1.942718505859375, -1.85345458984375, -1.764190673828125, -1.6749267578125, -1.585662841796875, -1.49639892578125, -1.407135009765625, -1.31787109375, -1.228607177734375, -1.13934326171875, -1.050079345703125, -0.9608154296875, -0.871551513671875, -0.78228759765625, -0.693023681640625, -0.603759765625, -0.514495849609375, -0.42523193359375, -0.335968017578125, -0.2467041015625, -0.157440185546875, -0.06817626953125, 0.021087646484375, 0.1103515625, 0.199615478515625, 0.28887939453125, 0.378143310546875, 0.4674072265625, 0.556671142578125, 0.64593505859375, 0.735198974609375, 0.824462890625, 0.913726806640625, 1.00299072265625, 1.092254638671875, 1.1815185546875, 1.270782470703125, 1.36004638671875, 1.449310302734375, 1.53857421875, 1.627838134765625, 1.71710205078125, 1.806365966796875, 1.8956298828125, 1.984893798828125, 2.07415771484375, 2.163421630859375, 2.252685546875, 2.341949462890625, 2.43121337890625, 2.520477294921875, 2.6097412109375, 2.699005126953125, 2.78826904296875, 2.877532958984375, 2.966796875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 10.0, 10.0, 20.0, 23.0, 30.0, 33.0, 64.0, 83.0, 143.0, 216.0, 325.0, 546.0, 796.0, 1358.0, 2358.0, 3989.0, 7017.0, 12667.0, 23957.0, 48751.0, 107124.0, 242464.0, 307761.0, 152200.0, 66859.0, 31972.0, 16561.0, 8947.0, 4874.0, 2896.0, 1733.0, 1027.0, 593.0, 412.0, 247.0, 149.0, 112.0, 63.0, 52.0, 30.0, 26.0, 14.0, 17.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.84765625, -2.75640869140625, -2.6651611328125, -2.57391357421875, -2.482666015625, -2.39141845703125, -2.3001708984375, -2.20892333984375, -2.11767578125, -2.02642822265625, -1.9351806640625, -1.84393310546875, -1.752685546875, -1.66143798828125, -1.5701904296875, -1.47894287109375, -1.3876953125, -1.29644775390625, -1.2052001953125, -1.11395263671875, -1.022705078125, -0.93145751953125, -0.8402099609375, -0.74896240234375, -0.65771484375, -0.56646728515625, -0.4752197265625, -0.38397216796875, -0.292724609375, -0.20147705078125, -0.1102294921875, -0.01898193359375, 0.072265625, 0.16351318359375, 0.2547607421875, 0.34600830078125, 0.437255859375, 0.52850341796875, 0.6197509765625, 0.71099853515625, 0.80224609375, 0.89349365234375, 0.9847412109375, 1.07598876953125, 1.167236328125, 1.25848388671875, 1.3497314453125, 1.44097900390625, 1.5322265625, 1.62347412109375, 1.7147216796875, 1.80596923828125, 1.897216796875, 1.98846435546875, 2.0797119140625, 2.17095947265625, 2.26220703125, 2.35345458984375, 2.4447021484375, 2.53594970703125, 2.627197265625, 2.71844482421875, 2.8096923828125, 2.90093994140625, 2.9921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 10.0, 4.0, 12.0, 4.0, 15.0, 13.0, 14.0, 14.0, 22.0, 24.0, 42.0, 47.0, 38.0, 59.0, 62.0, 103.0, 258.0, 1497.0, 253.0, 121.0, 69.0, 57.0, 51.0, 44.0, 37.0, 36.0, 18.0, 26.0, 21.0, 20.0, 16.0, 10.0, 14.0, 7.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1640625, -10.743896484375, -10.32373046875, -9.903564453125, -9.4833984375, -9.063232421875, -8.64306640625, -8.222900390625, -7.802734375, -7.382568359375, -6.96240234375, -6.542236328125, -6.1220703125, -5.701904296875, -5.28173828125, -4.861572265625, -4.44140625, -4.021240234375, -3.60107421875, -3.180908203125, -2.7607421875, -2.340576171875, -1.92041015625, -1.500244140625, -1.080078125, -0.659912109375, -0.23974609375, 0.180419921875, 0.6005859375, 1.020751953125, 1.44091796875, 1.861083984375, 2.28125, 2.701416015625, 3.12158203125, 3.541748046875, 3.9619140625, 4.382080078125, 4.80224609375, 5.222412109375, 5.642578125, 6.062744140625, 6.48291015625, 6.903076171875, 7.3232421875, 7.743408203125, 8.16357421875, 8.583740234375, 9.00390625, 9.424072265625, 9.84423828125, 10.264404296875, 10.6845703125, 11.104736328125, 11.52490234375, 11.945068359375, 12.365234375, 12.785400390625, 13.20556640625, 13.625732421875, 14.0458984375, 14.466064453125, 14.88623046875, 15.306396484375, 15.7265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 8.0, 13.0, 13.0, 9.0, 16.0, 39.0, 41.0, 49.0, 81.0, 118.0, 228.0, 499.0, 1352.0, 6117.0, 67997.0, 2380960.0, 660090.0, 23282.0, 3059.0, 852.0, 360.0, 189.0, 125.0, 56.0, 44.0, 22.0, 26.0, 16.0, 9.0, 7.0, 10.0, 10.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.4365234375, -15.935546875, -15.4345703125, -14.93359375, -14.4326171875, -13.931640625, -13.4306640625, -12.9296875, -12.4287109375, -11.927734375, -11.4267578125, -10.92578125, -10.4248046875, -9.923828125, -9.4228515625, -8.921875, -8.4208984375, -7.919921875, -7.4189453125, -6.91796875, -6.4169921875, -5.916015625, -5.4150390625, -4.9140625, -4.4130859375, -3.912109375, -3.4111328125, -2.91015625, -2.4091796875, -1.908203125, -1.4072265625, -0.90625, -0.4052734375, 0.095703125, 0.5966796875, 1.09765625, 1.5986328125, 2.099609375, 2.6005859375, 3.1015625, 3.6025390625, 4.103515625, 4.6044921875, 5.10546875, 5.6064453125, 6.107421875, 6.6083984375, 7.109375, 7.6103515625, 8.111328125, 8.6123046875, 9.11328125, 9.6142578125, 10.115234375, 10.6162109375, 11.1171875, 11.6181640625, 12.119140625, 12.6201171875, 13.12109375, 13.6220703125, 14.123046875, 14.6240234375, 15.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 44.0, 460.0, 474.0, 40.0], "bins": [-235.141357421875, -231.34625244140625, -227.5511474609375, -223.75604248046875, -219.96092224121094, -216.1658172607422, -212.37071228027344, -208.5756072998047, -204.78050231933594, -200.9853973388672, -197.19029235839844, -193.3951873779297, -189.60006713867188, -185.80496215820312, -182.00985717773438, -178.21475219726562, -174.41964721679688, -170.62454223632812, -166.82943725585938, -163.03433227539062, -159.2392120361328, -155.44410705566406, -151.6490020751953, -147.85389709472656, -144.0587921142578, -140.26368713378906, -136.4685821533203, -132.67347717285156, -128.87835693359375, -125.083251953125, -121.28814697265625, -117.4930419921875, -113.69793701171875, -109.90283203125, -106.10771942138672, -102.31261444091797, -98.51750946044922, -94.72239685058594, -90.92729187011719, -87.13218688964844, -83.33707427978516, -79.5419692993164, -75.74685668945312, -71.95175170898438, -68.15664672851562, -64.36154174804688, -60.566429138183594, -56.771324157714844, -52.976219177246094, -49.18111038208008, -45.38600540161133, -41.59089660644531, -37.79579162597656, -34.00068283081055, -30.205575942993164, -26.41046905517578, -22.6153621673584, -18.820255279541016, -15.025148391723633, -11.230040550231934, -7.434933662414551, -3.6398258209228516, 0.15528106689453125, 3.950387954711914, 7.745494842529297]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 15.0, 15.0, 14.0, 16.0, 25.0, 27.0, 24.0, 22.0, 30.0, 27.0, 37.0, 39.0, 40.0, 32.0, 38.0, 39.0, 44.0, 45.0, 31.0, 35.0, 32.0, 30.0, 35.0, 41.0, 19.0, 18.0, 30.0, 24.0, 24.0, 25.0, 10.0, 9.0, 19.0, 7.0, 12.0, 5.0, 7.0, 2.0, 4.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-31.177780151367188, -30.143125534057617, -29.108470916748047, -28.073814392089844, -27.039159774780273, -26.004505157470703, -24.969850540161133, -23.935195922851562, -22.90053939819336, -21.86588478088379, -20.83123016357422, -19.796573638916016, -18.761919021606445, -17.727264404296875, -16.692609786987305, -15.657955169677734, -14.623300552368164, -13.588645935058594, -12.553990364074707, -11.519335746765137, -10.48468017578125, -9.45002555847168, -8.41537094116211, -7.380715847015381, -6.346060752868652, -5.311405658721924, -4.276750564575195, -3.242095947265625, -2.2074408531188965, -1.172785758972168, -0.13813114166259766, 0.8965239524841309, 1.9311790466308594, 2.965834140777588, 4.000489234924316, 5.035143852233887, 6.069798946380615, 7.104454040527344, 8.139108657836914, 9.173763275146484, 10.208418846130371, 11.243073463439941, 12.277729034423828, 13.312383651733398, 14.347038269042969, 15.381693840026855, 16.41634750366211, 17.451004028320312, 18.485658645629883, 19.520313262939453, 20.554967880249023, 21.589622497558594, 22.624279022216797, 23.658933639526367, 24.693588256835938, 25.728242874145508, 26.762897491455078, 27.79755210876465, 28.83220672607422, 29.866863250732422, 30.901517868041992, 31.936172485351562, 32.9708251953125, 34.0054817199707, 35.040138244628906]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 15.0, 17.0, 15.0, 15.0, 17.0, 16.0, 20.0, 23.0, 21.0, 21.0, 33.0, 35.0, 35.0, 33.0, 42.0, 46.0, 33.0, 39.0, 27.0, 32.0, 47.0, 43.0, 48.0, 31.0, 42.0, 32.0, 29.0, 22.0, 16.0, 22.0, 21.0, 11.0, 14.0, 21.0, 10.0, 7.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8671875, -2.772308349609375, -2.67742919921875, -2.582550048828125, -2.4876708984375, -2.392791748046875, -2.29791259765625, -2.203033447265625, -2.108154296875, -2.013275146484375, -1.91839599609375, -1.823516845703125, -1.7286376953125, -1.633758544921875, -1.53887939453125, -1.444000244140625, -1.34912109375, -1.254241943359375, -1.15936279296875, -1.064483642578125, -0.9696044921875, -0.874725341796875, -0.77984619140625, -0.684967041015625, -0.590087890625, -0.495208740234375, -0.40032958984375, -0.305450439453125, -0.2105712890625, -0.115692138671875, -0.02081298828125, 0.074066162109375, 0.1689453125, 0.263824462890625, 0.35870361328125, 0.453582763671875, 0.5484619140625, 0.643341064453125, 0.73822021484375, 0.833099365234375, 0.927978515625, 1.022857666015625, 1.11773681640625, 1.212615966796875, 1.3074951171875, 1.402374267578125, 1.49725341796875, 1.592132568359375, 1.68701171875, 1.781890869140625, 1.87677001953125, 1.971649169921875, 2.0665283203125, 2.161407470703125, 2.25628662109375, 2.351165771484375, 2.446044921875, 2.540924072265625, 2.63580322265625, 2.730682373046875, 2.8255615234375, 2.920440673828125, 3.01531982421875, 3.110198974609375, 3.205078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 11.0, 8.0, 12.0, 26.0, 31.0, 32.0, 52.0, 71.0, 95.0, 151.0, 187.0, 346.0, 440.0, 673.0, 1133.0, 1726.0, 2735.0, 4557.0, 7781.0, 13803.0, 26117.0, 52465.0, 125851.0, 450737.0, 1696221.0, 1314372.0, 303961.0, 95982.0, 42780.0, 22001.0, 11932.0, 6990.0, 4089.0, 2512.0, 1572.0, 952.0, 610.0, 419.0, 255.0, 162.0, 159.0, 88.0, 53.0, 37.0, 30.0, 23.0, 19.0, 7.0, 11.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.24554443359375, -5.0809326171875, -4.91632080078125, -4.751708984375, -4.58709716796875, -4.4224853515625, -4.25787353515625, -4.09326171875, -3.92864990234375, -3.7640380859375, -3.59942626953125, -3.434814453125, -3.27020263671875, -3.1055908203125, -2.94097900390625, -2.7763671875, -2.61175537109375, -2.4471435546875, -2.28253173828125, -2.117919921875, -1.95330810546875, -1.7886962890625, -1.62408447265625, -1.45947265625, -1.29486083984375, -1.1302490234375, -0.96563720703125, -0.801025390625, -0.63641357421875, -0.4718017578125, -0.30718994140625, -0.142578125, 0.02203369140625, 0.1866455078125, 0.35125732421875, 0.515869140625, 0.68048095703125, 0.8450927734375, 1.00970458984375, 1.17431640625, 1.33892822265625, 1.5035400390625, 1.66815185546875, 1.832763671875, 1.99737548828125, 2.1619873046875, 2.32659912109375, 2.4912109375, 2.65582275390625, 2.8204345703125, 2.98504638671875, 3.149658203125, 3.31427001953125, 3.4788818359375, 3.64349365234375, 3.80810546875, 3.97271728515625, 4.1373291015625, 4.30194091796875, 4.466552734375, 4.63116455078125, 4.7957763671875, 4.96038818359375, 5.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 15.0, 11.0, 15.0, 16.0, 28.0, 33.0, 43.0, 68.0, 82.0, 114.0, 164.0, 209.0, 310.0, 440.0, 598.0, 556.0, 388.0, 285.0, 193.0, 142.0, 93.0, 74.0, 60.0, 38.0, 22.0, 19.0, 14.0, 11.0, 7.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5546875, -9.272216796875, -8.98974609375, -8.707275390625, -8.4248046875, -8.142333984375, -7.85986328125, -7.577392578125, -7.294921875, -7.012451171875, -6.72998046875, -6.447509765625, -6.1650390625, -5.882568359375, -5.60009765625, -5.317626953125, -5.03515625, -4.752685546875, -4.47021484375, -4.187744140625, -3.9052734375, -3.622802734375, -3.34033203125, -3.057861328125, -2.775390625, -2.492919921875, -2.21044921875, -1.927978515625, -1.6455078125, -1.363037109375, -1.08056640625, -0.798095703125, -0.515625, -0.233154296875, 0.04931640625, 0.331787109375, 0.6142578125, 0.896728515625, 1.17919921875, 1.461669921875, 1.744140625, 2.026611328125, 2.30908203125, 2.591552734375, 2.8740234375, 3.156494140625, 3.43896484375, 3.721435546875, 4.00390625, 4.286376953125, 4.56884765625, 4.851318359375, 5.1337890625, 5.416259765625, 5.69873046875, 5.981201171875, 6.263671875, 6.546142578125, 6.82861328125, 7.111083984375, 7.3935546875, 7.676025390625, 7.95849609375, 8.240966796875, 8.5234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 12.0, 2.0, 17.0, 15.0, 15.0, 41.0, 39.0, 55.0, 87.0, 159.0, 223.0, 333.0, 535.0, 950.0, 1772.0, 3255.0, 6869.0, 14958.0, 35029.0, 93251.0, 290046.0, 1314641.0, 1831780.0, 399984.0, 120330.0, 44522.0, 18246.0, 8216.0, 3933.0, 2041.0, 1134.0, 627.0, 410.0, 263.0, 179.0, 91.0, 73.0, 47.0, 25.0, 25.0, 20.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.1484375, -9.842041015625, -9.53564453125, -9.229248046875, -8.9228515625, -8.616455078125, -8.31005859375, -8.003662109375, -7.697265625, -7.390869140625, -7.08447265625, -6.778076171875, -6.4716796875, -6.165283203125, -5.85888671875, -5.552490234375, -5.24609375, -4.939697265625, -4.63330078125, -4.326904296875, -4.0205078125, -3.714111328125, -3.40771484375, -3.101318359375, -2.794921875, -2.488525390625, -2.18212890625, -1.875732421875, -1.5693359375, -1.262939453125, -0.95654296875, -0.650146484375, -0.34375, -0.037353515625, 0.26904296875, 0.575439453125, 0.8818359375, 1.188232421875, 1.49462890625, 1.801025390625, 2.107421875, 2.413818359375, 2.72021484375, 3.026611328125, 3.3330078125, 3.639404296875, 3.94580078125, 4.252197265625, 4.55859375, 4.864990234375, 5.17138671875, 5.477783203125, 5.7841796875, 6.090576171875, 6.39697265625, 6.703369140625, 7.009765625, 7.316162109375, 7.62255859375, 7.928955078125, 8.2353515625, 8.541748046875, 8.84814453125, 9.154541015625, 9.4609375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 16.0, 46.0, 83.0, 137.0, 205.0, 186.0, 168.0, 78.0, 43.0, 29.0, 11.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.63381958007812, -131.83978271484375, -129.04576110839844, -126.25172424316406, -123.45769500732422, -120.66366577148438, -117.86962890625, -115.07559967041016, -112.28157043457031, -109.48754119873047, -106.6935043334961, -103.89947509765625, -101.1054458618164, -98.31141662597656, -95.51737976074219, -92.72335052490234, -89.92931365966797, -87.13528442382812, -84.34124755859375, -81.5472183227539, -78.75318908691406, -75.95915222167969, -73.16512298583984, -70.37109375, -67.57705688476562, -64.78302764892578, -61.98899459838867, -59.19496154785156, -56.40093231201172, -53.60689926147461, -50.8128662109375, -48.018836975097656, -45.22481155395508, -42.43077850341797, -39.636749267578125, -36.842716217041016, -34.048683166503906, -31.254653930664062, -28.460620880126953, -25.666589736938477, -22.87255859375, -20.078527450561523, -17.284496307373047, -14.490463256835938, -11.696432113647461, -8.902400970458984, -6.108367919921875, -3.3143367767333984, -0.5203056335449219, 2.273725986480713, 5.067757606506348, 7.861789703369141, 10.655820846557617, 13.449851989746094, 16.243885040283203, 19.03791618347168, 21.831947326660156, 24.625978469848633, 27.42000961303711, 30.21404266357422, 33.00807189941406, 35.80210494995117, 38.59613800048828, 41.390167236328125, 44.184200286865234]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 6.0, 0.0, 9.0, 10.0, 4.0, 14.0, 17.0, 24.0, 24.0, 22.0, 25.0, 27.0, 31.0, 41.0, 46.0, 46.0, 45.0, 38.0, 37.0, 24.0, 39.0, 48.0, 30.0, 34.0, 44.0, 40.0, 36.0, 30.0, 33.0, 29.0, 21.0, 24.0, 24.0, 18.0, 8.0, 15.0, 10.0, 8.0, 4.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.9023380279541, -27.00385284423828, -26.105365753173828, -25.206880569458008, -24.308395385742188, -23.409910202026367, -22.511425018310547, -21.612937927246094, -20.714452743530273, -19.815967559814453, -18.91748046875, -18.01899528503418, -17.12051010131836, -16.22202491760254, -15.323538780212402, -14.425052642822266, -13.526567459106445, -12.628082275390625, -11.729596138000488, -10.831110000610352, -9.932624816894531, -9.034139633178711, -8.135653495788574, -7.237167835235596, -6.338682174682617, -5.440196514129639, -4.54171085357666, -3.6432251930236816, -2.744739532470703, -1.8462538719177246, -0.9477682113647461, -0.04928255081176758, 0.8492012023925781, 1.7476868629455566, 2.646172523498535, 3.5446581840515137, 4.443143844604492, 5.341629505157471, 6.240115165710449, 7.138600826263428, 8.037086486816406, 8.935571670532227, 9.834057807922363, 10.7325439453125, 11.63102912902832, 12.52951431274414, 13.428000450134277, 14.326486587524414, 15.224971771240234, 16.123456954956055, 17.021942138671875, 17.920429229736328, 18.81891441345215, 19.71739959716797, 20.615886688232422, 21.514371871948242, 22.412857055664062, 23.311342239379883, 24.209827423095703, 25.108314514160156, 26.006799697875977, 26.905284881591797, 27.80377197265625, 28.70225715637207, 29.60074234008789]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 0.0, 4.0, 2.0, 5.0, 5.0, 11.0, 4.0, 8.0, 16.0, 9.0, 18.0, 20.0, 20.0, 23.0, 34.0, 32.0, 29.0, 22.0, 28.0, 28.0, 30.0, 43.0, 42.0, 37.0, 40.0, 43.0, 47.0, 35.0, 29.0, 38.0, 34.0, 25.0, 29.0, 28.0, 24.0, 30.0, 20.0, 25.0, 12.0, 15.0, 7.0, 11.0, 8.0, 13.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.96484375, -2.867828369140625, -2.77081298828125, -2.673797607421875, -2.5767822265625, -2.479766845703125, -2.38275146484375, -2.285736083984375, -2.188720703125, -2.091705322265625, -1.99468994140625, -1.897674560546875, -1.8006591796875, -1.703643798828125, -1.60662841796875, -1.509613037109375, -1.41259765625, -1.315582275390625, -1.21856689453125, -1.121551513671875, -1.0245361328125, -0.927520751953125, -0.83050537109375, -0.733489990234375, -0.636474609375, -0.539459228515625, -0.44244384765625, -0.345428466796875, -0.2484130859375, -0.151397705078125, -0.05438232421875, 0.042633056640625, 0.1396484375, 0.236663818359375, 0.33367919921875, 0.430694580078125, 0.5277099609375, 0.624725341796875, 0.72174072265625, 0.818756103515625, 0.915771484375, 1.012786865234375, 1.10980224609375, 1.206817626953125, 1.3038330078125, 1.400848388671875, 1.49786376953125, 1.594879150390625, 1.69189453125, 1.788909912109375, 1.88592529296875, 1.982940673828125, 2.0799560546875, 2.176971435546875, 2.27398681640625, 2.371002197265625, 2.468017578125, 2.565032958984375, 2.66204833984375, 2.759063720703125, 2.8560791015625, 2.953094482421875, 3.05010986328125, 3.147125244140625, 3.244140625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 11.0, 34.0, 19.0, 39.0, 78.0, 109.0, 180.0, 273.0, 427.0, 637.0, 1055.0, 1705.0, 2647.0, 4533.0, 7787.0, 13479.0, 24188.0, 44440.0, 83040.0, 151002.0, 244719.0, 206987.0, 117955.0, 63732.0, 34570.0, 18746.0, 10517.0, 6035.0, 3563.0, 2228.0, 1376.0, 864.0, 597.0, 337.0, 220.0, 151.0, 92.0, 57.0, 43.0, 21.0, 18.0, 13.0, 12.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328125, -9.025146484375, -8.72216796875, -8.419189453125, -8.1162109375, -7.813232421875, -7.51025390625, -7.207275390625, -6.904296875, -6.601318359375, -6.29833984375, -5.995361328125, -5.6923828125, -5.389404296875, -5.08642578125, -4.783447265625, -4.48046875, -4.177490234375, -3.87451171875, -3.571533203125, -3.2685546875, -2.965576171875, -2.66259765625, -2.359619140625, -2.056640625, -1.753662109375, -1.45068359375, -1.147705078125, -0.8447265625, -0.541748046875, -0.23876953125, 0.064208984375, 0.3671875, 0.670166015625, 0.97314453125, 1.276123046875, 1.5791015625, 1.882080078125, 2.18505859375, 2.488037109375, 2.791015625, 3.093994140625, 3.39697265625, 3.699951171875, 4.0029296875, 4.305908203125, 4.60888671875, 4.911865234375, 5.21484375, 5.517822265625, 5.82080078125, 6.123779296875, 6.4267578125, 6.729736328125, 7.03271484375, 7.335693359375, 7.638671875, 7.941650390625, 8.24462890625, 8.547607421875, 8.8505859375, 9.153564453125, 9.45654296875, 9.759521484375, 10.0625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 9.0, 6.0, 10.0, 13.0, 17.0, 20.0, 12.0, 24.0, 20.0, 12.0, 23.0, 17.0, 39.0, 29.0, 28.0, 24.0, 30.0, 43.0, 45.0, 28.0, 1059.0, 38.0, 54.0, 38.0, 30.0, 40.0, 35.0, 21.0, 15.0, 25.0, 33.0, 20.0, 26.0, 24.0, 18.0, 14.0, 11.0, 5.0, 5.0, 7.0, 11.0, 9.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.216796875, -2.141571044921875, -2.06634521484375, -1.991119384765625, -1.9158935546875, -1.840667724609375, -1.76544189453125, -1.690216064453125, -1.614990234375, -1.539764404296875, -1.46453857421875, -1.389312744140625, -1.3140869140625, -1.238861083984375, -1.16363525390625, -1.088409423828125, -1.01318359375, -0.937957763671875, -0.86273193359375, -0.787506103515625, -0.7122802734375, -0.637054443359375, -0.56182861328125, -0.486602783203125, -0.411376953125, -0.336151123046875, -0.26092529296875, -0.185699462890625, -0.1104736328125, -0.035247802734375, 0.03997802734375, 0.115203857421875, 0.1904296875, 0.265655517578125, 0.34088134765625, 0.416107177734375, 0.4913330078125, 0.566558837890625, 0.64178466796875, 0.717010498046875, 0.792236328125, 0.867462158203125, 0.94268798828125, 1.017913818359375, 1.0931396484375, 1.168365478515625, 1.24359130859375, 1.318817138671875, 1.39404296875, 1.469268798828125, 1.54449462890625, 1.619720458984375, 1.6949462890625, 1.770172119140625, 1.84539794921875, 1.920623779296875, 1.995849609375, 2.071075439453125, 2.14630126953125, 2.221527099609375, 2.2967529296875, 2.371978759765625, 2.44720458984375, 2.522430419921875, 2.59765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 11.0, 18.0, 34.0, 33.0, 56.0, 85.0, 110.0, 122.0, 204.0, 315.0, 450.0, 671.0, 938.0, 1348.0, 2261.0, 3414.0, 5463.0, 9246.0, 16479.0, 30819.0, 61395.0, 138798.0, 403695.0, 909052.0, 289264.0, 109912.0, 50962.0, 25927.0, 14154.0, 8109.0, 4818.0, 2982.0, 1965.0, 1277.0, 850.0, 543.0, 371.0, 280.0, 197.0, 136.0, 106.0, 83.0, 51.0, 40.0, 28.0, 15.0, 6.0, 9.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0], "bins": [-6.6875, -6.487060546875, -6.28662109375, -6.086181640625, -5.8857421875, -5.685302734375, -5.48486328125, -5.284423828125, -5.083984375, -4.883544921875, -4.68310546875, -4.482666015625, -4.2822265625, -4.081787109375, -3.88134765625, -3.680908203125, -3.48046875, -3.280029296875, -3.07958984375, -2.879150390625, -2.6787109375, -2.478271484375, -2.27783203125, -2.077392578125, -1.876953125, -1.676513671875, -1.47607421875, -1.275634765625, -1.0751953125, -0.874755859375, -0.67431640625, -0.473876953125, -0.2734375, -0.072998046875, 0.12744140625, 0.327880859375, 0.5283203125, 0.728759765625, 0.92919921875, 1.129638671875, 1.330078125, 1.530517578125, 1.73095703125, 1.931396484375, 2.1318359375, 2.332275390625, 2.53271484375, 2.733154296875, 2.93359375, 3.134033203125, 3.33447265625, 3.534912109375, 3.7353515625, 3.935791015625, 4.13623046875, 4.336669921875, 4.537109375, 4.737548828125, 4.93798828125, 5.138427734375, 5.3388671875, 5.539306640625, 5.73974609375, 5.940185546875, 6.140625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 10.0, 8.0, 9.0, 8.0, 7.0, 14.0, 13.0, 19.0, 24.0, 21.0, 26.0, 28.0, 45.0, 50.0, 65.0, 74.0, 63.0, 45.0, 63.0, 75.0, 63.0, 44.0, 41.0, 35.0, 31.0, 18.0, 14.0, 11.0, 17.0, 7.0, 7.0, 4.0, 4.0, 2.0, 6.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.123046875, -2.0592193603515625, -1.995391845703125, -1.9315643310546875, -1.86773681640625, -1.8039093017578125, -1.740081787109375, -1.6762542724609375, -1.6124267578125, -1.5485992431640625, -1.484771728515625, -1.4209442138671875, -1.35711669921875, -1.2932891845703125, -1.229461669921875, -1.1656341552734375, -1.101806640625, -1.0379791259765625, -0.974151611328125, -0.9103240966796875, -0.84649658203125, -0.7826690673828125, -0.718841552734375, -0.6550140380859375, -0.5911865234375, -0.5273590087890625, -0.463531494140625, -0.3997039794921875, -0.33587646484375, -0.2720489501953125, -0.208221435546875, -0.1443939208984375, -0.08056640625, -0.0167388916015625, 0.047088623046875, 0.1109161376953125, 0.17474365234375, 0.2385711669921875, 0.302398681640625, 0.3662261962890625, 0.4300537109375, 0.4938812255859375, 0.557708740234375, 0.6215362548828125, 0.68536376953125, 0.7491912841796875, 0.813018798828125, 0.8768463134765625, 0.940673828125, 1.0045013427734375, 1.068328857421875, 1.1321563720703125, 1.19598388671875, 1.2598114013671875, 1.323638916015625, 1.3874664306640625, 1.4512939453125, 1.5151214599609375, 1.578948974609375, 1.6427764892578125, 1.70660400390625, 1.7704315185546875, 1.834259033203125, 1.8980865478515625, 1.9619140625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 12.0, 10.0, 14.0, 7.0, 23.0, 28.0, 51.0, 61.0, 61.0, 91.0, 142.0, 150.0, 266.0, 690.0, 3202.0, 29633.0, 791650.0, 209658.0, 9941.0, 1540.0, 476.0, 232.0, 145.0, 86.0, 75.0, 58.0, 43.0, 43.0, 27.0, 30.0, 17.0, 19.0, 13.0, 11.0, 8.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.015625, -28.102783203125, -27.18994140625, -26.277099609375, -25.3642578125, -24.451416015625, -23.53857421875, -22.625732421875, -21.712890625, -20.800048828125, -19.88720703125, -18.974365234375, -18.0615234375, -17.148681640625, -16.23583984375, -15.322998046875, -14.41015625, -13.497314453125, -12.58447265625, -11.671630859375, -10.7587890625, -9.845947265625, -8.93310546875, -8.020263671875, -7.107421875, -6.194580078125, -5.28173828125, -4.368896484375, -3.4560546875, -2.543212890625, -1.63037109375, -0.717529296875, 0.1953125, 1.108154296875, 2.02099609375, 2.933837890625, 3.8466796875, 4.759521484375, 5.67236328125, 6.585205078125, 7.498046875, 8.410888671875, 9.32373046875, 10.236572265625, 11.1494140625, 12.062255859375, 12.97509765625, 13.887939453125, 14.80078125, 15.713623046875, 16.62646484375, 17.539306640625, 18.4521484375, 19.364990234375, 20.27783203125, 21.190673828125, 22.103515625, 23.016357421875, 23.92919921875, 24.842041015625, 25.7548828125, 26.667724609375, 27.58056640625, 28.493408203125, 29.40625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 19.0, 25.0, 60.0, 71.0, 123.0, 177.0, 174.0, 125.0, 105.0, 59.0, 25.0, 15.0, 10.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.151393890380859, -3.946289539337158, -3.741185188293457, -3.536080837249756, -3.3309762477874756, -3.1258718967437744, -2.9207675457000732, -2.715662956237793, -2.510558605194092, -2.3054542541503906, -2.1003499031066895, -1.8952454328536987, -1.690140962600708, -1.4850366115570068, -1.2799322605133057, -1.074827790260315, -0.8697235584259033, -0.6646191477775574, -0.4595147669315338, -0.25441038608551025, -0.04930597543716431, 0.15579843521118164, 0.3609027862548828, 0.5660072565078735, 0.7711116075515747, 0.9762160181999207, 1.1813204288482666, 1.3864247798919678, 1.591529130935669, 1.7966336011886597, 2.0017380714416504, 2.2068424224853516, 2.4119467735290527, 2.617051124572754, 2.822155475616455, 3.0272598266601562, 3.2323644161224365, 3.4374687671661377, 3.642573118209839, 3.847677707672119, 4.05278205871582, 4.2578864097595215, 4.462990760803223, 4.668095111846924, 4.873199462890625, 5.078304290771484, 5.283408164978027, 5.488512992858887, 5.69361686706543, 5.898721218109131, 6.103825569152832, 6.308929920196533, 6.514034271240234, 6.719139099121094, 6.924242973327637, 7.129347801208496, 7.334452152252197, 7.539556503295898, 7.7446608543396, 7.949765205383301, 8.15487003326416, 8.359973907470703, 8.565078735351562, 8.770182609558105, 8.975287437438965]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 7.0, 9.0, 10.0, 9.0, 14.0, 17.0, 23.0, 22.0, 30.0, 31.0, 37.0, 25.0, 28.0, 41.0, 42.0, 35.0, 46.0, 51.0, 44.0, 45.0, 33.0, 42.0, 36.0, 28.0, 36.0, 34.0, 24.0, 30.0, 21.0, 25.0, 17.0, 23.0, 19.0, 18.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.8581655025482178, -2.77230167388916, -2.6864376068115234, -2.600573778152466, -2.514709711074829, -2.4288458824157715, -2.3429818153381348, -2.257117986679077, -2.1712541580200195, -2.085390329360962, -1.9995262622833252, -1.9136624336242676, -1.8277983665466309, -1.7419345378875732, -1.656070590019226, -1.570206642150879, -1.4843425750732422, -1.398478627204895, -1.3126146793365479, -1.2267508506774902, -1.1408867835998535, -1.055022954940796, -0.9691590070724487, -0.8832950592041016, -0.7974311113357544, -0.7115671634674072, -0.6257032155990601, -0.5398393273353577, -0.4539753794670105, -0.36811143159866333, -0.28224754333496094, -0.19638359546661377, -0.1105196475982666, -0.024655714631080627, 0.06120821833610535, 0.14707213640213013, 0.2329360842704773, 0.31880003213882446, 0.40466392040252686, 0.490527868270874, 0.5763918161392212, 0.6622557640075684, 0.7481197118759155, 0.8339836001396179, 0.9198475480079651, 1.005711555480957, 1.0915753841400146, 1.1774393320083618, 1.263303279876709, 1.3491672277450562, 1.4350311756134033, 1.520895004272461, 1.6067590713500977, 1.6926229000091553, 1.7784868478775024, 1.8643507957458496, 1.9502147436141968, 2.036078691482544, 2.1219425201416016, 2.2078065872192383, 2.293670415878296, 2.3795344829559326, 2.4653983116149902, 2.551262378692627, 2.6371262073516846]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 17.0, 7.0, 21.0, 22.0, 31.0, 24.0, 30.0, 35.0, 31.0, 34.0, 39.0, 34.0, 43.0, 33.0, 47.0, 43.0, 30.0, 44.0, 46.0, 42.0, 39.0, 29.0, 35.0, 33.0, 24.0, 28.0, 27.0, 18.0, 13.0, 14.0, 12.0, 8.0, 6.0, 9.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.390625, -3.28546142578125, -3.1802978515625, -3.07513427734375, -2.969970703125, -2.86480712890625, -2.7596435546875, -2.65447998046875, -2.54931640625, -2.44415283203125, -2.3389892578125, -2.23382568359375, -2.128662109375, -2.02349853515625, -1.9183349609375, -1.81317138671875, -1.7080078125, -1.60284423828125, -1.4976806640625, -1.39251708984375, -1.287353515625, -1.18218994140625, -1.0770263671875, -0.97186279296875, -0.86669921875, -0.76153564453125, -0.6563720703125, -0.55120849609375, -0.446044921875, -0.34088134765625, -0.2357177734375, -0.13055419921875, -0.025390625, 0.07977294921875, 0.1849365234375, 0.29010009765625, 0.395263671875, 0.50042724609375, 0.6055908203125, 0.71075439453125, 0.81591796875, 0.92108154296875, 1.0262451171875, 1.13140869140625, 1.236572265625, 1.34173583984375, 1.4468994140625, 1.55206298828125, 1.6572265625, 1.76239013671875, 1.8675537109375, 1.97271728515625, 2.077880859375, 2.18304443359375, 2.2882080078125, 2.39337158203125, 2.49853515625, 2.60369873046875, 2.7088623046875, 2.81402587890625, 2.919189453125, 3.02435302734375, 3.1295166015625, 3.23468017578125, 3.33984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 13.0, 19.0, 32.0, 43.0, 65.0, 111.0, 157.0, 235.0, 341.0, 586.0, 903.0, 1429.0, 2217.0, 3574.0, 5872.0, 10096.0, 18675.0, 38934.0, 104699.0, 455925.0, 269846.0, 69337.0, 29194.0, 14871.0, 8170.0, 4908.0, 3017.0, 1865.0, 1226.0, 780.0, 493.0, 308.0, 213.0, 139.0, 94.0, 54.0, 38.0, 22.0, 17.0, 14.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.67901611328125, -4.5220947265625, -4.36517333984375, -4.208251953125, -4.05133056640625, -3.8944091796875, -3.73748779296875, -3.58056640625, -3.42364501953125, -3.2667236328125, -3.10980224609375, -2.952880859375, -2.79595947265625, -2.6390380859375, -2.48211669921875, -2.3251953125, -2.16827392578125, -2.0113525390625, -1.85443115234375, -1.697509765625, -1.54058837890625, -1.3836669921875, -1.22674560546875, -1.06982421875, -0.91290283203125, -0.7559814453125, -0.59906005859375, -0.442138671875, -0.28521728515625, -0.1282958984375, 0.02862548828125, 0.185546875, 0.34246826171875, 0.4993896484375, 0.65631103515625, 0.813232421875, 0.97015380859375, 1.1270751953125, 1.28399658203125, 1.44091796875, 1.59783935546875, 1.7547607421875, 1.91168212890625, 2.068603515625, 2.22552490234375, 2.3824462890625, 2.53936767578125, 2.6962890625, 2.85321044921875, 3.0101318359375, 3.16705322265625, 3.323974609375, 3.48089599609375, 3.6378173828125, 3.79473876953125, 3.95166015625, 4.10858154296875, 4.2655029296875, 4.42242431640625, 4.579345703125, 4.73626708984375, 4.8931884765625, 5.05010986328125, 5.20703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 7.0, 10.0, 7.0, 16.0, 17.0, 24.0, 11.0, 21.0, 23.0, 26.0, 44.0, 39.0, 47.0, 46.0, 55.0, 69.0, 162.0, 379.0, 1404.0, 152.0, 86.0, 57.0, 43.0, 39.0, 28.0, 29.0, 24.0, 29.0, 20.0, 20.0, 16.0, 13.0, 17.0, 17.0, 5.0, 7.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.2421875, -9.8896484375, -9.537109375, -9.1845703125, -8.83203125, -8.4794921875, -8.126953125, -7.7744140625, -7.421875, -7.0693359375, -6.716796875, -6.3642578125, -6.01171875, -5.6591796875, -5.306640625, -4.9541015625, -4.6015625, -4.2490234375, -3.896484375, -3.5439453125, -3.19140625, -2.8388671875, -2.486328125, -2.1337890625, -1.78125, -1.4287109375, -1.076171875, -0.7236328125, -0.37109375, -0.0185546875, 0.333984375, 0.6865234375, 1.0390625, 1.3916015625, 1.744140625, 2.0966796875, 2.44921875, 2.8017578125, 3.154296875, 3.5068359375, 3.859375, 4.2119140625, 4.564453125, 4.9169921875, 5.26953125, 5.6220703125, 5.974609375, 6.3271484375, 6.6796875, 7.0322265625, 7.384765625, 7.7373046875, 8.08984375, 8.4423828125, 8.794921875, 9.1474609375, 9.5, 9.8525390625, 10.205078125, 10.5576171875, 10.91015625, 11.2626953125, 11.615234375, 11.9677734375, 12.3203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 4.0, 18.0, 3.0, 6.0, 12.0, 9.0, 26.0, 22.0, 41.0, 45.0, 59.0, 69.0, 102.0, 166.0, 275.0, 493.0, 947.0, 2665.0, 11115.0, 77103.0, 2417755.0, 589522.0, 35135.0, 6421.0, 1738.0, 741.0, 434.0, 250.0, 137.0, 93.0, 70.0, 50.0, 48.0, 32.0, 24.0, 14.0, 16.0, 11.0, 4.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-18.625, -18.119140625, -17.61328125, -17.107421875, -16.6015625, -16.095703125, -15.58984375, -15.083984375, -14.578125, -14.072265625, -13.56640625, -13.060546875, -12.5546875, -12.048828125, -11.54296875, -11.037109375, -10.53125, -10.025390625, -9.51953125, -9.013671875, -8.5078125, -8.001953125, -7.49609375, -6.990234375, -6.484375, -5.978515625, -5.47265625, -4.966796875, -4.4609375, -3.955078125, -3.44921875, -2.943359375, -2.4375, -1.931640625, -1.42578125, -0.919921875, -0.4140625, 0.091796875, 0.59765625, 1.103515625, 1.609375, 2.115234375, 2.62109375, 3.126953125, 3.6328125, 4.138671875, 4.64453125, 5.150390625, 5.65625, 6.162109375, 6.66796875, 7.173828125, 7.6796875, 8.185546875, 8.69140625, 9.197265625, 9.703125, 10.208984375, 10.71484375, 11.220703125, 11.7265625, 12.232421875, 12.73828125, 13.244140625, 13.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 561.0, 453.0, 2.0], "bins": [-598.583984375, -588.9202270507812, -579.2564697265625, -569.5927734375, -559.9290161132812, -550.2652587890625, -540.6015014648438, -530.937744140625, -521.2739868164062, -511.6102294921875, -501.9465026855469, -492.2827453613281, -482.6189880371094, -472.95526123046875, -463.29150390625, -453.62774658203125, -443.96405029296875, -434.30029296875, -424.6365661621094, -414.9728088378906, -405.3090515136719, -395.64532470703125, -385.9815673828125, -376.31781005859375, -366.654052734375, -356.99029541015625, -347.3265686035156, -337.6628112792969, -327.9990539550781, -318.3353271484375, -308.67156982421875, -299.0078125, -289.3440856933594, -279.6803283691406, -270.0166015625, -260.35284423828125, -250.68910217285156, -241.02536010742188, -231.36160278320312, -221.69786071777344, -212.0341033935547, -202.370361328125, -192.70660400390625, -183.04286193847656, -173.37911987304688, -163.71536254882812, -154.05162048339844, -144.38787841796875, -134.72412109375, -125.06037139892578, -115.3966293334961, -105.73287963867188, -96.06913757324219, -86.40538787841797, -76.74163818359375, -67.07789611816406, -57.414154052734375, -47.75040817260742, -38.08666229248047, -28.42291259765625, -18.759166717529297, -9.095420837402344, 0.568328857421875, 10.232070922851562, 19.89582061767578]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 7.0, 6.0, 7.0, 8.0, 16.0, 19.0, 19.0, 16.0, 17.0, 20.0, 34.0, 31.0, 30.0, 24.0, 37.0, 41.0, 38.0, 33.0, 37.0, 45.0, 42.0, 39.0, 46.0, 42.0, 41.0, 34.0, 37.0, 34.0, 30.0, 16.0, 28.0, 25.0, 21.0, 18.0, 6.0, 9.0, 4.0, 10.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.07630157470703, -27.971431732177734, -26.866561889648438, -25.761690139770508, -24.65682029724121, -23.551950454711914, -22.447078704833984, -21.342208862304688, -20.23733901977539, -19.132469177246094, -18.027599334716797, -16.922727584838867, -15.81785774230957, -14.712987899780273, -13.60811710357666, -12.503246307373047, -11.39837646484375, -10.293506622314453, -9.18863582611084, -8.083765029907227, -6.97889518737793, -5.874024868011475, -4.7691545486450195, -3.6642842292785645, -2.5594139099121094, -1.4545435905456543, -0.3496732711791992, 0.7551970481872559, 1.860067367553711, 2.964937686920166, 4.069808006286621, 5.174678325653076, 6.279548645019531, 7.384418964385986, 8.489289283752441, 9.594160079956055, 10.699029922485352, 11.803899765014648, 12.908770561218262, 14.013641357421875, 15.118511199951172, 16.22338104248047, 17.328250885009766, 18.433122634887695, 19.537992477416992, 20.64286231994629, 21.74773406982422, 22.852603912353516, 23.957473754882812, 25.06234359741211, 26.167213439941406, 27.272085189819336, 28.376955032348633, 29.48182487487793, 30.58669662475586, 31.691566467285156, 32.79643630981445, 33.90130615234375, 35.00617599487305, 36.111045837402344, 37.215919494628906, 38.3207893371582, 39.4256591796875, 40.5305290222168, 41.635398864746094]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 13.0, 5.0, 13.0, 12.0, 18.0, 16.0, 22.0, 26.0, 31.0, 31.0, 39.0, 35.0, 27.0, 31.0, 38.0, 43.0, 29.0, 38.0, 45.0, 43.0, 33.0, 32.0, 35.0, 35.0, 24.0, 29.0, 31.0, 31.0, 26.0, 28.0, 16.0, 12.0, 14.0, 17.0, 10.0, 8.0, 13.0, 10.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9609375, -2.860015869140625, -2.75909423828125, -2.658172607421875, -2.5572509765625, -2.456329345703125, -2.35540771484375, -2.254486083984375, -2.153564453125, -2.052642822265625, -1.95172119140625, -1.850799560546875, -1.7498779296875, -1.648956298828125, -1.54803466796875, -1.447113037109375, -1.34619140625, -1.245269775390625, -1.14434814453125, -1.043426513671875, -0.9425048828125, -0.841583251953125, -0.74066162109375, -0.639739990234375, -0.538818359375, -0.437896728515625, -0.33697509765625, -0.236053466796875, -0.1351318359375, -0.034210205078125, 0.06671142578125, 0.167633056640625, 0.2685546875, 0.369476318359375, 0.47039794921875, 0.571319580078125, 0.6722412109375, 0.773162841796875, 0.87408447265625, 0.975006103515625, 1.075927734375, 1.176849365234375, 1.27777099609375, 1.378692626953125, 1.4796142578125, 1.580535888671875, 1.68145751953125, 1.782379150390625, 1.88330078125, 1.984222412109375, 2.08514404296875, 2.186065673828125, 2.2869873046875, 2.387908935546875, 2.48883056640625, 2.589752197265625, 2.690673828125, 2.791595458984375, 2.89251708984375, 2.993438720703125, 3.0943603515625, 3.195281982421875, 3.29620361328125, 3.397125244140625, 3.498046875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 7.0, 11.0, 16.0, 20.0, 34.0, 49.0, 51.0, 76.0, 111.0, 170.0, 290.0, 369.0, 548.0, 857.0, 1325.0, 2078.0, 3310.0, 5483.0, 8844.0, 15320.0, 28045.0, 55521.0, 131725.0, 469523.0, 1574674.0, 1332533.0, 347593.0, 107207.0, 47684.0, 24766.0, 13926.0, 8480.0, 5008.0, 3066.0, 1957.0, 1267.0, 783.0, 558.0, 326.0, 233.0, 154.0, 97.0, 58.0, 35.0, 34.0, 18.0, 13.0, 7.0, 9.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.546875, -5.38323974609375, -5.2196044921875, -5.05596923828125, -4.892333984375, -4.72869873046875, -4.5650634765625, -4.40142822265625, -4.23779296875, -4.07415771484375, -3.9105224609375, -3.74688720703125, -3.583251953125, -3.41961669921875, -3.2559814453125, -3.09234619140625, -2.9287109375, -2.76507568359375, -2.6014404296875, -2.43780517578125, -2.274169921875, -2.11053466796875, -1.9468994140625, -1.78326416015625, -1.61962890625, -1.45599365234375, -1.2923583984375, -1.12872314453125, -0.965087890625, -0.80145263671875, -0.6378173828125, -0.47418212890625, -0.310546875, -0.14691162109375, 0.0167236328125, 0.18035888671875, 0.343994140625, 0.50762939453125, 0.6712646484375, 0.83489990234375, 0.99853515625, 1.16217041015625, 1.3258056640625, 1.48944091796875, 1.653076171875, 1.81671142578125, 1.9803466796875, 2.14398193359375, 2.3076171875, 2.47125244140625, 2.6348876953125, 2.79852294921875, 2.962158203125, 3.12579345703125, 3.2894287109375, 3.45306396484375, 3.61669921875, 3.78033447265625, 3.9439697265625, 4.10760498046875, 4.271240234375, 4.43487548828125, 4.5985107421875, 4.76214599609375, 4.92578125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 11.0, 16.0, 28.0, 25.0, 31.0, 44.0, 49.0, 61.0, 95.0, 105.0, 139.0, 203.0, 302.0, 399.0, 479.0, 517.0, 361.0, 314.0, 212.0, 162.0, 115.0, 90.0, 72.0, 47.0, 52.0, 30.0, 31.0, 17.0, 13.0, 6.0, 5.0, 5.0, 9.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6171875, -8.3555908203125, -8.093994140625, -7.8323974609375, -7.57080078125, -7.3092041015625, -7.047607421875, -6.7860107421875, -6.5244140625, -6.2628173828125, -6.001220703125, -5.7396240234375, -5.47802734375, -5.2164306640625, -4.954833984375, -4.6932373046875, -4.431640625, -4.1700439453125, -3.908447265625, -3.6468505859375, -3.38525390625, -3.1236572265625, -2.862060546875, -2.6004638671875, -2.3388671875, -2.0772705078125, -1.815673828125, -1.5540771484375, -1.29248046875, -1.0308837890625, -0.769287109375, -0.5076904296875, -0.24609375, 0.0155029296875, 0.277099609375, 0.5386962890625, 0.80029296875, 1.0618896484375, 1.323486328125, 1.5850830078125, 1.8466796875, 2.1082763671875, 2.369873046875, 2.6314697265625, 2.89306640625, 3.1546630859375, 3.416259765625, 3.6778564453125, 3.939453125, 4.2010498046875, 4.462646484375, 4.7242431640625, 4.98583984375, 5.2474365234375, 5.509033203125, 5.7706298828125, 6.0322265625, 6.2938232421875, 6.555419921875, 6.8170166015625, 7.07861328125, 7.3402099609375, 7.601806640625, 7.8634033203125, 8.125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 9.0, 12.0, 12.0, 20.0, 23.0, 38.0, 54.0, 87.0, 117.0, 200.0, 384.0, 534.0, 1069.0, 2003.0, 3757.0, 7797.0, 16235.0, 37435.0, 93827.0, 268353.0, 1068502.0, 1926898.0, 508624.0, 153708.0, 57414.0, 24620.0, 11105.0, 5361.0, 2707.0, 1430.0, 767.0, 481.0, 237.0, 157.0, 103.0, 60.0, 32.0, 34.0, 30.0, 14.0, 6.0, 11.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.9296875, -8.6439208984375, -8.358154296875, -8.0723876953125, -7.78662109375, -7.5008544921875, -7.215087890625, -6.9293212890625, -6.6435546875, -6.3577880859375, -6.072021484375, -5.7862548828125, -5.50048828125, -5.2147216796875, -4.928955078125, -4.6431884765625, -4.357421875, -4.0716552734375, -3.785888671875, -3.5001220703125, -3.21435546875, -2.9285888671875, -2.642822265625, -2.3570556640625, -2.0712890625, -1.7855224609375, -1.499755859375, -1.2139892578125, -0.92822265625, -0.6424560546875, -0.356689453125, -0.0709228515625, 0.21484375, 0.5006103515625, 0.786376953125, 1.0721435546875, 1.35791015625, 1.6436767578125, 1.929443359375, 2.2152099609375, 2.5009765625, 2.7867431640625, 3.072509765625, 3.3582763671875, 3.64404296875, 3.9298095703125, 4.215576171875, 4.5013427734375, 4.787109375, 5.0728759765625, 5.358642578125, 5.6444091796875, 5.93017578125, 6.2159423828125, 6.501708984375, 6.7874755859375, 7.0732421875, 7.3590087890625, 7.644775390625, 7.9305419921875, 8.21630859375, 8.5020751953125, 8.787841796875, 9.0736083984375, 9.359375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 23.0, 73.0, 184.0, 288.0, 236.0, 129.0, 52.0, 19.0, 3.0, 1.0, 1.0], "bins": [-243.63755798339844, -239.3422088623047, -235.046875, -230.75152587890625, -226.4561767578125, -222.16082763671875, -217.865478515625, -213.5701446533203, -209.27479553222656, -204.9794464111328, -200.68411254882812, -196.38876342773438, -192.09341430664062, -187.79806518554688, -183.50271606445312, -179.20738220214844, -174.9120330810547, -170.61668395996094, -166.32135009765625, -162.0260009765625, -157.73065185546875, -153.435302734375, -149.13995361328125, -144.84461975097656, -140.5492706298828, -136.25392150878906, -131.95858764648438, -127.66323852539062, -123.36788940429688, -119.07254028320312, -114.7771987915039, -110.48185729980469, -106.18650817871094, -101.89115905761719, -97.59581756591797, -93.30047607421875, -89.005126953125, -84.70977783203125, -80.41443634033203, -76.11909484863281, -71.82374572753906, -67.52839660644531, -63.233055114746094, -58.93770980834961, -54.642364501953125, -50.34701919555664, -46.051673889160156, -41.75632858276367, -37.46098327636719, -33.1656379699707, -28.87029266357422, -24.574947357177734, -20.27960205078125, -15.984256744384766, -11.688911437988281, -7.393566131591797, -3.0982189178466797, 1.1971263885498047, 5.492471694946289, 9.787817001342773, 14.083162307739258, 18.378507614135742, 22.673852920532227, 26.96919822692871, 31.264543533325195]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 8.0, 12.0, 12.0, 10.0, 20.0, 24.0, 24.0, 28.0, 23.0, 37.0, 33.0, 52.0, 39.0, 58.0, 50.0, 56.0, 48.0, 36.0, 58.0, 47.0, 42.0, 30.0, 24.0, 32.0, 25.0, 22.0, 31.0, 15.0, 16.0, 17.0, 10.0, 15.0, 11.0, 6.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.22528839111328, -34.189964294433594, -33.15463638305664, -32.11931228637695, -31.083986282348633, -30.048660278320312, -29.013336181640625, -27.978010177612305, -26.942684173583984, -25.907358169555664, -24.872032165527344, -23.836708068847656, -22.801382064819336, -21.766056060791016, -20.730731964111328, -19.695405960083008, -18.660079956054688, -17.624753952026367, -16.589427947998047, -15.55410385131836, -14.518777847290039, -13.483451843261719, -12.448126792907715, -11.412801742553711, -10.37747573852539, -9.34214973449707, -8.306824684143066, -7.271499156951904, -6.236173629760742, -5.20084810256958, -4.165522575378418, -3.130197048187256, -2.0948734283447266, -1.0595479011535645, -0.024222373962402344, 1.0111031532287598, 2.046428680419922, 3.081754207611084, 4.117079734802246, 5.152405261993408, 6.18773078918457, 7.223056316375732, 8.258381843566895, 9.293706893920898, 10.329032897949219, 11.364358901977539, 12.399683952331543, 13.435009002685547, 14.470335006713867, 15.505661010742188, 16.540985107421875, 17.576311111450195, 18.611637115478516, 19.646963119506836, 20.682289123535156, 21.717613220214844, 22.752939224243164, 23.788265228271484, 24.823589324951172, 25.858915328979492, 26.894241333007812, 27.929567337036133, 28.964893341064453, 30.00021743774414, 31.03554344177246]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 12.0, 9.0, 8.0, 15.0, 9.0, 13.0, 16.0, 26.0, 22.0, 30.0, 18.0, 25.0, 34.0, 40.0, 37.0, 32.0, 37.0, 30.0, 43.0, 39.0, 31.0, 35.0, 42.0, 29.0, 40.0, 41.0, 30.0, 33.0, 33.0, 18.0, 26.0, 19.0, 19.0, 15.0, 15.0, 20.0, 11.0, 15.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.859375, -2.75811767578125, -2.6568603515625, -2.55560302734375, -2.454345703125, -2.35308837890625, -2.2518310546875, -2.15057373046875, -2.04931640625, -1.94805908203125, -1.8468017578125, -1.74554443359375, -1.644287109375, -1.54302978515625, -1.4417724609375, -1.34051513671875, -1.2392578125, -1.13800048828125, -1.0367431640625, -0.93548583984375, -0.834228515625, -0.73297119140625, -0.6317138671875, -0.53045654296875, -0.42919921875, -0.32794189453125, -0.2266845703125, -0.12542724609375, -0.024169921875, 0.07708740234375, 0.1783447265625, 0.27960205078125, 0.380859375, 0.48211669921875, 0.5833740234375, 0.68463134765625, 0.785888671875, 0.88714599609375, 0.9884033203125, 1.08966064453125, 1.19091796875, 1.29217529296875, 1.3934326171875, 1.49468994140625, 1.595947265625, 1.69720458984375, 1.7984619140625, 1.89971923828125, 2.0009765625, 2.10223388671875, 2.2034912109375, 2.30474853515625, 2.406005859375, 2.50726318359375, 2.6085205078125, 2.70977783203125, 2.81103515625, 2.91229248046875, 3.0135498046875, 3.11480712890625, 3.216064453125, 3.31732177734375, 3.4185791015625, 3.51983642578125, 3.62109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 8.0, 7.0, 14.0, 20.0, 35.0, 48.0, 80.0, 96.0, 132.0, 201.0, 278.0, 371.0, 549.0, 835.0, 1215.0, 1789.0, 2739.0, 4154.0, 6418.0, 10513.0, 17160.0, 30043.0, 57376.0, 119279.0, 302119.0, 263335.0, 106597.0, 52329.0, 27499.0, 15893.0, 9538.0, 6073.0, 3849.0, 2569.0, 1721.0, 1156.0, 760.0, 516.0, 387.0, 259.0, 195.0, 121.0, 88.0, 51.0, 51.0, 27.0, 24.0, 16.0, 12.0, 6.0, 8.0, 0.0, 1.0, 1.0, 3.0], "bins": [-11.140625, -10.812255859375, -10.48388671875, -10.155517578125, -9.8271484375, -9.498779296875, -9.17041015625, -8.842041015625, -8.513671875, -8.185302734375, -7.85693359375, -7.528564453125, -7.2001953125, -6.871826171875, -6.54345703125, -6.215087890625, -5.88671875, -5.558349609375, -5.22998046875, -4.901611328125, -4.5732421875, -4.244873046875, -3.91650390625, -3.588134765625, -3.259765625, -2.931396484375, -2.60302734375, -2.274658203125, -1.9462890625, -1.617919921875, -1.28955078125, -0.961181640625, -0.6328125, -0.304443359375, 0.02392578125, 0.352294921875, 0.6806640625, 1.009033203125, 1.33740234375, 1.665771484375, 1.994140625, 2.322509765625, 2.65087890625, 2.979248046875, 3.3076171875, 3.635986328125, 3.96435546875, 4.292724609375, 4.62109375, 4.949462890625, 5.27783203125, 5.606201171875, 5.9345703125, 6.262939453125, 6.59130859375, 6.919677734375, 7.248046875, 7.576416015625, 7.90478515625, 8.233154296875, 8.5615234375, 8.889892578125, 9.21826171875, 9.546630859375, 9.875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 7.0, 13.0, 15.0, 14.0, 9.0, 21.0, 26.0, 17.0, 21.0, 27.0, 28.0, 32.0, 26.0, 37.0, 38.0, 32.0, 36.0, 41.0, 1064.0, 44.0, 48.0, 39.0, 32.0, 40.0, 27.0, 30.0, 25.0, 32.0, 16.0, 16.0, 23.0, 20.0, 23.0, 14.0, 15.0, 16.0, 8.0, 5.0, 4.0, 6.0, 3.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.25, -3.1588134765625, -3.067626953125, -2.9764404296875, -2.88525390625, -2.7940673828125, -2.702880859375, -2.6116943359375, -2.5205078125, -2.4293212890625, -2.338134765625, -2.2469482421875, -2.15576171875, -2.0645751953125, -1.973388671875, -1.8822021484375, -1.791015625, -1.6998291015625, -1.608642578125, -1.5174560546875, -1.42626953125, -1.3350830078125, -1.243896484375, -1.1527099609375, -1.0615234375, -0.9703369140625, -0.879150390625, -0.7879638671875, -0.69677734375, -0.6055908203125, -0.514404296875, -0.4232177734375, -0.33203125, -0.2408447265625, -0.149658203125, -0.0584716796875, 0.03271484375, 0.1239013671875, 0.215087890625, 0.3062744140625, 0.3974609375, 0.4886474609375, 0.579833984375, 0.6710205078125, 0.76220703125, 0.8533935546875, 0.944580078125, 1.0357666015625, 1.126953125, 1.2181396484375, 1.309326171875, 1.4005126953125, 1.49169921875, 1.5828857421875, 1.674072265625, 1.7652587890625, 1.8564453125, 1.9476318359375, 2.038818359375, 2.1300048828125, 2.22119140625, 2.3123779296875, 2.403564453125, 2.4947509765625, 2.5859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 8.0, 5.0, 6.0, 5.0, 8.0, 12.0, 8.0, 13.0, 27.0, 29.0, 46.0, 81.0, 84.0, 109.0, 127.0, 177.0, 263.0, 349.0, 534.0, 823.0, 1364.0, 2230.0, 4004.0, 7885.0, 19202.0, 55212.0, 231071.0, 1425007.0, 251958.0, 57937.0, 19694.0, 8359.0, 4092.0, 2313.0, 1324.0, 840.0, 545.0, 362.0, 246.0, 168.0, 152.0, 120.0, 89.0, 66.0, 58.0, 28.0, 22.0, 19.0, 11.0, 14.0, 6.0, 9.0, 8.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0], "bins": [-10.8515625, -10.50732421875, -10.1630859375, -9.81884765625, -9.474609375, -9.13037109375, -8.7861328125, -8.44189453125, -8.09765625, -7.75341796875, -7.4091796875, -7.06494140625, -6.720703125, -6.37646484375, -6.0322265625, -5.68798828125, -5.34375, -4.99951171875, -4.6552734375, -4.31103515625, -3.966796875, -3.62255859375, -3.2783203125, -2.93408203125, -2.58984375, -2.24560546875, -1.9013671875, -1.55712890625, -1.212890625, -0.86865234375, -0.5244140625, -0.18017578125, 0.1640625, 0.50830078125, 0.8525390625, 1.19677734375, 1.541015625, 1.88525390625, 2.2294921875, 2.57373046875, 2.91796875, 3.26220703125, 3.6064453125, 3.95068359375, 4.294921875, 4.63916015625, 4.9833984375, 5.32763671875, 5.671875, 6.01611328125, 6.3603515625, 6.70458984375, 7.048828125, 7.39306640625, 7.7373046875, 8.08154296875, 8.42578125, 8.77001953125, 9.1142578125, 9.45849609375, 9.802734375, 10.14697265625, 10.4912109375, 10.83544921875, 11.1796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 13.0, 20.0, 29.0, 72.0, 157.0, 308.0, 242.0, 71.0, 39.0, 17.0, 11.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.83782958984375, -4.6326904296875, -4.42755126953125, -4.222412109375, -4.01727294921875, -3.8121337890625, -3.60699462890625, -3.40185546875, -3.19671630859375, -2.9915771484375, -2.78643798828125, -2.581298828125, -2.37615966796875, -2.1710205078125, -1.96588134765625, -1.7607421875, -1.55560302734375, -1.3504638671875, -1.14532470703125, -0.940185546875, -0.73504638671875, -0.5299072265625, -0.32476806640625, -0.11962890625, 0.08551025390625, 0.2906494140625, 0.49578857421875, 0.700927734375, 0.90606689453125, 1.1112060546875, 1.31634521484375, 1.521484375, 1.72662353515625, 1.9317626953125, 2.13690185546875, 2.342041015625, 2.54718017578125, 2.7523193359375, 2.95745849609375, 3.16259765625, 3.36773681640625, 3.5728759765625, 3.77801513671875, 3.983154296875, 4.18829345703125, 4.3934326171875, 4.59857177734375, 4.8037109375, 5.00885009765625, 5.2139892578125, 5.41912841796875, 5.624267578125, 5.82940673828125, 6.0345458984375, 6.23968505859375, 6.44482421875, 6.64996337890625, 6.8551025390625, 7.06024169921875, 7.265380859375, 7.47052001953125, 7.6756591796875, 7.88079833984375, 8.0859375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 2.0, 13.0, 7.0, 17.0, 29.0, 47.0, 153.0, 480.0, 2813.0, 948675.0, 93903.0, 1816.0, 321.0, 124.0, 58.0, 35.0, 22.0, 6.0, 4.0, 5.0, 10.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.8125, -103.8369140625, -100.861328125, -97.8857421875, -94.91015625, -91.9345703125, -88.958984375, -85.9833984375, -83.0078125, -80.0322265625, -77.056640625, -74.0810546875, -71.10546875, -68.1298828125, -65.154296875, -62.1787109375, -59.203125, -56.2275390625, -53.251953125, -50.2763671875, -47.30078125, -44.3251953125, -41.349609375, -38.3740234375, -35.3984375, -32.4228515625, -29.447265625, -26.4716796875, -23.49609375, -20.5205078125, -17.544921875, -14.5693359375, -11.59375, -8.6181640625, -5.642578125, -2.6669921875, 0.30859375, 3.2841796875, 6.259765625, 9.2353515625, 12.2109375, 15.1865234375, 18.162109375, 21.1376953125, 24.11328125, 27.0888671875, 30.064453125, 33.0400390625, 36.015625, 38.9912109375, 41.966796875, 44.9423828125, 47.91796875, 50.8935546875, 53.869140625, 56.8447265625, 59.8203125, 62.7958984375, 65.771484375, 68.7470703125, 71.72265625, 74.6982421875, 77.673828125, 80.6494140625, 83.625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 8.0, 39.0, 85.0, 236.0, 354.0, 195.0, 57.0, 19.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.473761558532715, -15.05947494506836, -14.645188331604004, -14.230902671813965, -13.81661605834961, -13.402329444885254, -12.988042831420898, -12.57375717163086, -12.159470558166504, -11.745183944702148, -11.330897331237793, -10.916611671447754, -10.502325057983398, -10.088038444519043, -9.673751831054688, -9.259466171264648, -8.845178604125977, -8.430891990661621, -8.016605377197266, -7.602319240570068, -7.188033103942871, -6.773746490478516, -6.35945987701416, -5.945173740386963, -5.530887603759766, -5.11660099029541, -4.702314853668213, -4.288028240203857, -3.87374210357666, -3.4594554901123047, -3.0451691150665283, -2.630882740020752, -2.2165966033935547, -1.8023102283477783, -1.388023853302002, -0.973737359046936, -0.5594509840011597, -0.14516448974609375, 0.2691218852996826, 0.683408260345459, 1.0976946353912354, 1.5119810104370117, 1.926267385482788, 2.3405537605285645, 2.75484037399292, 3.1691267490386963, 3.5834131240844727, 3.997699499130249, 4.411985874176025, 4.826272487640381, 5.240558624267578, 5.654845237731934, 6.069131374359131, 6.483417987823486, 6.897704124450684, 7.311990737915039, 7.7262773513793945, 8.14056396484375, 8.554850578308105, 8.969136238098145, 9.3834228515625, 9.797709465026855, 10.211996078491211, 10.62628173828125, 11.040568351745605]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 11.0, 3.0, 9.0, 11.0, 17.0, 16.0, 27.0, 14.0, 24.0, 32.0, 30.0, 33.0, 38.0, 31.0, 34.0, 33.0, 43.0, 51.0, 49.0, 38.0, 45.0, 33.0, 34.0, 37.0, 37.0, 39.0, 22.0, 39.0, 30.0, 15.0, 27.0, 17.0, 11.0, 22.0, 9.0, 9.0, 5.0, 5.0, 2.0, 7.0, 3.0, 7.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9819717407226562, -2.8878679275512695, -2.793764114379883, -2.699660301208496, -2.6055564880371094, -2.5114526748657227, -2.417348861694336, -2.323245048522949, -2.2291412353515625, -2.135037422180176, -2.040933609008789, -1.9468297958374023, -1.8527259826660156, -1.758622169494629, -1.6645184755325317, -1.570414662361145, -1.4763109683990479, -1.3822071552276611, -1.2881033420562744, -1.1939995288848877, -1.099895715713501, -1.0057919025421143, -0.9116882085800171, -0.8175843954086304, -0.7234805822372437, -0.6293767690658569, -0.5352729558944702, -0.44116920232772827, -0.34706538915634155, -0.25296157598495483, -0.1588578224182129, -0.06475400924682617, 0.029349803924560547, 0.12345360219478607, 0.2175574004650116, 0.3116611838340759, 0.40576499700546265, 0.49986881017684937, 0.5939725637435913, 0.688076376914978, 0.7821801900863647, 0.8762840032577515, 0.9703878164291382, 1.0644915103912354, 1.158595323562622, 1.2526991367340088, 1.3468029499053955, 1.4409067630767822, 1.535010576248169, 1.6291143894195557, 1.7232182025909424, 1.817322015762329, 1.9114258289337158, 2.0055296421051025, 2.09963321685791, 2.193737030029297, 2.2878408432006836, 2.3819446563720703, 2.476048469543457, 2.5701522827148438, 2.6642560958862305, 2.758359909057617, 2.852463722229004, 2.9465675354003906, 3.0406713485717773]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 8.0, 15.0, 10.0, 9.0, 16.0, 11.0, 17.0, 24.0, 22.0, 29.0, 35.0, 22.0, 33.0, 32.0, 38.0, 36.0, 40.0, 34.0, 40.0, 46.0, 34.0, 47.0, 39.0, 37.0, 41.0, 27.0, 31.0, 26.0, 28.0, 16.0, 25.0, 24.0, 18.0, 24.0, 12.0, 15.0, 11.0, 5.0, 3.0, 10.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.111328125, -3.0052490234375, -2.899169921875, -2.7930908203125, -2.68701171875, -2.5809326171875, -2.474853515625, -2.3687744140625, -2.2626953125, -2.1566162109375, -2.050537109375, -1.9444580078125, -1.83837890625, -1.7322998046875, -1.626220703125, -1.5201416015625, -1.4140625, -1.3079833984375, -1.201904296875, -1.0958251953125, -0.98974609375, -0.8836669921875, -0.777587890625, -0.6715087890625, -0.5654296875, -0.4593505859375, -0.353271484375, -0.2471923828125, -0.14111328125, -0.0350341796875, 0.071044921875, 0.1771240234375, 0.283203125, 0.3892822265625, 0.495361328125, 0.6014404296875, 0.70751953125, 0.8135986328125, 0.919677734375, 1.0257568359375, 1.1318359375, 1.2379150390625, 1.343994140625, 1.4500732421875, 1.55615234375, 1.6622314453125, 1.768310546875, 1.8743896484375, 1.98046875, 2.0865478515625, 2.192626953125, 2.2987060546875, 2.40478515625, 2.5108642578125, 2.616943359375, 2.7230224609375, 2.8291015625, 2.9351806640625, 3.041259765625, 3.1473388671875, 3.25341796875, 3.3594970703125, 3.465576171875, 3.5716552734375, 3.677734375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 12.0, 27.0, 18.0, 40.0, 44.0, 74.0, 104.0, 157.0, 217.0, 291.0, 453.0, 643.0, 914.0, 1444.0, 2174.0, 3458.0, 5788.0, 9845.0, 17214.0, 33556.0, 74401.0, 201003.0, 394844.0, 167878.0, 64694.0, 29810.0, 15617.0, 8913.0, 5317.0, 3301.0, 2114.0, 1333.0, 857.0, 613.0, 412.0, 298.0, 210.0, 136.0, 93.0, 63.0, 59.0, 28.0, 29.0, 19.0, 12.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.16015625, -5.0009765625, -4.841796875, -4.6826171875, -4.5234375, -4.3642578125, -4.205078125, -4.0458984375, -3.88671875, -3.7275390625, -3.568359375, -3.4091796875, -3.25, -3.0908203125, -2.931640625, -2.7724609375, -2.61328125, -2.4541015625, -2.294921875, -2.1357421875, -1.9765625, -1.8173828125, -1.658203125, -1.4990234375, -1.33984375, -1.1806640625, -1.021484375, -0.8623046875, -0.703125, -0.5439453125, -0.384765625, -0.2255859375, -0.06640625, 0.0927734375, 0.251953125, 0.4111328125, 0.5703125, 0.7294921875, 0.888671875, 1.0478515625, 1.20703125, 1.3662109375, 1.525390625, 1.6845703125, 1.84375, 2.0029296875, 2.162109375, 2.3212890625, 2.48046875, 2.6396484375, 2.798828125, 2.9580078125, 3.1171875, 3.2763671875, 3.435546875, 3.5947265625, 3.75390625, 3.9130859375, 4.072265625, 4.2314453125, 4.390625, 4.5498046875, 4.708984375, 4.8681640625, 5.02734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 11.0, 13.0, 10.0, 14.0, 12.0, 15.0, 20.0, 28.0, 24.0, 30.0, 37.0, 34.0, 44.0, 61.0, 78.0, 128.0, 221.0, 1423.0, 256.0, 120.0, 75.0, 54.0, 32.0, 39.0, 45.0, 39.0, 26.0, 22.0, 15.0, 28.0, 13.0, 16.0, 15.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1953125, -11.7830810546875, -11.370849609375, -10.9586181640625, -10.54638671875, -10.1341552734375, -9.721923828125, -9.3096923828125, -8.8974609375, -8.4852294921875, -8.072998046875, -7.6607666015625, -7.24853515625, -6.8363037109375, -6.424072265625, -6.0118408203125, -5.599609375, -5.1873779296875, -4.775146484375, -4.3629150390625, -3.95068359375, -3.5384521484375, -3.126220703125, -2.7139892578125, -2.3017578125, -1.8895263671875, -1.477294921875, -1.0650634765625, -0.65283203125, -0.2406005859375, 0.171630859375, 0.5838623046875, 0.99609375, 1.4083251953125, 1.820556640625, 2.2327880859375, 2.64501953125, 3.0572509765625, 3.469482421875, 3.8817138671875, 4.2939453125, 4.7061767578125, 5.118408203125, 5.5306396484375, 5.94287109375, 6.3551025390625, 6.767333984375, 7.1795654296875, 7.591796875, 8.0040283203125, 8.416259765625, 8.8284912109375, 9.24072265625, 9.6529541015625, 10.065185546875, 10.4774169921875, 10.8896484375, 11.3018798828125, 11.714111328125, 12.1263427734375, 12.53857421875, 12.9508056640625, 13.363037109375, 13.7752685546875, 14.1875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 6.0, 2.0, 9.0, 12.0, 17.0, 21.0, 27.0, 17.0, 35.0, 50.0, 53.0, 68.0, 76.0, 133.0, 208.0, 384.0, 963.0, 3663.0, 22458.0, 523908.0, 2527567.0, 56234.0, 6813.0, 1597.0, 565.0, 234.0, 155.0, 114.0, 69.0, 46.0, 42.0, 25.0, 30.0, 19.0, 19.0, 17.0, 11.0, 5.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.703125, -22.966796875, -22.23046875, -21.494140625, -20.7578125, -20.021484375, -19.28515625, -18.548828125, -17.8125, -17.076171875, -16.33984375, -15.603515625, -14.8671875, -14.130859375, -13.39453125, -12.658203125, -11.921875, -11.185546875, -10.44921875, -9.712890625, -8.9765625, -8.240234375, -7.50390625, -6.767578125, -6.03125, -5.294921875, -4.55859375, -3.822265625, -3.0859375, -2.349609375, -1.61328125, -0.876953125, -0.140625, 0.595703125, 1.33203125, 2.068359375, 2.8046875, 3.541015625, 4.27734375, 5.013671875, 5.75, 6.486328125, 7.22265625, 7.958984375, 8.6953125, 9.431640625, 10.16796875, 10.904296875, 11.640625, 12.376953125, 13.11328125, 13.849609375, 14.5859375, 15.322265625, 16.05859375, 16.794921875, 17.53125, 18.267578125, 19.00390625, 19.740234375, 20.4765625, 21.212890625, 21.94921875, 22.685546875, 23.421875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 12.0, 339.0, 618.0, 47.0, 1.0, 2.0, 0.0, 1.0], "bins": [-389.95233154296875, -383.2428283691406, -376.5333251953125, -369.8238220214844, -363.11431884765625, -356.40478515625, -349.6952819824219, -342.98577880859375, -336.2762756347656, -329.5667724609375, -322.8572692871094, -316.14776611328125, -309.438232421875, -302.7287292480469, -296.01922607421875, -289.3097229003906, -282.6002197265625, -275.8907165527344, -269.18121337890625, -262.4717102050781, -255.76219177246094, -249.0526885986328, -242.34317016601562, -235.6336669921875, -228.92416381835938, -222.21466064453125, -215.50515747070312, -208.79563903808594, -202.0861358642578, -195.3766326904297, -188.6671142578125, -181.95761108398438, -175.24810791015625, -168.53860473632812, -161.8291015625, -155.1195831298828, -148.4100799560547, -141.70057678222656, -134.99105834960938, -128.28155517578125, -121.5720443725586, -114.86253356933594, -108.15303039550781, -101.44352722167969, -94.73401641845703, -88.02450561523438, -81.31500244140625, -74.60549926757812, -67.89598846435547, -61.18648147583008, -54.47697448730469, -47.7674674987793, -41.057960510253906, -34.348453521728516, -27.638946533203125, -20.929439544677734, -14.219932556152344, -7.510425567626953, -0.8009185791015625, 5.908588409423828, 12.618095397949219, 19.32760238647461, 26.037109375, 32.74661636352539, 39.45612335205078]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 6.0, 11.0, 14.0, 8.0, 12.0, 10.0, 18.0, 30.0, 23.0, 22.0, 20.0, 40.0, 44.0, 36.0, 47.0, 35.0, 36.0, 50.0, 43.0, 38.0, 31.0, 44.0, 44.0, 34.0, 31.0, 30.0, 27.0, 23.0, 35.0, 21.0, 14.0, 21.0, 12.0, 11.0, 16.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 1.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.50245666503906, -32.43413543701172, -31.365814208984375, -30.29749298095703, -29.229171752929688, -28.160850524902344, -27.092529296875, -26.024208068847656, -24.955886840820312, -23.88756561279297, -22.819244384765625, -21.75092315673828, -20.682601928710938, -19.614280700683594, -18.54595947265625, -17.477638244628906, -16.409317016601562, -15.340995788574219, -14.272674560546875, -13.204353332519531, -12.136032104492188, -11.067710876464844, -9.9993896484375, -8.931068420410156, -7.8627471923828125, -6.794425964355469, -5.726104736328125, -4.657783508300781, -3.5894622802734375, -2.5211410522460938, -1.45281982421875, -0.38449859619140625, 0.6838264465332031, 1.7521476745605469, 2.8204689025878906, 3.8887901306152344, 4.957111358642578, 6.025432586669922, 7.093753814697266, 8.16207504272461, 9.230396270751953, 10.298717498779297, 11.36703872680664, 12.435359954833984, 13.503681182861328, 14.572002410888672, 15.640323638916016, 16.70864486694336, 17.776966094970703, 18.845287322998047, 19.91360855102539, 20.981929779052734, 22.050251007080078, 23.118572235107422, 24.186893463134766, 25.25521469116211, 26.323535919189453, 27.391857147216797, 28.46017837524414, 29.528499603271484, 30.596820831298828, 31.665142059326172, 32.733463287353516, 33.80178451538086, 34.8701057434082]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 3.0, 6.0, 11.0, 7.0, 11.0, 19.0, 18.0, 21.0, 22.0, 31.0, 37.0, 33.0, 38.0, 40.0, 36.0, 42.0, 39.0, 34.0, 34.0, 37.0, 45.0, 30.0, 37.0, 33.0, 39.0, 40.0, 37.0, 23.0, 31.0, 28.0, 19.0, 20.0, 15.0, 9.0, 12.0, 14.0, 9.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.332733154296875, -3.22015380859375, -3.107574462890625, -2.9949951171875, -2.882415771484375, -2.76983642578125, -2.657257080078125, -2.544677734375, -2.432098388671875, -2.31951904296875, -2.206939697265625, -2.0943603515625, -1.981781005859375, -1.86920166015625, -1.756622314453125, -1.64404296875, -1.531463623046875, -1.41888427734375, -1.306304931640625, -1.1937255859375, -1.081146240234375, -0.96856689453125, -0.855987548828125, -0.743408203125, -0.630828857421875, -0.51824951171875, -0.405670166015625, -0.2930908203125, -0.180511474609375, -0.06793212890625, 0.044647216796875, 0.1572265625, 0.269805908203125, 0.38238525390625, 0.494964599609375, 0.6075439453125, 0.720123291015625, 0.83270263671875, 0.945281982421875, 1.057861328125, 1.170440673828125, 1.28302001953125, 1.395599365234375, 1.5081787109375, 1.620758056640625, 1.73333740234375, 1.845916748046875, 1.95849609375, 2.071075439453125, 2.18365478515625, 2.296234130859375, 2.4088134765625, 2.521392822265625, 2.63397216796875, 2.746551513671875, 2.859130859375, 2.971710205078125, 3.08428955078125, 3.196868896484375, 3.3094482421875, 3.422027587890625, 3.53460693359375, 3.647186279296875, 3.759765625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 10.0, 22.0, 12.0, 18.0, 42.0, 40.0, 59.0, 103.0, 172.0, 235.0, 382.0, 609.0, 1083.0, 1904.0, 3416.0, 6101.0, 12230.0, 25285.0, 59412.0, 192945.0, 1046071.0, 2114787.0, 532551.0, 114054.0, 42112.0, 19155.0, 9541.0, 5180.0, 2797.0, 1641.0, 946.0, 505.0, 329.0, 201.0, 93.0, 78.0, 42.0, 35.0, 28.0, 11.0, 14.0, 3.0, 9.0, 5.0, 5.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-6.3828125, -6.1650390625, -5.947265625, -5.7294921875, -5.51171875, -5.2939453125, -5.076171875, -4.8583984375, -4.640625, -4.4228515625, -4.205078125, -3.9873046875, -3.76953125, -3.5517578125, -3.333984375, -3.1162109375, -2.8984375, -2.6806640625, -2.462890625, -2.2451171875, -2.02734375, -1.8095703125, -1.591796875, -1.3740234375, -1.15625, -0.9384765625, -0.720703125, -0.5029296875, -0.28515625, -0.0673828125, 0.150390625, 0.3681640625, 0.5859375, 0.8037109375, 1.021484375, 1.2392578125, 1.45703125, 1.6748046875, 1.892578125, 2.1103515625, 2.328125, 2.5458984375, 2.763671875, 2.9814453125, 3.19921875, 3.4169921875, 3.634765625, 3.8525390625, 4.0703125, 4.2880859375, 4.505859375, 4.7236328125, 4.94140625, 5.1591796875, 5.376953125, 5.5947265625, 5.8125, 6.0302734375, 6.248046875, 6.4658203125, 6.68359375, 6.9013671875, 7.119140625, 7.3369140625, 7.5546875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 11.0, 4.0, 13.0, 22.0, 27.0, 35.0, 43.0, 56.0, 67.0, 95.0, 125.0, 165.0, 230.0, 341.0, 478.0, 602.0, 521.0, 361.0, 244.0, 182.0, 106.0, 92.0, 78.0, 35.0, 32.0, 23.0, 20.0, 14.0, 11.0, 7.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6953125, -10.4022216796875, -10.109130859375, -9.8160400390625, -9.52294921875, -9.2298583984375, -8.936767578125, -8.6436767578125, -8.3505859375, -8.0574951171875, -7.764404296875, -7.4713134765625, -7.17822265625, -6.8851318359375, -6.592041015625, -6.2989501953125, -6.005859375, -5.7127685546875, -5.419677734375, -5.1265869140625, -4.83349609375, -4.5404052734375, -4.247314453125, -3.9542236328125, -3.6611328125, -3.3680419921875, -3.074951171875, -2.7818603515625, -2.48876953125, -2.1956787109375, -1.902587890625, -1.6094970703125, -1.31640625, -1.0233154296875, -0.730224609375, -0.4371337890625, -0.14404296875, 0.1490478515625, 0.442138671875, 0.7352294921875, 1.0283203125, 1.3214111328125, 1.614501953125, 1.9075927734375, 2.20068359375, 2.4937744140625, 2.786865234375, 3.0799560546875, 3.373046875, 3.6661376953125, 3.959228515625, 4.2523193359375, 4.54541015625, 4.8385009765625, 5.131591796875, 5.4246826171875, 5.7177734375, 6.0108642578125, 6.303955078125, 6.5970458984375, 6.89013671875, 7.1832275390625, 7.476318359375, 7.7694091796875, 8.0625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 2.0, 16.0, 17.0, 16.0, 16.0, 34.0, 56.0, 105.0, 173.0, 414.0, 929.0, 2638.0, 9042.0, 39863.0, 269572.0, 2938475.0, 824059.0, 85224.0, 16514.0, 4437.0, 1463.0, 554.0, 244.0, 141.0, 83.0, 46.0, 38.0, 31.0, 13.0, 15.0, 8.0, 11.0, 5.0, 8.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6875, -15.100341796875, -14.51318359375, -13.926025390625, -13.3388671875, -12.751708984375, -12.16455078125, -11.577392578125, -10.990234375, -10.403076171875, -9.81591796875, -9.228759765625, -8.6416015625, -8.054443359375, -7.46728515625, -6.880126953125, -6.29296875, -5.705810546875, -5.11865234375, -4.531494140625, -3.9443359375, -3.357177734375, -2.77001953125, -2.182861328125, -1.595703125, -1.008544921875, -0.42138671875, 0.165771484375, 0.7529296875, 1.340087890625, 1.92724609375, 2.514404296875, 3.1015625, 3.688720703125, 4.27587890625, 4.863037109375, 5.4501953125, 6.037353515625, 6.62451171875, 7.211669921875, 7.798828125, 8.385986328125, 8.97314453125, 9.560302734375, 10.1474609375, 10.734619140625, 11.32177734375, 11.908935546875, 12.49609375, 13.083251953125, 13.67041015625, 14.257568359375, 14.8447265625, 15.431884765625, 16.01904296875, 16.606201171875, 17.193359375, 17.780517578125, 18.36767578125, 18.954833984375, 19.5419921875, 20.129150390625, 20.71630859375, 21.303466796875, 21.890625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 27.0, 56.0, 121.0, 194.0, 223.0, 197.0, 115.0, 46.0, 11.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.23078918457031, -62.85179138183594, -59.47279739379883, -56.09380340576172, -52.714805603027344, -49.33580780029297, -45.95681381225586, -42.57781982421875, -39.198822021484375, -35.81982421875, -32.44083023071289, -29.06183433532715, -25.682838439941406, -22.303842544555664, -18.924846649169922, -15.54585075378418, -12.166854858398438, -8.787858963012695, -5.408863067626953, -2.029867172241211, 1.3491287231445312, 4.728124618530273, 8.107120513916016, 11.486116409301758, 14.8651123046875, 18.244108200073242, 21.623104095458984, 25.002099990844727, 28.38109588623047, 31.76009178161621, 35.13908767700195, 38.51808166503906, 41.89707946777344, 45.27607727050781, 48.65507125854492, 52.03406524658203, 55.413063049316406, 58.79206085205078, 62.17105484008789, 65.550048828125, 68.92904663085938, 72.30804443359375, 75.68704223632812, 79.06603240966797, 82.44503021240234, 85.82402801513672, 89.20301818847656, 92.58201599121094, 95.96101379394531, 99.34001159667969, 102.71900939941406, 106.0979995727539, 109.47699737548828, 112.85599517822266, 116.2349853515625, 119.61398315429688, 122.99298095703125, 126.37197875976562, 129.7509765625, 133.12997436523438, 136.50897216796875, 139.88795471191406, 143.26695251464844, 146.6459503173828, 150.0249481201172]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 3.0, 9.0, 10.0, 17.0, 15.0, 13.0, 21.0, 24.0, 25.0, 22.0, 25.0, 33.0, 37.0, 33.0, 50.0, 41.0, 54.0, 43.0, 35.0, 43.0, 45.0, 33.0, 29.0, 32.0, 33.0, 38.0, 33.0, 32.0, 27.0, 20.0, 16.0, 18.0, 13.0, 18.0, 10.0, 12.0, 3.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.91424560546875, -28.92262840270996, -27.931011199951172, -26.939395904541016, -25.947778701782227, -24.956161499023438, -23.96454429626465, -22.97292709350586, -21.981311798095703, -20.989694595336914, -19.998077392578125, -19.00646209716797, -18.01484489440918, -17.02322769165039, -16.0316104888916, -15.039993286132812, -14.048376083374023, -13.056758880615234, -12.065142631530762, -11.073525428771973, -10.0819091796875, -9.090291976928711, -8.098674774169922, -7.107058048248291, -6.11544132232666, -5.123824596405029, -4.132207870483398, -3.1405906677246094, -2.1489739418029785, -1.1573572158813477, -0.1657400131225586, 0.8258767127990723, 1.8174934387207031, 2.809110164642334, 3.800727128982544, 4.792344093322754, 5.783960819244385, 6.775577545166016, 7.767194747924805, 8.758811950683594, 9.750428199768066, 10.742045402526855, 11.733661651611328, 12.725278854370117, 13.716896057128906, 14.708512306213379, 15.700129508972168, 16.69174575805664, 17.68336296081543, 18.67498016357422, 19.666597366333008, 20.658214569091797, 21.649829864501953, 22.641447067260742, 23.63306427001953, 24.62468147277832, 25.61629867553711, 26.6079158782959, 27.599533081054688, 28.591148376464844, 29.582765579223633, 30.574382781982422, 31.56599998474121, 32.5576171875, 33.549232482910156]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 12.0, 16.0, 14.0, 29.0, 14.0, 18.0, 19.0, 23.0, 22.0, 27.0, 32.0, 36.0, 41.0, 40.0, 36.0, 36.0, 32.0, 40.0, 50.0, 38.0, 54.0, 35.0, 26.0, 36.0, 39.0, 25.0, 23.0, 18.0, 27.0, 19.0, 17.0, 23.0, 20.0, 17.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.494140625, -3.381317138671875, -3.26849365234375, -3.155670166015625, -3.0428466796875, -2.930023193359375, -2.81719970703125, -2.704376220703125, -2.591552734375, -2.478729248046875, -2.36590576171875, -2.253082275390625, -2.1402587890625, -2.027435302734375, -1.91461181640625, -1.801788330078125, -1.68896484375, -1.576141357421875, -1.46331787109375, -1.350494384765625, -1.2376708984375, -1.124847412109375, -1.01202392578125, -0.899200439453125, -0.786376953125, -0.673553466796875, -0.56072998046875, -0.447906494140625, -0.3350830078125, -0.222259521484375, -0.10943603515625, 0.003387451171875, 0.1162109375, 0.229034423828125, 0.34185791015625, 0.454681396484375, 0.5675048828125, 0.680328369140625, 0.79315185546875, 0.905975341796875, 1.018798828125, 1.131622314453125, 1.24444580078125, 1.357269287109375, 1.4700927734375, 1.582916259765625, 1.69573974609375, 1.808563232421875, 1.92138671875, 2.034210205078125, 2.14703369140625, 2.259857177734375, 2.3726806640625, 2.485504150390625, 2.59832763671875, 2.711151123046875, 2.823974609375, 2.936798095703125, 3.04962158203125, 3.162445068359375, 3.2752685546875, 3.388092041015625, 3.50091552734375, 3.613739013671875, 3.7265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 4.0, 8.0, 17.0, 24.0, 34.0, 64.0, 92.0, 138.0, 255.0, 443.0, 763.0, 1382.0, 2391.0, 4472.0, 8087.0, 14767.0, 27661.0, 54602.0, 124122.0, 533664.0, 147109.0, 61365.0, 30923.0, 16183.0, 8864.0, 4869.0, 2727.0, 1538.0, 863.0, 476.0, 249.0, 154.0, 82.0, 50.0, 32.0, 24.0, 16.0, 19.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2265625, -13.8028564453125, -13.379150390625, -12.9554443359375, -12.53173828125, -12.1080322265625, -11.684326171875, -11.2606201171875, -10.8369140625, -10.4132080078125, -9.989501953125, -9.5657958984375, -9.14208984375, -8.7183837890625, -8.294677734375, -7.8709716796875, -7.447265625, -7.0235595703125, -6.599853515625, -6.1761474609375, -5.75244140625, -5.3287353515625, -4.905029296875, -4.4813232421875, -4.0576171875, -3.6339111328125, -3.210205078125, -2.7864990234375, -2.36279296875, -1.9390869140625, -1.515380859375, -1.0916748046875, -0.66796875, -0.2442626953125, 0.179443359375, 0.6031494140625, 1.02685546875, 1.4505615234375, 1.874267578125, 2.2979736328125, 2.7216796875, 3.1453857421875, 3.569091796875, 3.9927978515625, 4.41650390625, 4.8402099609375, 5.263916015625, 5.6876220703125, 6.111328125, 6.5350341796875, 6.958740234375, 7.3824462890625, 7.80615234375, 8.2298583984375, 8.653564453125, 9.0772705078125, 9.5009765625, 9.9246826171875, 10.348388671875, 10.7720947265625, 11.19580078125, 11.6195068359375, 12.043212890625, 12.4669189453125, 12.890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 6.0, 12.0, 17.0, 13.0, 23.0, 26.0, 34.0, 38.0, 35.0, 29.0, 52.0, 47.0, 44.0, 48.0, 1074.0, 41.0, 48.0, 51.0, 49.0, 42.0, 39.0, 31.0, 32.0, 35.0, 32.0, 24.0, 16.0, 11.0, 12.0, 14.0, 8.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.518798828125, -3.40478515625, -3.290771484375, -3.1767578125, -3.062744140625, -2.94873046875, -2.834716796875, -2.720703125, -2.606689453125, -2.49267578125, -2.378662109375, -2.2646484375, -2.150634765625, -2.03662109375, -1.922607421875, -1.80859375, -1.694580078125, -1.58056640625, -1.466552734375, -1.3525390625, -1.238525390625, -1.12451171875, -1.010498046875, -0.896484375, -0.782470703125, -0.66845703125, -0.554443359375, -0.4404296875, -0.326416015625, -0.21240234375, -0.098388671875, 0.015625, 0.129638671875, 0.24365234375, 0.357666015625, 0.4716796875, 0.585693359375, 0.69970703125, 0.813720703125, 0.927734375, 1.041748046875, 1.15576171875, 1.269775390625, 1.3837890625, 1.497802734375, 1.61181640625, 1.725830078125, 1.83984375, 1.953857421875, 2.06787109375, 2.181884765625, 2.2958984375, 2.409912109375, 2.52392578125, 2.637939453125, 2.751953125, 2.865966796875, 2.97998046875, 3.093994140625, 3.2080078125, 3.322021484375, 3.43603515625, 3.550048828125, 3.6640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 12.0, 16.0, 21.0, 27.0, 41.0, 70.0, 78.0, 106.0, 196.0, 260.0, 389.0, 562.0, 916.0, 1442.0, 2692.0, 5091.0, 10731.0, 27450.0, 88188.0, 988653.0, 835439.0, 85334.0, 27052.0, 10612.0, 4966.0, 2597.0, 1488.0, 877.0, 579.0, 376.0, 261.0, 196.0, 122.0, 70.0, 66.0, 38.0, 32.0, 26.0, 12.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.8671875, -12.4649658203125, -12.062744140625, -11.6605224609375, -11.25830078125, -10.8560791015625, -10.453857421875, -10.0516357421875, -9.6494140625, -9.2471923828125, -8.844970703125, -8.4427490234375, -8.04052734375, -7.6383056640625, -7.236083984375, -6.8338623046875, -6.431640625, -6.0294189453125, -5.627197265625, -5.2249755859375, -4.82275390625, -4.4205322265625, -4.018310546875, -3.6160888671875, -3.2138671875, -2.8116455078125, -2.409423828125, -2.0072021484375, -1.60498046875, -1.2027587890625, -0.800537109375, -0.3983154296875, 0.00390625, 0.4061279296875, 0.808349609375, 1.2105712890625, 1.61279296875, 2.0150146484375, 2.417236328125, 2.8194580078125, 3.2216796875, 3.6239013671875, 4.026123046875, 4.4283447265625, 4.83056640625, 5.2327880859375, 5.635009765625, 6.0372314453125, 6.439453125, 6.8416748046875, 7.243896484375, 7.6461181640625, 8.04833984375, 8.4505615234375, 8.852783203125, 9.2550048828125, 9.6572265625, 10.0594482421875, 10.461669921875, 10.8638916015625, 11.26611328125, 11.6683349609375, 12.070556640625, 12.4727783203125, 12.875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 11.0, 12.0, 13.0, 19.0, 21.0, 30.0, 39.0, 63.0, 205.0, 300.0, 72.0, 50.0, 29.0, 20.0, 19.0, 15.0, 19.0, 11.0, 9.0, 6.0, 6.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.813201904296875, -3.69085693359375, -3.568511962890625, -3.4461669921875, -3.323822021484375, -3.20147705078125, -3.079132080078125, -2.956787109375, -2.834442138671875, -2.71209716796875, -2.589752197265625, -2.4674072265625, -2.345062255859375, -2.22271728515625, -2.100372314453125, -1.97802734375, -1.855682373046875, -1.73333740234375, -1.610992431640625, -1.4886474609375, -1.366302490234375, -1.24395751953125, -1.121612548828125, -0.999267578125, -0.876922607421875, -0.75457763671875, -0.632232666015625, -0.5098876953125, -0.387542724609375, -0.26519775390625, -0.142852783203125, -0.0205078125, 0.101837158203125, 0.22418212890625, 0.346527099609375, 0.4688720703125, 0.591217041015625, 0.71356201171875, 0.835906982421875, 0.958251953125, 1.080596923828125, 1.20294189453125, 1.325286865234375, 1.4476318359375, 1.569976806640625, 1.69232177734375, 1.814666748046875, 1.93701171875, 2.059356689453125, 2.18170166015625, 2.304046630859375, 2.4263916015625, 2.548736572265625, 2.67108154296875, 2.793426513671875, 2.915771484375, 3.038116455078125, 3.16046142578125, 3.282806396484375, 3.4051513671875, 3.527496337890625, 3.64984130859375, 3.772186279296875, 3.89453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 5.0, 4.0, 7.0, 6.0, 9.0, 16.0, 20.0, 23.0, 35.0, 41.0, 55.0, 71.0, 168.0, 406.0, 1654.0, 11082.0, 927263.0, 101055.0, 4939.0, 987.0, 276.0, 124.0, 82.0, 55.0, 41.0, 23.0, 27.0, 23.0, 14.0, 5.0, 9.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.6357421875, -50.927734375, -49.2197265625, -47.51171875, -45.8037109375, -44.095703125, -42.3876953125, -40.6796875, -38.9716796875, -37.263671875, -35.5556640625, -33.84765625, -32.1396484375, -30.431640625, -28.7236328125, -27.015625, -25.3076171875, -23.599609375, -21.8916015625, -20.18359375, -18.4755859375, -16.767578125, -15.0595703125, -13.3515625, -11.6435546875, -9.935546875, -8.2275390625, -6.51953125, -4.8115234375, -3.103515625, -1.3955078125, 0.3125, 2.0205078125, 3.728515625, 5.4365234375, 7.14453125, 8.8525390625, 10.560546875, 12.2685546875, 13.9765625, 15.6845703125, 17.392578125, 19.1005859375, 20.80859375, 22.5166015625, 24.224609375, 25.9326171875, 27.640625, 29.3486328125, 31.056640625, 32.7646484375, 34.47265625, 36.1806640625, 37.888671875, 39.5966796875, 41.3046875, 43.0126953125, 44.720703125, 46.4287109375, 48.13671875, 49.8447265625, 51.552734375, 53.2607421875, 54.96875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 10.0, 17.0, 56.0, 102.0, 194.0, 259.0, 179.0, 81.0, 35.0, 30.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.776590347290039, -6.459705352783203, -6.142820835113525, -5.825936317443848, -5.509051322937012, -5.192166328430176, -4.875281810760498, -4.55839729309082, -4.241512298583984, -3.9246275424957275, -3.6077427864074707, -3.290858030319214, -2.973973274230957, -2.6570885181427, -2.3402037620544434, -2.0233190059661865, -1.7064342498779297, -1.3895494937896729, -1.072664737701416, -0.7557799816131592, -0.43889522552490234, -0.12201046943664551, 0.19487428665161133, 0.5117590427398682, 0.828643798828125, 1.1455285549163818, 1.4624133110046387, 1.7792980670928955, 2.0961828231811523, 2.413067579269409, 2.729952335357666, 3.046837091445923, 3.3637218475341797, 3.6806066036224365, 3.9974913597106934, 4.314375877380371, 4.631260871887207, 4.948145866394043, 5.265030384063721, 5.581914901733398, 5.898799896240234, 6.21568489074707, 6.532569408416748, 6.849453926086426, 7.166338920593262, 7.483223915100098, 7.800108432769775, 8.116992950439453, 8.433877944946289, 8.750762939453125, 9.067647933959961, 9.38453197479248, 9.701416969299316, 10.018301963806152, 10.335186004638672, 10.652070999145508, 10.968955993652344, 11.28584098815918, 11.602725982666016, 11.919610023498535, 12.236495018005371, 12.553380012512207, 12.870264053344727, 13.187149047851562, 13.504034042358398]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 1.0, 3.0, 4.0, 9.0, 14.0, 12.0, 6.0, 12.0, 12.0, 23.0, 17.0, 26.0, 19.0, 28.0, 30.0, 17.0, 30.0, 31.0, 35.0, 46.0, 36.0, 42.0, 41.0, 45.0, 40.0, 49.0, 36.0, 36.0, 52.0, 30.0, 32.0, 31.0, 19.0, 26.0, 22.0, 14.0, 13.0, 7.0, 8.0, 10.0, 4.0, 8.0, 7.0, 0.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.8131330013275146, -2.725132942199707, -2.6371331214904785, -2.549133062362671, -2.4611330032348633, -2.3731329441070557, -2.285132884979248, -2.1971330642700195, -2.109133005142212, -2.0211329460144043, -1.9331330060958862, -1.8451330661773682, -1.7571330070495605, -1.669132947921753, -1.5811330080032349, -1.4931330680847168, -1.4051330089569092, -1.3171329498291016, -1.2291330099105835, -1.1411330699920654, -1.0531330108642578, -0.965133011341095, -0.8771330118179321, -0.7891330122947693, -0.7011330127716064, -0.6131330132484436, -0.5251330137252808, -0.4371330142021179, -0.3491330146789551, -0.26113301515579224, -0.1731330156326294, -0.08513301610946655, 0.002866983413696289, 0.09086698293685913, 0.17886698246002197, 0.2668669819831848, 0.35486698150634766, 0.4428669810295105, 0.5308669805526733, 0.6188669800758362, 0.706866979598999, 0.7948669791221619, 0.8828669786453247, 0.9708669781684875, 1.0588669776916504, 1.146867036819458, 1.234866976737976, 1.3228669166564941, 1.4108669757843018, 1.4988670349121094, 1.5868669748306274, 1.6748669147491455, 1.7628669738769531, 1.8508670330047607, 1.9388669729232788, 2.026866912841797, 2.1148669719696045, 2.202867031097412, 2.2908668518066406, 2.3788669109344482, 2.466866970062256, 2.5548670291900635, 2.642867088317871, 2.7308669090270996, 2.8188669681549072]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 5.0, 8.0, 19.0, 23.0, 26.0, 14.0, 24.0, 23.0, 24.0, 32.0, 35.0, 35.0, 36.0, 37.0, 37.0, 42.0, 27.0, 37.0, 31.0, 47.0, 51.0, 30.0, 33.0, 35.0, 32.0, 32.0, 26.0, 25.0, 19.0, 25.0, 24.0, 15.0, 13.0, 16.0, 10.0, 9.0, 8.0, 8.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.755859375, -3.644378662109375, -3.53289794921875, -3.421417236328125, -3.3099365234375, -3.198455810546875, -3.08697509765625, -2.975494384765625, -2.864013671875, -2.752532958984375, -2.64105224609375, -2.529571533203125, -2.4180908203125, -2.306610107421875, -2.19512939453125, -2.083648681640625, -1.97216796875, -1.860687255859375, -1.74920654296875, -1.637725830078125, -1.5262451171875, -1.414764404296875, -1.30328369140625, -1.191802978515625, -1.080322265625, -0.968841552734375, -0.85736083984375, -0.745880126953125, -0.6343994140625, -0.522918701171875, -0.41143798828125, -0.299957275390625, -0.1884765625, -0.076995849609375, 0.03448486328125, 0.145965576171875, 0.2574462890625, 0.368927001953125, 0.48040771484375, 0.591888427734375, 0.703369140625, 0.814849853515625, 0.92633056640625, 1.037811279296875, 1.1492919921875, 1.260772705078125, 1.37225341796875, 1.483734130859375, 1.59521484375, 1.706695556640625, 1.81817626953125, 1.929656982421875, 2.0411376953125, 2.152618408203125, 2.26409912109375, 2.375579833984375, 2.487060546875, 2.598541259765625, 2.71002197265625, 2.821502685546875, 2.9329833984375, 3.044464111328125, 3.15594482421875, 3.267425537109375, 3.37890625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 4.0, 13.0, 13.0, 19.0, 38.0, 43.0, 58.0, 112.0, 131.0, 200.0, 329.0, 501.0, 799.0, 1333.0, 2184.0, 3786.0, 6975.0, 13840.0, 31567.0, 87131.0, 346887.0, 390518.0, 96194.0, 33619.0, 14699.0, 7510.0, 3994.0, 2297.0, 1391.0, 826.0, 505.0, 332.0, 226.0, 147.0, 95.0, 65.0, 56.0, 32.0, 29.0, 11.0, 16.0, 9.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71484375, -7.47406005859375, -7.2332763671875, -6.99249267578125, -6.751708984375, -6.51092529296875, -6.2701416015625, -6.02935791015625, -5.78857421875, -5.54779052734375, -5.3070068359375, -5.06622314453125, -4.825439453125, -4.58465576171875, -4.3438720703125, -4.10308837890625, -3.8623046875, -3.62152099609375, -3.3807373046875, -3.13995361328125, -2.899169921875, -2.65838623046875, -2.4176025390625, -2.17681884765625, -1.93603515625, -1.69525146484375, -1.4544677734375, -1.21368408203125, -0.972900390625, -0.73211669921875, -0.4913330078125, -0.25054931640625, -0.009765625, 0.23101806640625, 0.4718017578125, 0.71258544921875, 0.953369140625, 1.19415283203125, 1.4349365234375, 1.67572021484375, 1.91650390625, 2.15728759765625, 2.3980712890625, 2.63885498046875, 2.879638671875, 3.12042236328125, 3.3612060546875, 3.60198974609375, 3.8427734375, 4.08355712890625, 4.3243408203125, 4.56512451171875, 4.805908203125, 5.04669189453125, 5.2874755859375, 5.52825927734375, 5.76904296875, 6.00982666015625, 6.2506103515625, 6.49139404296875, 6.732177734375, 6.97296142578125, 7.2137451171875, 7.45452880859375, 7.6953125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 2.0, 11.0, 7.0, 8.0, 11.0, 15.0, 11.0, 13.0, 24.0, 21.0, 21.0, 32.0, 43.0, 41.0, 44.0, 51.0, 54.0, 109.0, 211.0, 1336.0, 314.0, 184.0, 101.0, 54.0, 46.0, 21.0, 39.0, 23.0, 22.0, 22.0, 22.0, 25.0, 30.0, 12.0, 12.0, 12.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.3406982421875, -12.923583984375, -12.5064697265625, -12.08935546875, -11.6722412109375, -11.255126953125, -10.8380126953125, -10.4208984375, -10.0037841796875, -9.586669921875, -9.1695556640625, -8.75244140625, -8.3353271484375, -7.918212890625, -7.5010986328125, -7.083984375, -6.6668701171875, -6.249755859375, -5.8326416015625, -5.41552734375, -4.9984130859375, -4.581298828125, -4.1641845703125, -3.7470703125, -3.3299560546875, -2.912841796875, -2.4957275390625, -2.07861328125, -1.6614990234375, -1.244384765625, -0.8272705078125, -0.41015625, 0.0069580078125, 0.424072265625, 0.8411865234375, 1.25830078125, 1.6754150390625, 2.092529296875, 2.5096435546875, 2.9267578125, 3.3438720703125, 3.760986328125, 4.1781005859375, 4.59521484375, 5.0123291015625, 5.429443359375, 5.8465576171875, 6.263671875, 6.6807861328125, 7.097900390625, 7.5150146484375, 7.93212890625, 8.3492431640625, 8.766357421875, 9.1834716796875, 9.6005859375, 10.0177001953125, 10.434814453125, 10.8519287109375, 11.26904296875, 11.6861572265625, 12.103271484375, 12.5203857421875, 12.9375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 4.0, 4.0, 5.0, 4.0, 13.0, 11.0, 19.0, 28.0, 30.0, 58.0, 75.0, 93.0, 187.0, 368.0, 976.0, 4430.0, 51421.0, 2969491.0, 109976.0, 6125.0, 1336.0, 432.0, 232.0, 118.0, 76.0, 55.0, 31.0, 23.0, 21.0, 13.0, 12.0, 12.0, 9.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.193359375, -34.04296875, -32.892578125, -31.7421875, -30.591796875, -29.44140625, -28.291015625, -27.140625, -25.990234375, -24.83984375, -23.689453125, -22.5390625, -21.388671875, -20.23828125, -19.087890625, -17.9375, -16.787109375, -15.63671875, -14.486328125, -13.3359375, -12.185546875, -11.03515625, -9.884765625, -8.734375, -7.583984375, -6.43359375, -5.283203125, -4.1328125, -2.982421875, -1.83203125, -0.681640625, 0.46875, 1.619140625, 2.76953125, 3.919921875, 5.0703125, 6.220703125, 7.37109375, 8.521484375, 9.671875, 10.822265625, 11.97265625, 13.123046875, 14.2734375, 15.423828125, 16.57421875, 17.724609375, 18.875, 20.025390625, 21.17578125, 22.326171875, 23.4765625, 24.626953125, 25.77734375, 26.927734375, 28.078125, 29.228515625, 30.37890625, 31.529296875, 32.6796875, 33.830078125, 34.98046875, 36.130859375, 37.28125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [10.0, 844.0, 164.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.191394805908203, -10.436698913574219, 3.3179969787597656, 17.07269287109375, 30.827388763427734, 44.582088470458984, 58.3367805480957, 72.09147644042969, 85.84617614746094, 99.60087585449219, 113.3555679321289, 127.11026000976562, 140.86495971679688, 154.61965942382812, 168.37435913085938, 182.12904357910156, 195.8837432861328, 209.63844299316406, 223.39312744140625, 237.1478271484375, 250.90252685546875, 264.6572265625, 278.41192626953125, 292.1666259765625, 305.9212951660156, 319.6759948730469, 333.4306945800781, 347.1853942871094, 360.9400634765625, 374.69476318359375, 388.449462890625, 402.20416259765625, 415.9588623046875, 429.71356201171875, 443.46826171875, 457.22296142578125, 470.9776611328125, 484.73236083984375, 498.4870300292969, 512.24169921875, 525.9964599609375, 539.7511596679688, 553.505859375, 567.2605590820312, 581.0152587890625, 594.7699584960938, 608.524658203125, 622.279296875, 636.0339965820312, 649.7886962890625, 663.5433959960938, 677.298095703125, 691.0527954101562, 704.8074951171875, 718.5621948242188, 732.31689453125, 746.071533203125, 759.8262329101562, 773.5809326171875, 787.3356323242188, 801.09033203125, 814.8450317382812, 828.5997314453125, 842.3543701171875, 856.109130859375]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 9.0, 12.0, 6.0, 9.0, 12.0, 26.0, 13.0, 18.0, 20.0, 23.0, 24.0, 18.0, 20.0, 31.0, 24.0, 41.0, 33.0, 31.0, 36.0, 39.0, 40.0, 45.0, 35.0, 31.0, 35.0, 33.0, 37.0, 36.0, 22.0, 29.0, 22.0, 21.0, 17.0, 24.0, 23.0, 15.0, 12.0, 16.0, 13.0, 9.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.055152893066406, -34.95722961425781, -33.85930633544922, -32.761383056640625, -31.663461685180664, -30.56553840637207, -29.46761703491211, -28.369693756103516, -27.271770477294922, -26.173847198486328, -25.075923919677734, -23.978002548217773, -22.88007926940918, -21.782155990600586, -20.684234619140625, -19.58631134033203, -18.488388061523438, -17.390464782714844, -16.29254150390625, -15.194620132446289, -14.096696853637695, -12.998773574829102, -11.900851249694824, -10.802928924560547, -9.705005645751953, -8.60708236694336, -7.509160041809082, -6.4112372398376465, -5.313314437866211, -4.215391635894775, -3.11746883392334, -2.0195460319519043, -0.9216232299804688, 0.1762995719909668, 1.2742223739624023, 2.372145175933838, 3.4700679779052734, 4.567990779876709, 5.6659135818481445, 6.76383638381958, 7.861759185791016, 8.95968246459961, 10.057604789733887, 11.155527114868164, 12.253450393676758, 13.351373672485352, 14.449295997619629, 15.547218322753906, 16.6451416015625, 17.743064880371094, 18.840988159179688, 19.93890953063965, 21.036832809448242, 22.134756088256836, 23.232677459716797, 24.33060073852539, 25.428524017333984, 26.526447296142578, 27.624370574951172, 28.722291946411133, 29.820215225219727, 30.91813850402832, 32.01605987548828, 33.113983154296875, 34.21190643310547]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 3.0, 7.0, 12.0, 8.0, 13.0, 11.0, 18.0, 17.0, 18.0, 32.0, 32.0, 23.0, 31.0, 39.0, 40.0, 41.0, 49.0, 39.0, 39.0, 33.0, 34.0, 41.0, 36.0, 38.0, 32.0, 39.0, 26.0, 36.0, 26.0, 30.0, 17.0, 15.0, 15.0, 19.0, 15.0, 16.0, 10.0, 11.0, 9.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.42498779296875, -3.3070068359375, -3.18902587890625, -3.071044921875, -2.95306396484375, -2.8350830078125, -2.71710205078125, -2.59912109375, -2.48114013671875, -2.3631591796875, -2.24517822265625, -2.127197265625, -2.00921630859375, -1.8912353515625, -1.77325439453125, -1.6552734375, -1.53729248046875, -1.4193115234375, -1.30133056640625, -1.183349609375, -1.06536865234375, -0.9473876953125, -0.82940673828125, -0.71142578125, -0.59344482421875, -0.4754638671875, -0.35748291015625, -0.239501953125, -0.12152099609375, -0.0035400390625, 0.11444091796875, 0.232421875, 0.35040283203125, 0.4683837890625, 0.58636474609375, 0.704345703125, 0.82232666015625, 0.9403076171875, 1.05828857421875, 1.17626953125, 1.29425048828125, 1.4122314453125, 1.53021240234375, 1.648193359375, 1.76617431640625, 1.8841552734375, 2.00213623046875, 2.1201171875, 2.23809814453125, 2.3560791015625, 2.47406005859375, 2.592041015625, 2.71002197265625, 2.8280029296875, 2.94598388671875, 3.06396484375, 3.18194580078125, 3.2999267578125, 3.41790771484375, 3.535888671875, 3.65386962890625, 3.7718505859375, 3.88983154296875, 4.0078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 10.0, 8.0, 17.0, 26.0, 32.0, 47.0, 65.0, 94.0, 124.0, 216.0, 294.0, 410.0, 646.0, 933.0, 1596.0, 2452.0, 3968.0, 6614.0, 11838.0, 21578.0, 44323.0, 106420.0, 353816.0, 1213042.0, 1603593.0, 550774.0, 151564.0, 57210.0, 27234.0, 14389.0, 8052.0, 4795.0, 2988.0, 1784.0, 1124.0, 755.0, 487.0, 343.0, 220.0, 141.0, 88.0, 60.0, 45.0, 32.0, 17.0, 5.0, 4.0, 10.0, 6.0, 1.0, 3.0, 2.0], "bins": [-6.35546875, -6.17974853515625, -6.0040283203125, -5.82830810546875, -5.652587890625, -5.47686767578125, -5.3011474609375, -5.12542724609375, -4.94970703125, -4.77398681640625, -4.5982666015625, -4.42254638671875, -4.246826171875, -4.07110595703125, -3.8953857421875, -3.71966552734375, -3.5439453125, -3.36822509765625, -3.1925048828125, -3.01678466796875, -2.841064453125, -2.66534423828125, -2.4896240234375, -2.31390380859375, -2.13818359375, -1.96246337890625, -1.7867431640625, -1.61102294921875, -1.435302734375, -1.25958251953125, -1.0838623046875, -0.90814208984375, -0.732421875, -0.55670166015625, -0.3809814453125, -0.20526123046875, -0.029541015625, 0.14617919921875, 0.3218994140625, 0.49761962890625, 0.67333984375, 0.84906005859375, 1.0247802734375, 1.20050048828125, 1.376220703125, 1.55194091796875, 1.7276611328125, 1.90338134765625, 2.0791015625, 2.25482177734375, 2.4305419921875, 2.60626220703125, 2.781982421875, 2.95770263671875, 3.1334228515625, 3.30914306640625, 3.48486328125, 3.66058349609375, 3.8363037109375, 4.01202392578125, 4.187744140625, 4.36346435546875, 4.5391845703125, 4.71490478515625, 4.890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 15.0, 19.0, 15.0, 29.0, 35.0, 34.0, 81.0, 82.0, 128.0, 187.0, 257.0, 363.0, 505.0, 594.0, 502.0, 337.0, 263.0, 164.0, 134.0, 79.0, 58.0, 43.0, 32.0, 29.0, 17.0, 14.0, 16.0, 7.0, 8.0, 10.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1802978515625, -8.868408203125, -8.5565185546875, -8.24462890625, -7.9327392578125, -7.620849609375, -7.3089599609375, -6.9970703125, -6.6851806640625, -6.373291015625, -6.0614013671875, -5.74951171875, -5.4376220703125, -5.125732421875, -4.8138427734375, -4.501953125, -4.1900634765625, -3.878173828125, -3.5662841796875, -3.25439453125, -2.9425048828125, -2.630615234375, -2.3187255859375, -2.0068359375, -1.6949462890625, -1.383056640625, -1.0711669921875, -0.75927734375, -0.4473876953125, -0.135498046875, 0.1763916015625, 0.48828125, 0.8001708984375, 1.112060546875, 1.4239501953125, 1.73583984375, 2.0477294921875, 2.359619140625, 2.6715087890625, 2.9833984375, 3.2952880859375, 3.607177734375, 3.9190673828125, 4.23095703125, 4.5428466796875, 4.854736328125, 5.1666259765625, 5.478515625, 5.7904052734375, 6.102294921875, 6.4141845703125, 6.72607421875, 7.0379638671875, 7.349853515625, 7.6617431640625, 7.9736328125, 8.2855224609375, 8.597412109375, 8.9093017578125, 9.22119140625, 9.5330810546875, 9.844970703125, 10.1568603515625, 10.46875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 13.0, 18.0, 29.0, 40.0, 53.0, 99.0, 228.0, 459.0, 1104.0, 2957.0, 9101.0, 33749.0, 168387.0, 1501750.0, 2180027.0, 234851.0, 44252.0, 11328.0, 3470.0, 1277.0, 546.0, 233.0, 134.0, 64.0, 39.0, 35.0, 15.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.8494873046875, -16.355224609375, -15.8609619140625, -15.36669921875, -14.8724365234375, -14.378173828125, -13.8839111328125, -13.3896484375, -12.8953857421875, -12.401123046875, -11.9068603515625, -11.41259765625, -10.9183349609375, -10.424072265625, -9.9298095703125, -9.435546875, -8.9412841796875, -8.447021484375, -7.9527587890625, -7.45849609375, -6.9642333984375, -6.469970703125, -5.9757080078125, -5.4814453125, -4.9871826171875, -4.492919921875, -3.9986572265625, -3.50439453125, -3.0101318359375, -2.515869140625, -2.0216064453125, -1.52734375, -1.0330810546875, -0.538818359375, -0.0445556640625, 0.44970703125, 0.9439697265625, 1.438232421875, 1.9324951171875, 2.4267578125, 2.9210205078125, 3.415283203125, 3.9095458984375, 4.40380859375, 4.8980712890625, 5.392333984375, 5.8865966796875, 6.380859375, 6.8751220703125, 7.369384765625, 7.8636474609375, 8.35791015625, 8.8521728515625, 9.346435546875, 9.8406982421875, 10.3349609375, 10.8292236328125, 11.323486328125, 11.8177490234375, 12.31201171875, 12.8062744140625, 13.300537109375, 13.7947998046875, 14.2890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 20.0, 31.0, 46.0, 67.0, 102.0, 121.0, 148.0, 135.0, 113.0, 73.0, 47.0, 39.0, 14.0, 14.0, 13.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.23213958740234, -81.32213592529297, -79.41213989257812, -77.50213623046875, -75.59213256835938, -73.68212890625, -71.77213287353516, -69.86212921142578, -67.9521255493164, -66.04212188720703, -64.13212585449219, -62.22212219238281, -60.31211853027344, -58.40211868286133, -56.49211883544922, -54.582115173339844, -52.672115325927734, -50.762115478515625, -48.85211181640625, -46.94211196899414, -45.032108306884766, -43.122108459472656, -41.21210479736328, -39.30210494995117, -37.39210510253906, -35.48210525512695, -33.57210159301758, -31.66210174560547, -29.752098083496094, -27.842098236083984, -25.932096481323242, -24.0220947265625, -22.11209487915039, -20.20209312438965, -18.292091369628906, -16.382091522216797, -14.472088813781738, -12.562087059020996, -10.65208625793457, -8.742084503173828, -6.832082748413086, -4.922080993652344, -3.0120797157287598, -1.1020784378051758, 0.8079233169555664, 2.7179250717163086, 4.627925872802734, 6.537927627563477, 8.447929382324219, 10.357931137084961, 12.267932891845703, 14.177933692932129, 16.087936401367188, 17.997936248779297, 19.90793800354004, 21.81793975830078, 23.727941513061523, 25.637943267822266, 27.547945022583008, 29.45794677734375, 31.36794662475586, 33.277950286865234, 35.187950134277344, 37.09795379638672, 39.00795364379883]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 6.0, 7.0, 6.0, 8.0, 13.0, 9.0, 16.0, 12.0, 18.0, 20.0, 27.0, 36.0, 41.0, 30.0, 36.0, 34.0, 38.0, 45.0, 47.0, 31.0, 42.0, 34.0, 49.0, 41.0, 26.0, 32.0, 47.0, 34.0, 25.0, 28.0, 25.0, 21.0, 17.0, 8.0, 15.0, 8.0, 9.0, 10.0, 6.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-29.218772888183594, -28.336788177490234, -27.454805374145508, -26.57282066345215, -25.690837860107422, -24.808853149414062, -23.926868438720703, -23.044883728027344, -22.162900924682617, -21.280916213989258, -20.39893341064453, -19.516948699951172, -18.634963989257812, -17.752981185913086, -16.870996475219727, -15.989012718200684, -15.10702896118164, -14.225045204162598, -13.343061447143555, -12.461076736450195, -11.579092979431152, -10.69710922241211, -9.81512451171875, -8.933140754699707, -8.051156997680664, -7.169173240661621, -6.28718900680542, -5.405204772949219, -4.523221015930176, -3.641237258911133, -2.7592530250549316, -1.8772687911987305, -0.9952850341796875, -0.11330103874206543, 0.7686829566955566, 1.6506669521331787, 2.532650947570801, 3.4146347045898438, 4.296618938446045, 5.178603172302246, 6.060586929321289, 6.942570686340332, 7.824554920196533, 8.706539154052734, 9.588522911071777, 10.47050666809082, 11.35249137878418, 12.234475135803223, 13.116458892822266, 13.998442649841309, 14.880426406860352, 15.762411117553711, 16.644393920898438, 17.526378631591797, 18.408363342285156, 19.290348052978516, 20.172330856323242, 21.0543155670166, 21.936298370361328, 22.818283081054688, 23.700267791748047, 24.582250595092773, 25.464235305786133, 26.34621810913086, 27.22820281982422]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 11.0, 6.0, 16.0, 17.0, 26.0, 22.0, 32.0, 24.0, 35.0, 36.0, 31.0, 40.0, 43.0, 49.0, 43.0, 40.0, 45.0, 40.0, 38.0, 32.0, 40.0, 31.0, 37.0, 32.0, 28.0, 23.0, 22.0, 19.0, 21.0, 15.0, 21.0, 13.0, 13.0, 7.0, 19.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-4.58203125, -4.459686279296875, -4.33734130859375, -4.214996337890625, -4.0926513671875, -3.970306396484375, -3.84796142578125, -3.725616455078125, -3.603271484375, -3.480926513671875, -3.35858154296875, -3.236236572265625, -3.1138916015625, -2.991546630859375, -2.86920166015625, -2.746856689453125, -2.62451171875, -2.502166748046875, -2.37982177734375, -2.257476806640625, -2.1351318359375, -2.012786865234375, -1.89044189453125, -1.768096923828125, -1.645751953125, -1.523406982421875, -1.40106201171875, -1.278717041015625, -1.1563720703125, -1.034027099609375, -0.91168212890625, -0.789337158203125, -0.6669921875, -0.544647216796875, -0.42230224609375, -0.299957275390625, -0.1776123046875, -0.055267333984375, 0.06707763671875, 0.189422607421875, 0.311767578125, 0.434112548828125, 0.55645751953125, 0.678802490234375, 0.8011474609375, 0.923492431640625, 1.04583740234375, 1.168182373046875, 1.29052734375, 1.412872314453125, 1.53521728515625, 1.657562255859375, 1.7799072265625, 1.902252197265625, 2.02459716796875, 2.146942138671875, 2.269287109375, 2.391632080078125, 2.51397705078125, 2.636322021484375, 2.7586669921875, 2.881011962890625, 3.00335693359375, 3.125701904296875, 3.248046875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 11.0, 6.0, 37.0, 52.0, 76.0, 159.0, 254.0, 466.0, 895.0, 1861.0, 3893.0, 8538.0, 20036.0, 50275.0, 143163.0, 469982.0, 228804.0, 70961.0, 27782.0, 11487.0, 5029.0, 2348.0, 1114.0, 592.0, 343.0, 159.0, 103.0, 63.0, 28.0, 13.0, 12.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.759521484375, -3.62841796875, -3.497314453125, -3.3662109375, -3.235107421875, -3.10400390625, -2.972900390625, -2.841796875, -2.710693359375, -2.57958984375, -2.448486328125, -2.3173828125, -2.186279296875, -2.05517578125, -1.924072265625, -1.79296875, -1.661865234375, -1.53076171875, -1.399658203125, -1.2685546875, -1.137451171875, -1.00634765625, -0.875244140625, -0.744140625, -0.613037109375, -0.48193359375, -0.350830078125, -0.2197265625, -0.088623046875, 0.04248046875, 0.173583984375, 0.3046875, 0.435791015625, 0.56689453125, 0.697998046875, 0.8291015625, 0.960205078125, 1.09130859375, 1.222412109375, 1.353515625, 1.484619140625, 1.61572265625, 1.746826171875, 1.8779296875, 2.009033203125, 2.14013671875, 2.271240234375, 2.40234375, 2.533447265625, 2.66455078125, 2.795654296875, 2.9267578125, 3.057861328125, 3.18896484375, 3.320068359375, 3.451171875, 3.582275390625, 3.71337890625, 3.844482421875, 3.9755859375, 4.106689453125, 4.23779296875, 4.368896484375, 4.5]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 11.0, 9.0, 14.0, 12.0, 14.0, 13.0, 32.0, 30.0, 27.0, 30.0, 32.0, 36.0, 35.0, 36.0, 45.0, 42.0, 49.0, 1056.0, 42.0, 26.0, 40.0, 38.0, 29.0, 28.0, 33.0, 32.0, 29.0, 26.0, 27.0, 16.0, 25.0, 13.0, 16.0, 7.0, 13.0, 10.0, 9.0, 9.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.365234375, -3.268463134765625, -3.17169189453125, -3.074920654296875, -2.9781494140625, -2.881378173828125, -2.78460693359375, -2.687835693359375, -2.591064453125, -2.494293212890625, -2.39752197265625, -2.300750732421875, -2.2039794921875, -2.107208251953125, -2.01043701171875, -1.913665771484375, -1.81689453125, -1.720123291015625, -1.62335205078125, -1.526580810546875, -1.4298095703125, -1.333038330078125, -1.23626708984375, -1.139495849609375, -1.042724609375, -0.945953369140625, -0.84918212890625, -0.752410888671875, -0.6556396484375, -0.558868408203125, -0.46209716796875, -0.365325927734375, -0.2685546875, -0.171783447265625, -0.07501220703125, 0.021759033203125, 0.1185302734375, 0.215301513671875, 0.31207275390625, 0.408843994140625, 0.505615234375, 0.602386474609375, 0.69915771484375, 0.795928955078125, 0.8927001953125, 0.989471435546875, 1.08624267578125, 1.183013916015625, 1.27978515625, 1.376556396484375, 1.47332763671875, 1.570098876953125, 1.6668701171875, 1.763641357421875, 1.86041259765625, 1.957183837890625, 2.053955078125, 2.150726318359375, 2.24749755859375, 2.344268798828125, 2.4410400390625, 2.537811279296875, 2.63458251953125, 2.731353759765625, 2.828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 6.0, 15.0, 7.0, 18.0, 25.0, 32.0, 46.0, 83.0, 90.0, 145.0, 214.0, 307.0, 428.0, 646.0, 1023.0, 1488.0, 2267.0, 3541.0, 5743.0, 9839.0, 17282.0, 33484.0, 73666.0, 213100.0, 1102508.0, 416541.0, 112740.0, 46602.0, 23131.0, 12475.0, 7102.0, 4383.0, 2831.0, 1774.0, 1140.0, 743.0, 492.0, 368.0, 238.0, 157.0, 121.0, 81.0, 53.0, 39.0, 39.0, 20.0, 19.0, 7.0, 13.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0], "bins": [-1.94921875, -1.89141845703125, -1.8336181640625, -1.77581787109375, -1.718017578125, -1.66021728515625, -1.6024169921875, -1.54461669921875, -1.48681640625, -1.42901611328125, -1.3712158203125, -1.31341552734375, -1.255615234375, -1.19781494140625, -1.1400146484375, -1.08221435546875, -1.0244140625, -0.96661376953125, -0.9088134765625, -0.85101318359375, -0.793212890625, -0.73541259765625, -0.6776123046875, -0.61981201171875, -0.56201171875, -0.50421142578125, -0.4464111328125, -0.38861083984375, -0.330810546875, -0.27301025390625, -0.2152099609375, -0.15740966796875, -0.099609375, -0.04180908203125, 0.0159912109375, 0.07379150390625, 0.131591796875, 0.18939208984375, 0.2471923828125, 0.30499267578125, 0.36279296875, 0.42059326171875, 0.4783935546875, 0.53619384765625, 0.593994140625, 0.65179443359375, 0.7095947265625, 0.76739501953125, 0.8251953125, 0.88299560546875, 0.9407958984375, 0.99859619140625, 1.056396484375, 1.11419677734375, 1.1719970703125, 1.22979736328125, 1.28759765625, 1.34539794921875, 1.4031982421875, 1.46099853515625, 1.518798828125, 1.57659912109375, 1.6343994140625, 1.69219970703125, 1.75]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 9.0, 10.0, 14.0, 21.0, 23.0, 43.0, 46.0, 71.0, 112.0, 224.0, 117.0, 69.0, 42.0, 37.0, 29.0, 26.0, 17.0, 12.0, 12.0, 9.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88037109375, -0.85491943359375, -0.8294677734375, -0.80401611328125, -0.778564453125, -0.75311279296875, -0.7276611328125, -0.70220947265625, -0.6767578125, -0.65130615234375, -0.6258544921875, -0.60040283203125, -0.574951171875, -0.54949951171875, -0.5240478515625, -0.49859619140625, -0.47314453125, -0.44769287109375, -0.4222412109375, -0.39678955078125, -0.371337890625, -0.34588623046875, -0.3204345703125, -0.29498291015625, -0.26953125, -0.24407958984375, -0.2186279296875, -0.19317626953125, -0.167724609375, -0.14227294921875, -0.1168212890625, -0.09136962890625, -0.06591796875, -0.04046630859375, -0.0150146484375, 0.01043701171875, 0.035888671875, 0.06134033203125, 0.0867919921875, 0.11224365234375, 0.1376953125, 0.16314697265625, 0.1885986328125, 0.21405029296875, 0.239501953125, 0.26495361328125, 0.2904052734375, 0.31585693359375, 0.34130859375, 0.36676025390625, 0.3922119140625, 0.41766357421875, 0.443115234375, 0.46856689453125, 0.4940185546875, 0.51947021484375, 0.544921875, 0.57037353515625, 0.5958251953125, 0.62127685546875, 0.646728515625, 0.67218017578125, 0.6976318359375, 0.72308349609375, 0.74853515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 9.0, 17.0, 16.0, 18.0, 33.0, 50.0, 71.0, 138.0, 423.0, 5115.0, 942548.0, 97783.0, 1733.0, 262.0, 114.0, 69.0, 35.0, 34.0, 22.0, 14.0, 12.0, 4.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.921875, -14.404296875, -13.88671875, -13.369140625, -12.8515625, -12.333984375, -11.81640625, -11.298828125, -10.78125, -10.263671875, -9.74609375, -9.228515625, -8.7109375, -8.193359375, -7.67578125, -7.158203125, -6.640625, -6.123046875, -5.60546875, -5.087890625, -4.5703125, -4.052734375, -3.53515625, -3.017578125, -2.5, -1.982421875, -1.46484375, -0.947265625, -0.4296875, 0.087890625, 0.60546875, 1.123046875, 1.640625, 2.158203125, 2.67578125, 3.193359375, 3.7109375, 4.228515625, 4.74609375, 5.263671875, 5.78125, 6.298828125, 6.81640625, 7.333984375, 7.8515625, 8.369140625, 8.88671875, 9.404296875, 9.921875, 10.439453125, 10.95703125, 11.474609375, 11.9921875, 12.509765625, 13.02734375, 13.544921875, 14.0625, 14.580078125, 15.09765625, 15.615234375, 16.1328125, 16.650390625, 17.16796875, 17.685546875, 18.203125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 8.0, 22.0, 26.0, 33.0, 69.0, 110.0, 112.0, 127.0, 175.0, 112.0, 86.0, 53.0, 28.0, 18.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.398878574371338, -1.3462492227554321, -1.2936198711395264, -1.2409905195236206, -1.1883611679077148, -1.1357316970825195, -1.0831024646759033, -1.030472993850708, -0.9778436422348022, -0.9252142906188965, -0.8725849390029907, -0.819955587387085, -0.7673261761665344, -0.7146968245506287, -0.6620674729347229, -0.6094380617141724, -0.5568087697029114, -0.5041794180870056, -0.45155003666877747, -0.3989206850528717, -0.34629130363464355, -0.2936619520187378, -0.24103260040283203, -0.18840321898460388, -0.13577386736869812, -0.08314450085163116, -0.030515141785144806, 0.022114217281341553, 0.07474358379840851, 0.12737295031547546, 0.18000230193138123, 0.23263168334960938, 0.28526103496551514, 0.3378903865814209, 0.39051976799964905, 0.4431491196155548, 0.49577850103378296, 0.5484078526496887, 0.6010372042655945, 0.653666615486145, 0.7062959671020508, 0.7589253187179565, 0.8115546703338623, 0.8641840219497681, 0.9168134331703186, 0.9694427847862244, 1.0220720767974854, 1.0747015476226807, 1.1273307800292969, 1.1799601316452026, 1.2325894832611084, 1.2852188348770142, 1.33784818649292, 1.3904776573181152, 1.4431068897247314, 1.4957363605499268, 1.5483657121658325, 1.6009950637817383, 1.653624415397644, 1.7062537670135498, 1.7588831186294556, 1.8115124702453613, 1.8641419410705566, 1.9167712926864624, 1.9694006443023682]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 15.0, 9.0, 8.0, 27.0, 20.0, 18.0, 23.0, 33.0, 25.0, 24.0, 38.0, 38.0, 43.0, 33.0, 54.0, 43.0, 40.0, 46.0, 48.0, 33.0, 32.0, 50.0, 37.0, 39.0, 25.0, 24.0, 26.0, 23.0, 17.0, 12.0, 19.0, 8.0, 6.0, 10.0, 11.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7128490209579468, -0.6916950345039368, -0.6705410480499268, -0.6493870615959167, -0.6282330751419067, -0.607079029083252, -0.5859250426292419, -0.5647710561752319, -0.5436170697212219, -0.5224630832672119, -0.5013090968132019, -0.4801550805568695, -0.4590010941028595, -0.4378471076488495, -0.4166930913925171, -0.3955391049385071, -0.37438511848449707, -0.35323113203048706, -0.33207714557647705, -0.31092312932014465, -0.28976914286613464, -0.26861515641212463, -0.24746115505695343, -0.22630715370178223, -0.20515316724777222, -0.1839991807937622, -0.162845179438591, -0.1416911780834198, -0.12053719162940979, -0.09938319772481918, -0.07822920382022858, -0.05707520246505737, -0.03592115640640259, -0.014767162501811981, 0.0063868314027786255, 0.027540825307369232, 0.04869481921195984, 0.06984881311655045, 0.09100280702114105, 0.11215680837631226, 0.13331079483032227, 0.15446478128433228, 0.17561878263950348, 0.19677278399467468, 0.2179267704486847, 0.2390807569026947, 0.2602347731590271, 0.2813887596130371, 0.3025427460670471, 0.32369673252105713, 0.34485071897506714, 0.36600473523139954, 0.38715872168540955, 0.40831270813941956, 0.42946672439575195, 0.45062071084976196, 0.471774697303772, 0.492928683757782, 0.514082670211792, 0.535236656665802, 0.556390643119812, 0.5775446891784668, 0.5986986756324768, 0.6198526620864868, 0.6410066485404968]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 6.0, 11.0, 15.0, 22.0, 18.0, 19.0, 24.0, 26.0, 32.0, 35.0, 39.0, 29.0, 44.0, 41.0, 38.0, 32.0, 43.0, 47.0, 35.0, 30.0, 37.0, 35.0, 29.0, 30.0, 25.0, 27.0, 27.0, 26.0, 15.0, 15.0, 15.0, 18.0, 8.0, 19.0, 8.0, 13.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.71875, -3.608367919921875, -3.49798583984375, -3.387603759765625, -3.2772216796875, -3.166839599609375, -3.05645751953125, -2.946075439453125, -2.835693359375, -2.725311279296875, -2.61492919921875, -2.504547119140625, -2.3941650390625, -2.283782958984375, -2.17340087890625, -2.063018798828125, -1.95263671875, -1.842254638671875, -1.73187255859375, -1.621490478515625, -1.5111083984375, -1.400726318359375, -1.29034423828125, -1.179962158203125, -1.069580078125, -0.959197998046875, -0.84881591796875, -0.738433837890625, -0.6280517578125, -0.517669677734375, -0.40728759765625, -0.296905517578125, -0.1865234375, -0.076141357421875, 0.03424072265625, 0.144622802734375, 0.2550048828125, 0.365386962890625, 0.47576904296875, 0.586151123046875, 0.696533203125, 0.806915283203125, 0.91729736328125, 1.027679443359375, 1.1380615234375, 1.248443603515625, 1.35882568359375, 1.469207763671875, 1.57958984375, 1.689971923828125, 1.80035400390625, 1.910736083984375, 2.0211181640625, 2.131500244140625, 2.24188232421875, 2.352264404296875, 2.462646484375, 2.573028564453125, 2.68341064453125, 2.793792724609375, 2.9041748046875, 3.014556884765625, 3.12493896484375, 3.235321044921875, 3.345703125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 9.0, 11.0, 12.0, 19.0, 17.0, 28.0, 34.0, 58.0, 95.0, 160.0, 283.0, 442.0, 867.0, 1646.0, 3474.0, 8440.0, 22799.0, 78364.0, 312724.0, 450465.0, 116912.0, 31852.0, 10914.0, 4462.0, 2021.0, 1006.0, 580.0, 299.0, 188.0, 122.0, 71.0, 44.0, 32.0, 25.0, 25.0, 11.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0], "bins": [-11.4296875, -11.1376953125, -10.845703125, -10.5537109375, -10.26171875, -9.9697265625, -9.677734375, -9.3857421875, -9.09375, -8.8017578125, -8.509765625, -8.2177734375, -7.92578125, -7.6337890625, -7.341796875, -7.0498046875, -6.7578125, -6.4658203125, -6.173828125, -5.8818359375, -5.58984375, -5.2978515625, -5.005859375, -4.7138671875, -4.421875, -4.1298828125, -3.837890625, -3.5458984375, -3.25390625, -2.9619140625, -2.669921875, -2.3779296875, -2.0859375, -1.7939453125, -1.501953125, -1.2099609375, -0.91796875, -0.6259765625, -0.333984375, -0.0419921875, 0.25, 0.5419921875, 0.833984375, 1.1259765625, 1.41796875, 1.7099609375, 2.001953125, 2.2939453125, 2.5859375, 2.8779296875, 3.169921875, 3.4619140625, 3.75390625, 4.0458984375, 4.337890625, 4.6298828125, 4.921875, 5.2138671875, 5.505859375, 5.7978515625, 6.08984375, 6.3818359375, 6.673828125, 6.9658203125, 7.2578125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 11.0, 7.0, 14.0, 14.0, 11.0, 17.0, 19.0, 31.0, 42.0, 52.0, 52.0, 58.0, 66.0, 126.0, 194.0, 1418.0, 272.0, 150.0, 94.0, 69.0, 51.0, 50.0, 38.0, 33.0, 28.0, 23.0, 27.0, 14.0, 13.0, 10.0, 6.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.40625, -17.875, -17.34375, -16.8125, -16.28125, -15.75, -15.21875, -14.6875, -14.15625, -13.625, -13.09375, -12.5625, -12.03125, -11.5, -10.96875, -10.4375, -9.90625, -9.375, -8.84375, -8.3125, -7.78125, -7.25, -6.71875, -6.1875, -5.65625, -5.125, -4.59375, -4.0625, -3.53125, -3.0, -2.46875, -1.9375, -1.40625, -0.875, -0.34375, 0.1875, 0.71875, 1.25, 1.78125, 2.3125, 2.84375, 3.375, 3.90625, 4.4375, 4.96875, 5.5, 6.03125, 6.5625, 7.09375, 7.625, 8.15625, 8.6875, 9.21875, 9.75, 10.28125, 10.8125, 11.34375, 11.875, 12.40625, 12.9375, 13.46875, 14.0, 14.53125, 15.0625, 15.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 5.0, 7.0, 9.0, 6.0, 13.0, 19.0, 14.0, 28.0, 44.0, 60.0, 66.0, 117.0, 142.0, 208.0, 451.0, 1237.0, 5697.0, 83733.0, 2889396.0, 153916.0, 7801.0, 1433.0, 513.0, 259.0, 165.0, 96.0, 62.0, 60.0, 45.0, 38.0, 21.0, 8.0, 5.0, 13.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.65625, -33.6240234375, -32.591796875, -31.5595703125, -30.52734375, -29.4951171875, -28.462890625, -27.4306640625, -26.3984375, -25.3662109375, -24.333984375, -23.3017578125, -22.26953125, -21.2373046875, -20.205078125, -19.1728515625, -18.140625, -17.1083984375, -16.076171875, -15.0439453125, -14.01171875, -12.9794921875, -11.947265625, -10.9150390625, -9.8828125, -8.8505859375, -7.818359375, -6.7861328125, -5.75390625, -4.7216796875, -3.689453125, -2.6572265625, -1.625, -0.5927734375, 0.439453125, 1.4716796875, 2.50390625, 3.5361328125, 4.568359375, 5.6005859375, 6.6328125, 7.6650390625, 8.697265625, 9.7294921875, 10.76171875, 11.7939453125, 12.826171875, 13.8583984375, 14.890625, 15.9228515625, 16.955078125, 17.9873046875, 19.01953125, 20.0517578125, 21.083984375, 22.1162109375, 23.1484375, 24.1806640625, 25.212890625, 26.2451171875, 27.27734375, 28.3095703125, 29.341796875, 30.3740234375, 31.40625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 16.0, 698.0, 299.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.95354461669922, -61.44935607910156, -50.94516372680664, -40.44097137451172, -29.936782836914062, -19.432594299316406, -8.928401947021484, 1.5757904052734375, 12.079978942871094, 22.584169387817383, 33.08835983276367, 43.592552185058594, 54.09674072265625, 64.6009292602539, 75.10511779785156, 85.60931396484375, 96.1135025024414, 106.61769104003906, 117.12188720703125, 127.6260757446289, 138.13026428222656, 148.63446044921875, 159.13864135742188, 169.64283752441406, 180.14703369140625, 190.65122985839844, 201.15541076660156, 211.65960693359375, 222.16378784179688, 232.66798400878906, 243.17218017578125, 253.67636108398438, 264.1805419921875, 274.6847229003906, 285.1889343261719, 295.693115234375, 306.1972961425781, 316.70147705078125, 327.2056884765625, 337.7098693847656, 348.21405029296875, 358.7182312011719, 369.2224426269531, 379.72662353515625, 390.2308044433594, 400.7349853515625, 411.23919677734375, 421.7433776855469, 432.2475891113281, 442.75177001953125, 453.2559814453125, 463.7601623535156, 474.26434326171875, 484.7685546875, 495.2727355957031, 505.77691650390625, 516.2811279296875, 526.7853393554688, 537.2894897460938, 547.793701171875, 558.2979125976562, 568.8020629882812, 579.3062744140625, 589.8104858398438, 600.3146362304688]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 10.0, 5.0, 6.0, 12.0, 15.0, 11.0, 20.0, 18.0, 17.0, 28.0, 22.0, 24.0, 26.0, 27.0, 31.0, 37.0, 27.0, 35.0, 32.0, 36.0, 38.0, 46.0, 40.0, 45.0, 42.0, 36.0, 32.0, 30.0, 24.0, 28.0, 19.0, 20.0, 26.0, 21.0, 20.0, 19.0, 14.0, 11.0, 9.0, 3.0, 13.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.680667877197266, -32.60024642944336, -31.51982879638672, -30.439409255981445, -29.358989715576172, -28.278568267822266, -27.198148727416992, -26.11772918701172, -25.037309646606445, -23.956890106201172, -22.8764705657959, -21.796051025390625, -20.71562957763672, -19.635211944580078, -18.554790496826172, -17.4743709564209, -16.393951416015625, -15.313531875610352, -14.233112335205078, -13.152691841125488, -12.072272300720215, -10.991852760314941, -9.911432266235352, -8.831012725830078, -7.750593185424805, -6.670173645019531, -5.5897536277771, -4.509333610534668, -3.4289140701293945, -2.348494529724121, -1.2680745124816895, -0.1876544952392578, 0.89276123046875, 1.9731810092926025, 3.053600788116455, 4.134020805358887, 5.21444034576416, 6.294859886169434, 7.375279903411865, 8.455699920654297, 9.53611946105957, 10.616539001464844, 11.696958541870117, 12.777379035949707, 13.85779857635498, 14.938218116760254, 16.018638610839844, 17.099058151245117, 18.17947769165039, 19.259897232055664, 20.340316772460938, 21.42073631286621, 22.501155853271484, 23.58157730102539, 24.661996841430664, 25.742416381835938, 26.82283592224121, 27.903255462646484, 28.983675003051758, 30.06409454345703, 31.144515991210938, 32.22493362426758, 33.305355072021484, 34.385772705078125, 35.46619415283203]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 10.0, 6.0, 8.0, 6.0, 12.0, 14.0, 17.0, 12.0, 21.0, 25.0, 26.0, 25.0, 37.0, 37.0, 33.0, 33.0, 37.0, 35.0, 37.0, 34.0, 35.0, 58.0, 38.0, 46.0, 44.0, 39.0, 27.0, 31.0, 30.0, 18.0, 24.0, 28.0, 21.0, 16.0, 10.0, 17.0, 12.0, 7.0, 13.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.315887451171875, -4.19036865234375, -4.064849853515625, -3.9393310546875, -3.813812255859375, -3.68829345703125, -3.562774658203125, -3.437255859375, -3.311737060546875, -3.18621826171875, -3.060699462890625, -2.9351806640625, -2.809661865234375, -2.68414306640625, -2.558624267578125, -2.43310546875, -2.307586669921875, -2.18206787109375, -2.056549072265625, -1.9310302734375, -1.805511474609375, -1.67999267578125, -1.554473876953125, -1.428955078125, -1.303436279296875, -1.17791748046875, -1.052398681640625, -0.9268798828125, -0.801361083984375, -0.67584228515625, -0.550323486328125, -0.4248046875, -0.299285888671875, -0.17376708984375, -0.048248291015625, 0.0772705078125, 0.202789306640625, 0.32830810546875, 0.453826904296875, 0.579345703125, 0.704864501953125, 0.83038330078125, 0.955902099609375, 1.0814208984375, 1.206939697265625, 1.33245849609375, 1.457977294921875, 1.58349609375, 1.709014892578125, 1.83453369140625, 1.960052490234375, 2.0855712890625, 2.211090087890625, 2.33660888671875, 2.462127685546875, 2.587646484375, 2.713165283203125, 2.83868408203125, 2.964202880859375, 3.0897216796875, 3.215240478515625, 3.34075927734375, 3.466278076171875, 3.591796875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 11.0, 16.0, 15.0, 24.0, 31.0, 56.0, 86.0, 142.0, 238.0, 437.0, 755.0, 1334.0, 2757.0, 5793.0, 12950.0, 31034.0, 89580.0, 427384.0, 2033335.0, 1272781.0, 218449.0, 58518.0, 21282.0, 9014.0, 4029.0, 2004.0, 932.0, 520.0, 300.0, 164.0, 107.0, 69.0, 34.0, 23.0, 25.0, 13.0, 15.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-8.2734375, -8.0133056640625, -7.753173828125, -7.4930419921875, -7.23291015625, -6.9727783203125, -6.712646484375, -6.4525146484375, -6.1923828125, -5.9322509765625, -5.672119140625, -5.4119873046875, -5.15185546875, -4.8917236328125, -4.631591796875, -4.3714599609375, -4.111328125, -3.8511962890625, -3.591064453125, -3.3309326171875, -3.07080078125, -2.8106689453125, -2.550537109375, -2.2904052734375, -2.0302734375, -1.7701416015625, -1.510009765625, -1.2498779296875, -0.98974609375, -0.7296142578125, -0.469482421875, -0.2093505859375, 0.05078125, 0.3109130859375, 0.571044921875, 0.8311767578125, 1.09130859375, 1.3514404296875, 1.611572265625, 1.8717041015625, 2.1318359375, 2.3919677734375, 2.652099609375, 2.9122314453125, 3.17236328125, 3.4324951171875, 3.692626953125, 3.9527587890625, 4.212890625, 4.4730224609375, 4.733154296875, 4.9932861328125, 5.25341796875, 5.5135498046875, 5.773681640625, 6.0338134765625, 6.2939453125, 6.5540771484375, 6.814208984375, 7.0743408203125, 7.33447265625, 7.5946044921875, 7.854736328125, 8.1148681640625, 8.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 3.0, 16.0, 15.0, 22.0, 35.0, 59.0, 100.0, 153.0, 234.0, 402.0, 633.0, 785.0, 591.0, 374.0, 224.0, 153.0, 101.0, 58.0, 31.0, 38.0, 11.0, 13.0, 12.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -15.10546875, -14.6796875, -14.25390625, -13.828125, -13.40234375, -12.9765625, -12.55078125, -12.125, -11.69921875, -11.2734375, -10.84765625, -10.421875, -9.99609375, -9.5703125, -9.14453125, -8.71875, -8.29296875, -7.8671875, -7.44140625, -7.015625, -6.58984375, -6.1640625, -5.73828125, -5.3125, -4.88671875, -4.4609375, -4.03515625, -3.609375, -3.18359375, -2.7578125, -2.33203125, -1.90625, -1.48046875, -1.0546875, -0.62890625, -0.203125, 0.22265625, 0.6484375, 1.07421875, 1.5, 1.92578125, 2.3515625, 2.77734375, 3.203125, 3.62890625, 4.0546875, 4.48046875, 4.90625, 5.33203125, 5.7578125, 6.18359375, 6.609375, 7.03515625, 7.4609375, 7.88671875, 8.3125, 8.73828125, 9.1640625, 9.58984375, 10.015625, 10.44140625, 10.8671875, 11.29296875, 11.71875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 14.0, 23.0, 30.0, 73.0, 123.0, 211.0, 397.0, 1191.0, 4418.0, 25616.0, 225154.0, 3129929.0, 737552.0, 57745.0, 8574.0, 2025.0, 615.0, 278.0, 127.0, 71.0, 28.0, 31.0, 23.0, 10.0, 7.0, 10.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.774169921875, -16.09521484375, -15.416259765625, -14.7373046875, -14.058349609375, -13.37939453125, -12.700439453125, -12.021484375, -11.342529296875, -10.66357421875, -9.984619140625, -9.3056640625, -8.626708984375, -7.94775390625, -7.268798828125, -6.58984375, -5.910888671875, -5.23193359375, -4.552978515625, -3.8740234375, -3.195068359375, -2.51611328125, -1.837158203125, -1.158203125, -0.479248046875, 0.19970703125, 0.878662109375, 1.5576171875, 2.236572265625, 2.91552734375, 3.594482421875, 4.2734375, 4.952392578125, 5.63134765625, 6.310302734375, 6.9892578125, 7.668212890625, 8.34716796875, 9.026123046875, 9.705078125, 10.384033203125, 11.06298828125, 11.741943359375, 12.4208984375, 13.099853515625, 13.77880859375, 14.457763671875, 15.13671875, 15.815673828125, 16.49462890625, 17.173583984375, 17.8525390625, 18.531494140625, 19.21044921875, 19.889404296875, 20.568359375, 21.247314453125, 21.92626953125, 22.605224609375, 23.2841796875, 23.963134765625, 24.64208984375, 25.321044921875, 26.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 16.0, 18.0, 19.0, 33.0, 61.0, 78.0, 91.0, 139.0, 114.0, 118.0, 89.0, 61.0, 59.0, 29.0, 27.0, 15.0, 10.0, 10.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.85332489013672, -35.21104049682617, -33.568756103515625, -31.926469802856445, -30.2841854095459, -28.64190101623535, -26.999614715576172, -25.357330322265625, -23.715045928955078, -22.07276153564453, -20.430477142333984, -18.788190841674805, -17.145906448364258, -15.503622055053711, -13.861336708068848, -12.219051361083984, -10.576766967773438, -8.93448257446289, -7.292197227478027, -5.649912357330322, -4.007627487182617, -2.3653430938720703, -0.723057746887207, 0.9192276000976562, 2.561511993408203, 4.203796863555908, 5.846081733703613, 7.488366603851318, 9.130651473999023, 10.77293586730957, 12.415221214294434, 14.057506561279297, 15.699790954589844, 17.34207534790039, 18.984359741210938, 20.626646041870117, 22.268930435180664, 23.91121482849121, 25.55350112915039, 27.195785522460938, 28.838069915771484, 30.48035430908203, 32.12263870239258, 33.764923095703125, 35.40721130371094, 37.04949188232422, 38.69178009033203, 40.33406448364258, 41.976348876953125, 43.61863327026367, 45.26091766357422, 46.903202056884766, 48.54548645019531, 50.187774658203125, 51.83005905151367, 53.47234344482422, 55.114627838134766, 56.75691223144531, 58.39919662475586, 60.041481018066406, 61.68376922607422, 63.3260498046875, 64.96833801269531, 66.61062622070312, 68.2529067993164]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 15.0, 13.0, 14.0, 21.0, 24.0, 26.0, 25.0, 32.0, 40.0, 32.0, 54.0, 57.0, 40.0, 53.0, 40.0, 47.0, 30.0, 49.0, 42.0, 39.0, 46.0, 30.0, 32.0, 23.0, 26.0, 18.0, 22.0, 9.0, 12.0, 13.0, 8.0, 8.0, 7.0, 5.0, 6.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.533607482910156, -26.54688262939453, -25.56015968322754, -24.573434829711914, -23.586711883544922, -22.599987030029297, -21.613264083862305, -20.62653923034668, -19.639816284179688, -18.653091430664062, -17.66636848449707, -16.679643630981445, -15.692920684814453, -14.706195831298828, -13.719472885131836, -12.732748031616211, -11.746024131774902, -10.759300231933594, -9.772576332092285, -8.785852432250977, -7.799128532409668, -6.812404155731201, -5.825680255889893, -4.838956356048584, -3.8522324562072754, -2.865508556365967, -1.8787845373153687, -0.8920605182647705, 0.09466338157653809, 1.0813875198364258, 2.0681114196777344, 3.054835319519043, 4.041559219360352, 5.02828311920166, 6.015007019042969, 7.001730918884277, 7.988454818725586, 8.975179672241211, 9.961902618408203, 10.948627471923828, 11.93535041809082, 12.922074317932129, 13.908798217773438, 14.895522117614746, 15.882246017456055, 16.86897087097168, 17.855693817138672, 18.842418670654297, 19.829143524169922, 20.815868377685547, 21.80259132385254, 22.789316177368164, 23.776039123535156, 24.76276397705078, 25.749486923217773, 26.7362117767334, 27.72293472290039, 28.709659576416016, 29.696382522583008, 30.683107376098633, 31.669830322265625, 32.65655517578125, 33.643280029296875, 34.630001068115234, 35.61672592163086]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 1.0, 10.0, 6.0, 3.0, 12.0, 11.0, 15.0, 14.0, 12.0, 18.0, 30.0, 20.0, 33.0, 26.0, 28.0, 31.0, 46.0, 44.0, 40.0, 40.0, 40.0, 38.0, 40.0, 32.0, 48.0, 42.0, 32.0, 33.0, 27.0, 24.0, 26.0, 30.0, 19.0, 27.0, 17.0, 17.0, 18.0, 13.0, 8.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.235137939453125, -3.11285400390625, -2.990570068359375, -2.8682861328125, -2.746002197265625, -2.62371826171875, -2.501434326171875, -2.379150390625, -2.256866455078125, -2.13458251953125, -2.012298583984375, -1.8900146484375, -1.767730712890625, -1.64544677734375, -1.523162841796875, -1.40087890625, -1.278594970703125, -1.15631103515625, -1.034027099609375, -0.9117431640625, -0.789459228515625, -0.66717529296875, -0.544891357421875, -0.422607421875, -0.300323486328125, -0.17803955078125, -0.055755615234375, 0.0665283203125, 0.188812255859375, 0.31109619140625, 0.433380126953125, 0.5556640625, 0.677947998046875, 0.80023193359375, 0.922515869140625, 1.0447998046875, 1.167083740234375, 1.28936767578125, 1.411651611328125, 1.533935546875, 1.656219482421875, 1.77850341796875, 1.900787353515625, 2.0230712890625, 2.145355224609375, 2.26763916015625, 2.389923095703125, 2.51220703125, 2.634490966796875, 2.75677490234375, 2.879058837890625, 3.0013427734375, 3.123626708984375, 3.24591064453125, 3.368194580078125, 3.490478515625, 3.612762451171875, 3.73504638671875, 3.857330322265625, 3.9796142578125, 4.101898193359375, 4.22418212890625, 4.346466064453125, 4.46875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 12.0, 12.0, 22.0, 35.0, 59.0, 89.0, 140.0, 230.0, 380.0, 550.0, 940.0, 1495.0, 2645.0, 4556.0, 7882.0, 14027.0, 26038.0, 50042.0, 114349.0, 397375.0, 259068.0, 81167.0, 39506.0, 20890.0, 11457.0, 6374.0, 3691.0, 2174.0, 1293.0, 788.0, 443.0, 301.0, 191.0, 114.0, 79.0, 45.0, 31.0, 24.0, 15.0, 10.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6328125, -3.522125244140625, -3.41143798828125, -3.300750732421875, -3.1900634765625, -3.079376220703125, -2.96868896484375, -2.858001708984375, -2.747314453125, -2.636627197265625, -2.52593994140625, -2.415252685546875, -2.3045654296875, -2.193878173828125, -2.08319091796875, -1.972503662109375, -1.86181640625, -1.751129150390625, -1.64044189453125, -1.529754638671875, -1.4190673828125, -1.308380126953125, -1.19769287109375, -1.087005615234375, -0.976318359375, -0.865631103515625, -0.75494384765625, -0.644256591796875, -0.5335693359375, -0.422882080078125, -0.31219482421875, -0.201507568359375, -0.0908203125, 0.019866943359375, 0.13055419921875, 0.241241455078125, 0.3519287109375, 0.462615966796875, 0.57330322265625, 0.683990478515625, 0.794677734375, 0.905364990234375, 1.01605224609375, 1.126739501953125, 1.2374267578125, 1.348114013671875, 1.45880126953125, 1.569488525390625, 1.68017578125, 1.790863037109375, 1.90155029296875, 2.012237548828125, 2.1229248046875, 2.233612060546875, 2.34429931640625, 2.454986572265625, 2.565673828125, 2.676361083984375, 2.78704833984375, 2.897735595703125, 3.0084228515625, 3.119110107421875, 3.22979736328125, 3.340484619140625, 3.451171875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 5.0, 4.0, 9.0, 12.0, 10.0, 18.0, 18.0, 16.0, 16.0, 20.0, 16.0, 24.0, 21.0, 36.0, 39.0, 39.0, 42.0, 34.0, 36.0, 39.0, 1055.0, 38.0, 29.0, 40.0, 38.0, 47.0, 36.0, 31.0, 26.0, 31.0, 21.0, 21.0, 30.0, 21.0, 23.0, 9.0, 13.0, 14.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.05859375, -2.957611083984375, -2.85662841796875, -2.755645751953125, -2.6546630859375, -2.553680419921875, -2.45269775390625, -2.351715087890625, -2.250732421875, -2.149749755859375, -2.04876708984375, -1.947784423828125, -1.8468017578125, -1.745819091796875, -1.64483642578125, -1.543853759765625, -1.44287109375, -1.341888427734375, -1.24090576171875, -1.139923095703125, -1.0389404296875, -0.937957763671875, -0.83697509765625, -0.735992431640625, -0.635009765625, -0.534027099609375, -0.43304443359375, -0.332061767578125, -0.2310791015625, -0.130096435546875, -0.02911376953125, 0.071868896484375, 0.1728515625, 0.273834228515625, 0.37481689453125, 0.475799560546875, 0.5767822265625, 0.677764892578125, 0.77874755859375, 0.879730224609375, 0.980712890625, 1.081695556640625, 1.18267822265625, 1.283660888671875, 1.3846435546875, 1.485626220703125, 1.58660888671875, 1.687591552734375, 1.78857421875, 1.889556884765625, 1.99053955078125, 2.091522216796875, 2.1925048828125, 2.293487548828125, 2.39447021484375, 2.495452880859375, 2.596435546875, 2.697418212890625, 2.79840087890625, 2.899383544921875, 3.0003662109375, 3.101348876953125, 3.20233154296875, 3.303314208984375, 3.404296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 9.0, 17.0, 16.0, 24.0, 39.0, 57.0, 113.0, 143.0, 254.0, 396.0, 646.0, 971.0, 1719.0, 2948.0, 5207.0, 9077.0, 17443.0, 35505.0, 85089.0, 340072.0, 1270995.0, 201674.0, 63582.0, 28435.0, 14295.0, 7571.0, 4380.0, 2479.0, 1544.0, 879.0, 544.0, 349.0, 220.0, 149.0, 103.0, 49.0, 42.0, 30.0, 22.0, 7.0, 11.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.35546875, -2.28265380859375, -2.2098388671875, -2.13702392578125, -2.064208984375, -1.99139404296875, -1.9185791015625, -1.84576416015625, -1.77294921875, -1.70013427734375, -1.6273193359375, -1.55450439453125, -1.481689453125, -1.40887451171875, -1.3360595703125, -1.26324462890625, -1.1904296875, -1.11761474609375, -1.0447998046875, -0.97198486328125, -0.899169921875, -0.82635498046875, -0.7535400390625, -0.68072509765625, -0.60791015625, -0.53509521484375, -0.4622802734375, -0.38946533203125, -0.316650390625, -0.24383544921875, -0.1710205078125, -0.09820556640625, -0.025390625, 0.04742431640625, 0.1202392578125, 0.19305419921875, 0.265869140625, 0.33868408203125, 0.4114990234375, 0.48431396484375, 0.55712890625, 0.62994384765625, 0.7027587890625, 0.77557373046875, 0.848388671875, 0.92120361328125, 0.9940185546875, 1.06683349609375, 1.1396484375, 1.21246337890625, 1.2852783203125, 1.35809326171875, 1.430908203125, 1.50372314453125, 1.5765380859375, 1.64935302734375, 1.72216796875, 1.79498291015625, 1.8677978515625, 1.94061279296875, 2.013427734375, 2.08624267578125, 2.1590576171875, 2.23187255859375, 2.3046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 8.0, 14.0, 10.0, 19.0, 19.0, 32.0, 31.0, 44.0, 56.0, 98.0, 121.0, 132.0, 110.0, 68.0, 34.0, 36.0, 35.0, 25.0, 18.0, 25.0, 13.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.505859375, -0.48789215087890625, -0.4699249267578125, -0.45195770263671875, -0.433990478515625, -0.41602325439453125, -0.3980560302734375, -0.38008880615234375, -0.36212158203125, -0.34415435791015625, -0.3261871337890625, -0.30821990966796875, -0.290252685546875, -0.27228546142578125, -0.2543182373046875, -0.23635101318359375, -0.2183837890625, -0.20041656494140625, -0.1824493408203125, -0.16448211669921875, -0.146514892578125, -0.12854766845703125, -0.1105804443359375, -0.09261322021484375, -0.07464599609375, -0.05667877197265625, -0.0387115478515625, -0.02074432373046875, -0.002777099609375, 0.01519012451171875, 0.0331573486328125, 0.05112457275390625, 0.069091796875, 0.08705902099609375, 0.1050262451171875, 0.12299346923828125, 0.140960693359375, 0.15892791748046875, 0.1768951416015625, 0.19486236572265625, 0.21282958984375, 0.23079681396484375, 0.2487640380859375, 0.26673126220703125, 0.284698486328125, 0.30266571044921875, 0.3206329345703125, 0.33860015869140625, 0.3565673828125, 0.37453460693359375, 0.3925018310546875, 0.41046905517578125, 0.428436279296875, 0.44640350341796875, 0.4643707275390625, 0.48233795166015625, 0.50030517578125, 0.5182723999023438, 0.5362396240234375, 0.5542068481445312, 0.572174072265625, 0.5901412963867188, 0.6081085205078125, 0.6260757446289062, 0.64404296875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 14.0, 15.0, 16.0, 26.0, 27.0, 48.0, 57.0, 86.0, 139.0, 326.0, 2150.0, 81246.0, 948727.0, 14263.0, 704.0, 236.0, 141.0, 82.0, 48.0, 39.0, 25.0, 24.0, 20.0, 16.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.453125, -10.1568603515625, -9.860595703125, -9.5643310546875, -9.26806640625, -8.9718017578125, -8.675537109375, -8.3792724609375, -8.0830078125, -7.7867431640625, -7.490478515625, -7.1942138671875, -6.89794921875, -6.6016845703125, -6.305419921875, -6.0091552734375, -5.712890625, -5.4166259765625, -5.120361328125, -4.8240966796875, -4.52783203125, -4.2315673828125, -3.935302734375, -3.6390380859375, -3.3427734375, -3.0465087890625, -2.750244140625, -2.4539794921875, -2.15771484375, -1.8614501953125, -1.565185546875, -1.2689208984375, -0.97265625, -0.6763916015625, -0.380126953125, -0.0838623046875, 0.21240234375, 0.5086669921875, 0.804931640625, 1.1011962890625, 1.3974609375, 1.6937255859375, 1.989990234375, 2.2862548828125, 2.58251953125, 2.8787841796875, 3.175048828125, 3.4713134765625, 3.767578125, 4.0638427734375, 4.360107421875, 4.6563720703125, 4.95263671875, 5.2489013671875, 5.545166015625, 5.8414306640625, 6.1376953125, 6.4339599609375, 6.730224609375, 7.0264892578125, 7.32275390625, 7.6190185546875, 7.915283203125, 8.2115478515625, 8.5078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 13.0, 31.0, 85.0, 190.0, 299.0, 244.0, 108.0, 35.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5044376850128174, -0.42892199754714966, -0.35340631008148193, -0.2778906226158142, -0.20237493515014648, -0.12685924768447876, -0.051343560218811035, 0.02417212724685669, 0.09968781471252441, 0.17520350217819214, 0.25071918964385986, 0.3262348771095276, 0.4017505645751953, 0.47726625204086304, 0.5527819395065308, 0.6282976269721985, 0.7038133144378662, 0.7793290019035339, 0.8548446893692017, 0.9303603768348694, 1.005876064300537, 1.0813918113708496, 1.1569074392318726, 1.2324230670928955, 1.307938814163208, 1.3834545612335205, 1.4589701890945435, 1.5344858169555664, 1.610001564025879, 1.6855173110961914, 1.7610329389572144, 1.8365485668182373, 1.912064552307129, 1.9875802993774414, 2.063096046447754, 2.1386115550994873, 2.2141273021698, 2.2896430492401123, 2.3651585578918457, 2.440674304962158, 2.5161900520324707, 2.591705799102783, 2.6672215461730957, 2.742737054824829, 2.8182528018951416, 2.893768548965454, 2.9692840576171875, 3.0447998046875, 3.1203155517578125, 3.195831298828125, 3.2713470458984375, 3.346862554550171, 3.4223783016204834, 3.497894048690796, 3.5734095573425293, 3.648925304412842, 3.7244410514831543, 3.799956798553467, 3.8754725456237793, 3.9509880542755127, 4.026503562927246, 4.102019309997559, 4.177535057067871, 4.253050804138184, 4.328566551208496]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 13.0, 15.0, 9.0, 16.0, 10.0, 11.0, 19.0, 22.0, 25.0, 24.0, 36.0, 32.0, 34.0, 39.0, 46.0, 50.0, 42.0, 44.0, 50.0, 47.0, 48.0, 44.0, 41.0, 32.0, 30.0, 29.0, 31.0, 27.0, 23.0, 14.0, 24.0, 12.0, 13.0, 9.0, 13.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6185957193374634, -0.5990802049636841, -0.5795647501945496, -0.5600492358207703, -0.5405337810516357, -0.5210182666778564, -0.5015027523040771, -0.48198726773262024, -0.46247178316116333, -0.4429562985897064, -0.4234408140182495, -0.4039252996444702, -0.3844098150730133, -0.3648943305015564, -0.3453788161277771, -0.3258633315563202, -0.3063478469848633, -0.28683236241340637, -0.26731687784194946, -0.24780136346817017, -0.22828587889671326, -0.20877039432525635, -0.18925489485263824, -0.16973939538002014, -0.15022391080856323, -0.13070842623710632, -0.11119292676448822, -0.09167743474245071, -0.07216194272041321, -0.0526464506983757, -0.033130958676338196, -0.013615459203720093, 0.005900025367736816, 0.025415517389774323, 0.04493100941181183, 0.06444650143384933, 0.08396199345588684, 0.10347748547792435, 0.12299297749996185, 0.14250847697257996, 0.16202396154403687, 0.18153944611549377, 0.20105494558811188, 0.22057044506072998, 0.2400859296321869, 0.2596014142036438, 0.2791169285774231, 0.29863241314888, 0.3181478977203369, 0.3376633822917938, 0.35717886686325073, 0.37669438123703003, 0.39620986580848694, 0.41572535037994385, 0.43524086475372314, 0.45475634932518005, 0.47427183389663696, 0.49378731846809387, 0.5133028030395508, 0.5328183174133301, 0.5523338317871094, 0.5718492865562439, 0.5913648009300232, 0.6108802556991577, 0.630395770072937]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 10.0, 11.0, 12.0, 16.0, 21.0, 15.0, 32.0, 26.0, 29.0, 21.0, 29.0, 36.0, 39.0, 28.0, 43.0, 34.0, 37.0, 40.0, 45.0, 40.0, 32.0, 24.0, 30.0, 31.0, 32.0, 31.0, 24.0, 22.0, 29.0, 18.0, 20.0, 14.0, 24.0, 15.0, 12.0, 12.0, 10.0, 11.0, 5.0, 3.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0], "bins": [-4.0234375, -3.908843994140625, -3.79425048828125, -3.679656982421875, -3.5650634765625, -3.450469970703125, -3.33587646484375, -3.221282958984375, -3.106689453125, -2.992095947265625, -2.87750244140625, -2.762908935546875, -2.6483154296875, -2.533721923828125, -2.41912841796875, -2.304534912109375, -2.18994140625, -2.075347900390625, -1.96075439453125, -1.846160888671875, -1.7315673828125, -1.616973876953125, -1.50238037109375, -1.387786865234375, -1.273193359375, -1.158599853515625, -1.04400634765625, -0.929412841796875, -0.8148193359375, -0.700225830078125, -0.58563232421875, -0.471038818359375, -0.3564453125, -0.241851806640625, -0.12725830078125, -0.012664794921875, 0.1019287109375, 0.216522216796875, 0.33111572265625, 0.445709228515625, 0.560302734375, 0.674896240234375, 0.78948974609375, 0.904083251953125, 1.0186767578125, 1.133270263671875, 1.24786376953125, 1.362457275390625, 1.47705078125, 1.591644287109375, 1.70623779296875, 1.820831298828125, 1.9354248046875, 2.050018310546875, 2.16461181640625, 2.279205322265625, 2.393798828125, 2.508392333984375, 2.62298583984375, 2.737579345703125, 2.8521728515625, 2.966766357421875, 3.08135986328125, 3.195953369140625, 3.310546875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 11.0, 5.0, 22.0, 27.0, 49.0, 50.0, 97.0, 115.0, 203.0, 301.0, 374.0, 565.0, 815.0, 1291.0, 1947.0, 3500.0, 6392.0, 14641.0, 39925.0, 141057.0, 505975.0, 230334.0, 60870.0, 20219.0, 8377.0, 4273.0, 2496.0, 1506.0, 1026.0, 676.0, 421.0, 326.0, 180.0, 138.0, 107.0, 77.0, 44.0, 45.0, 29.0, 16.0, 11.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4921875, -7.23974609375, -6.9873046875, -6.73486328125, -6.482421875, -6.22998046875, -5.9775390625, -5.72509765625, -5.47265625, -5.22021484375, -4.9677734375, -4.71533203125, -4.462890625, -4.21044921875, -3.9580078125, -3.70556640625, -3.453125, -3.20068359375, -2.9482421875, -2.69580078125, -2.443359375, -2.19091796875, -1.9384765625, -1.68603515625, -1.43359375, -1.18115234375, -0.9287109375, -0.67626953125, -0.423828125, -0.17138671875, 0.0810546875, 0.33349609375, 0.5859375, 0.83837890625, 1.0908203125, 1.34326171875, 1.595703125, 1.84814453125, 2.1005859375, 2.35302734375, 2.60546875, 2.85791015625, 3.1103515625, 3.36279296875, 3.615234375, 3.86767578125, 4.1201171875, 4.37255859375, 4.625, 4.87744140625, 5.1298828125, 5.38232421875, 5.634765625, 5.88720703125, 6.1396484375, 6.39208984375, 6.64453125, 6.89697265625, 7.1494140625, 7.40185546875, 7.654296875, 7.90673828125, 8.1591796875, 8.41162109375, 8.6640625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 5.0, 8.0, 9.0, 17.0, 18.0, 10.0, 14.0, 21.0, 38.0, 44.0, 36.0, 29.0, 35.0, 47.0, 72.0, 107.0, 167.0, 322.0, 1379.0, 158.0, 99.0, 73.0, 43.0, 39.0, 46.0, 35.0, 35.0, 30.0, 20.0, 19.0, 14.0, 13.0, 11.0, 9.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.375, -13.9527587890625, -13.530517578125, -13.1082763671875, -12.68603515625, -12.2637939453125, -11.841552734375, -11.4193115234375, -10.9970703125, -10.5748291015625, -10.152587890625, -9.7303466796875, -9.30810546875, -8.8858642578125, -8.463623046875, -8.0413818359375, -7.619140625, -7.1968994140625, -6.774658203125, -6.3524169921875, -5.93017578125, -5.5079345703125, -5.085693359375, -4.6634521484375, -4.2412109375, -3.8189697265625, -3.396728515625, -2.9744873046875, -2.55224609375, -2.1300048828125, -1.707763671875, -1.2855224609375, -0.86328125, -0.4410400390625, -0.018798828125, 0.4034423828125, 0.82568359375, 1.2479248046875, 1.670166015625, 2.0924072265625, 2.5146484375, 2.9368896484375, 3.359130859375, 3.7813720703125, 4.20361328125, 4.6258544921875, 5.048095703125, 5.4703369140625, 5.892578125, 6.3148193359375, 6.737060546875, 7.1593017578125, 7.58154296875, 8.0037841796875, 8.426025390625, 8.8482666015625, 9.2705078125, 9.6927490234375, 10.114990234375, 10.5372314453125, 10.95947265625, 11.3817138671875, 11.803955078125, 12.2261962890625, 12.6484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 9.0, 7.0, 13.0, 14.0, 15.0, 28.0, 32.0, 38.0, 36.0, 70.0, 100.0, 145.0, 172.0, 346.0, 857.0, 2967.0, 16421.0, 523562.0, 2556331.0, 37017.0, 5013.0, 1170.0, 495.0, 262.0, 154.0, 111.0, 77.0, 57.0, 39.0, 35.0, 22.0, 14.0, 13.0, 20.0, 5.0, 4.0, 12.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.9375, -29.034912109375, -28.13232421875, -27.229736328125, -26.3271484375, -25.424560546875, -24.52197265625, -23.619384765625, -22.716796875, -21.814208984375, -20.91162109375, -20.009033203125, -19.1064453125, -18.203857421875, -17.30126953125, -16.398681640625, -15.49609375, -14.593505859375, -13.69091796875, -12.788330078125, -11.8857421875, -10.983154296875, -10.08056640625, -9.177978515625, -8.275390625, -7.372802734375, -6.47021484375, -5.567626953125, -4.6650390625, -3.762451171875, -2.85986328125, -1.957275390625, -1.0546875, -0.152099609375, 0.75048828125, 1.653076171875, 2.5556640625, 3.458251953125, 4.36083984375, 5.263427734375, 6.166015625, 7.068603515625, 7.97119140625, 8.873779296875, 9.7763671875, 10.678955078125, 11.58154296875, 12.484130859375, 13.38671875, 14.289306640625, 15.19189453125, 16.094482421875, 16.9970703125, 17.899658203125, 18.80224609375, 19.704833984375, 20.607421875, 21.510009765625, 22.41259765625, 23.315185546875, 24.2177734375, 25.120361328125, 26.02294921875, 26.925537109375, 27.828125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 6.0, 29.0, 87.0, 200.0, 310.0, 222.0, 103.0, 38.0, 16.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609712600708008, -17.337251663208008, -15.06479263305664, -12.79233169555664, -10.519871711730957, -8.247411727905273, -5.974950790405273, -3.70249080657959, -1.4300308227539062, 0.8424293994903564, 3.114889621734619, 5.387350082397461, 7.6598100662231445, 9.932270050048828, 12.204730987548828, 14.477190971374512, 16.749650955200195, 19.022111892700195, 21.294570922851562, 23.567031860351562, 25.839492797851562, 28.11195182800293, 30.38441276550293, 32.6568717956543, 34.9293327331543, 37.2017936706543, 39.4742546081543, 41.74671173095703, 44.01917266845703, 46.29163360595703, 48.56409454345703, 50.83655548095703, 53.1090087890625, 55.3814697265625, 57.6539306640625, 59.9263916015625, 62.198848724365234, 64.4713134765625, 66.7437744140625, 69.01622772216797, 71.28868865966797, 73.56114959716797, 75.83361053466797, 78.10607147216797, 80.37853240966797, 82.65098571777344, 84.92344665527344, 87.19590759277344, 89.46836853027344, 91.74082946777344, 94.01329040527344, 96.28575134277344, 98.55821228027344, 100.83067321777344, 103.10313415527344, 105.3755874633789, 107.64805603027344, 109.92051696777344, 112.19297790527344, 114.46543884277344, 116.73789978027344, 119.01036071777344, 121.28282165527344, 123.5552749633789, 125.8277359008789]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 7.0, 2.0, 6.0, 5.0, 8.0, 3.0, 11.0, 15.0, 16.0, 9.0, 19.0, 17.0, 32.0, 26.0, 38.0, 36.0, 32.0, 45.0, 41.0, 36.0, 36.0, 59.0, 46.0, 50.0, 39.0, 40.0, 44.0, 30.0, 35.0, 30.0, 23.0, 22.0, 23.0, 22.0, 19.0, 11.0, 7.0, 16.0, 10.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.91774368286133, -37.69913101196289, -36.48051834106445, -35.26190185546875, -34.04328918457031, -32.824676513671875, -31.606063842773438, -30.387451171875, -29.16883659362793, -27.950223922729492, -26.731609344482422, -25.512996673583984, -24.294384002685547, -23.075769424438477, -21.85715675354004, -20.63854217529297, -19.41992950439453, -18.201316833496094, -16.982702255249023, -15.764089584350586, -14.545475959777832, -13.326862335205078, -12.10824966430664, -10.889636039733887, -9.671022415161133, -8.452408790588379, -7.233795642852783, -6.0151824951171875, -4.796568870544434, -3.5779552459716797, -2.359342098236084, -1.1407289505004883, 0.07788467407226562, 1.2964980602264404, 2.5151114463806152, 3.73372483253479, 4.952338218688965, 6.170951843261719, 7.3895649909973145, 8.60817813873291, 9.826791763305664, 11.045405387878418, 12.264019012451172, 13.48263168334961, 14.701245307922363, 15.919858932495117, 17.138471603393555, 18.357086181640625, 19.575698852539062, 20.7943115234375, 22.01292610168457, 23.231538772583008, 24.450153350830078, 25.668766021728516, 26.887378692626953, 28.10599136352539, 29.32460594177246, 30.5432186126709, 31.76183319091797, 32.980445861816406, 34.199058532714844, 35.41767120361328, 36.636287689208984, 37.85490036010742, 39.07351303100586]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 7.0, 9.0, 16.0, 15.0, 15.0, 19.0, 26.0, 16.0, 24.0, 33.0, 28.0, 33.0, 47.0, 33.0, 31.0, 34.0, 43.0, 47.0, 43.0, 39.0, 34.0, 40.0, 31.0, 32.0, 23.0, 31.0, 25.0, 34.0, 27.0, 20.0, 21.0, 13.0, 25.0, 12.0, 15.0, 11.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.95965576171875, -3.8294677734375, -3.69927978515625, -3.569091796875, -3.43890380859375, -3.3087158203125, -3.17852783203125, -3.04833984375, -2.91815185546875, -2.7879638671875, -2.65777587890625, -2.527587890625, -2.39739990234375, -2.2672119140625, -2.13702392578125, -2.0068359375, -1.87664794921875, -1.7464599609375, -1.61627197265625, -1.486083984375, -1.35589599609375, -1.2257080078125, -1.09552001953125, -0.96533203125, -0.83514404296875, -0.7049560546875, -0.57476806640625, -0.444580078125, -0.31439208984375, -0.1842041015625, -0.05401611328125, 0.076171875, 0.20635986328125, 0.3365478515625, 0.46673583984375, 0.596923828125, 0.72711181640625, 0.8572998046875, 0.98748779296875, 1.11767578125, 1.24786376953125, 1.3780517578125, 1.50823974609375, 1.638427734375, 1.76861572265625, 1.8988037109375, 2.02899169921875, 2.1591796875, 2.28936767578125, 2.4195556640625, 2.54974365234375, 2.679931640625, 2.81011962890625, 2.9403076171875, 3.07049560546875, 3.20068359375, 3.33087158203125, 3.4610595703125, 3.59124755859375, 3.721435546875, 3.85162353515625, 3.9818115234375, 4.11199951171875, 4.2421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 9.0, 18.0, 31.0, 26.0, 57.0, 77.0, 88.0, 144.0, 277.0, 467.0, 799.0, 1598.0, 3418.0, 8822.0, 25367.0, 96853.0, 634987.0, 2479138.0, 782498.0, 114512.0, 28432.0, 9454.0, 3631.0, 1657.0, 767.0, 427.0, 280.0, 167.0, 103.0, 60.0, 37.0, 27.0, 17.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.068115234375, -8.76123046875, -8.454345703125, -8.1474609375, -7.840576171875, -7.53369140625, -7.226806640625, -6.919921875, -6.613037109375, -6.30615234375, -5.999267578125, -5.6923828125, -5.385498046875, -5.07861328125, -4.771728515625, -4.46484375, -4.157958984375, -3.85107421875, -3.544189453125, -3.2373046875, -2.930419921875, -2.62353515625, -2.316650390625, -2.009765625, -1.702880859375, -1.39599609375, -1.089111328125, -0.7822265625, -0.475341796875, -0.16845703125, 0.138427734375, 0.4453125, 0.752197265625, 1.05908203125, 1.365966796875, 1.6728515625, 1.979736328125, 2.28662109375, 2.593505859375, 2.900390625, 3.207275390625, 3.51416015625, 3.821044921875, 4.1279296875, 4.434814453125, 4.74169921875, 5.048583984375, 5.35546875, 5.662353515625, 5.96923828125, 6.276123046875, 6.5830078125, 6.889892578125, 7.19677734375, 7.503662109375, 7.810546875, 8.117431640625, 8.42431640625, 8.731201171875, 9.0380859375, 9.344970703125, 9.65185546875, 9.958740234375, 10.265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 5.0, 8.0, 10.0, 14.0, 25.0, 24.0, 27.0, 41.0, 50.0, 72.0, 93.0, 122.0, 152.0, 214.0, 296.0, 418.0, 452.0, 447.0, 396.0, 308.0, 258.0, 141.0, 116.0, 94.0, 64.0, 53.0, 33.0, 30.0, 25.0, 20.0, 16.0, 14.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1650390625, -7.900390625, -7.6357421875, -7.37109375, -7.1064453125, -6.841796875, -6.5771484375, -6.3125, -6.0478515625, -5.783203125, -5.5185546875, -5.25390625, -4.9892578125, -4.724609375, -4.4599609375, -4.1953125, -3.9306640625, -3.666015625, -3.4013671875, -3.13671875, -2.8720703125, -2.607421875, -2.3427734375, -2.078125, -1.8134765625, -1.548828125, -1.2841796875, -1.01953125, -0.7548828125, -0.490234375, -0.2255859375, 0.0390625, 0.3037109375, 0.568359375, 0.8330078125, 1.09765625, 1.3623046875, 1.626953125, 1.8916015625, 2.15625, 2.4208984375, 2.685546875, 2.9501953125, 3.21484375, 3.4794921875, 3.744140625, 4.0087890625, 4.2734375, 4.5380859375, 4.802734375, 5.0673828125, 5.33203125, 5.5966796875, 5.861328125, 6.1259765625, 6.390625, 6.6552734375, 6.919921875, 7.1845703125, 7.44921875, 7.7138671875, 7.978515625, 8.2431640625, 8.5078125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 13.0, 8.0, 18.0, 28.0, 57.0, 54.0, 90.0, 126.0, 218.0, 609.0, 2207.0, 15530.0, 253973.0, 3596171.0, 303947.0, 17626.0, 2386.0, 562.0, 246.0, 132.0, 78.0, 57.0, 38.0, 27.0, 24.0, 15.0, 11.0, 2.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.193603515625, -24.34033203125, -23.487060546875, -22.6337890625, -21.780517578125, -20.92724609375, -20.073974609375, -19.220703125, -18.367431640625, -17.51416015625, -16.660888671875, -15.8076171875, -14.954345703125, -14.10107421875, -13.247802734375, -12.39453125, -11.541259765625, -10.68798828125, -9.834716796875, -8.9814453125, -8.128173828125, -7.27490234375, -6.421630859375, -5.568359375, -4.715087890625, -3.86181640625, -3.008544921875, -2.1552734375, -1.302001953125, -0.44873046875, 0.404541015625, 1.2578125, 2.111083984375, 2.96435546875, 3.817626953125, 4.6708984375, 5.524169921875, 6.37744140625, 7.230712890625, 8.083984375, 8.937255859375, 9.79052734375, 10.643798828125, 11.4970703125, 12.350341796875, 13.20361328125, 14.056884765625, 14.91015625, 15.763427734375, 16.61669921875, 17.469970703125, 18.3232421875, 19.176513671875, 20.02978515625, 20.883056640625, 21.736328125, 22.589599609375, 23.44287109375, 24.296142578125, 25.1494140625, 26.002685546875, 26.85595703125, 27.709228515625, 28.5625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 21.0, 62.0, 172.0, 257.0, 244.0, 150.0, 68.0, 28.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.8848876953125, -130.14376831054688, -126.40263366699219, -122.66151428222656, -118.9203872680664, -115.17926025390625, -111.4381332397461, -107.69700622558594, -103.95588684082031, -100.21475982666016, -96.4736328125, -92.73251342773438, -88.99138641357422, -85.25025939941406, -81.5091323852539, -77.76800537109375, -74.0268783569336, -70.28575134277344, -66.54462432861328, -62.80350112915039, -59.0623779296875, -55.321250915527344, -51.58012390136719, -47.83899688720703, -44.09787368774414, -40.356746673583984, -36.615623474121094, -32.87449645996094, -29.133371353149414, -25.39224624633789, -21.651119232177734, -17.90999412536621, -14.168876647949219, -10.427751541137695, -6.6866254806518555, -2.9454994201660156, 0.7956256866455078, 4.536750793457031, 8.277877807617188, 12.019002914428711, 15.760128021240234, 19.501253128051758, 23.24237823486328, 26.983505249023438, 30.72463035583496, 34.465755462646484, 38.20688247680664, 41.94800567626953, 45.68913269042969, 49.430259704589844, 53.171382904052734, 56.91250991821289, 60.65363311767578, 64.39476013183594, 68.1358871459961, 71.87701416015625, 75.61813354492188, 79.35926055908203, 83.10038757324219, 86.84150695800781, 90.58263397216797, 94.32376098632812, 98.06488800048828, 101.80601501464844, 105.5471420288086]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 10.0, 12.0, 16.0, 15.0, 18.0, 19.0, 22.0, 13.0, 19.0, 31.0, 36.0, 30.0, 29.0, 31.0, 37.0, 51.0, 46.0, 31.0, 46.0, 32.0, 47.0, 38.0, 40.0, 31.0, 35.0, 30.0, 32.0, 17.0, 32.0, 19.0, 11.0, 6.0, 16.0, 11.0, 9.0, 14.0, 4.0, 6.0, 6.0, 4.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.39491844177246, -28.486658096313477, -27.578399658203125, -26.67013931274414, -25.761878967285156, -24.853620529174805, -23.94536018371582, -23.03710174560547, -22.128841400146484, -21.2205810546875, -20.31232261657715, -19.404062271118164, -18.495803833007812, -17.587543487548828, -16.679283142089844, -15.771023750305176, -14.862764358520508, -13.95450496673584, -13.046245574951172, -12.137985229492188, -11.22972583770752, -10.321466445922852, -9.413206100463867, -8.5049467086792, -7.596687316894531, -6.688427925109863, -5.780168056488037, -4.871908187866211, -3.963648796081543, -3.055389404296875, -2.147129535675049, -1.2388696670532227, -0.3306121826171875, 0.5776474475860596, 1.4859070777893066, 2.3941667079925537, 3.302426338195801, 4.210685729980469, 5.118945598602295, 6.027205467224121, 6.935464859008789, 7.843724250793457, 8.751983642578125, 9.66024398803711, 10.568503379821777, 11.476762771606445, 12.38502311706543, 13.293282508850098, 14.201541900634766, 15.109801292419434, 16.0180606842041, 16.926321029663086, 17.834579467773438, 18.742839813232422, 19.651100158691406, 20.55936050415039, 21.467618942260742, 22.375879287719727, 23.284137725830078, 24.192398071289062, 25.100658416748047, 26.0089168548584, 26.917177200317383, 27.825435638427734, 28.73369598388672]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 10.0, 20.0, 20.0, 20.0, 27.0, 20.0, 31.0, 21.0, 38.0, 38.0, 47.0, 43.0, 43.0, 38.0, 36.0, 61.0, 59.0, 39.0, 40.0, 46.0, 44.0, 37.0, 26.0, 26.0, 23.0, 15.0, 26.0, 21.0, 18.0, 18.0, 12.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.328125, -5.1812744140625, -5.034423828125, -4.8875732421875, -4.74072265625, -4.5938720703125, -4.447021484375, -4.3001708984375, -4.1533203125, -4.0064697265625, -3.859619140625, -3.7127685546875, -3.56591796875, -3.4190673828125, -3.272216796875, -3.1253662109375, -2.978515625, -2.8316650390625, -2.684814453125, -2.5379638671875, -2.39111328125, -2.2442626953125, -2.097412109375, -1.9505615234375, -1.8037109375, -1.6568603515625, -1.510009765625, -1.3631591796875, -1.21630859375, -1.0694580078125, -0.922607421875, -0.7757568359375, -0.62890625, -0.4820556640625, -0.335205078125, -0.1883544921875, -0.04150390625, 0.1053466796875, 0.252197265625, 0.3990478515625, 0.5458984375, 0.6927490234375, 0.839599609375, 0.9864501953125, 1.13330078125, 1.2801513671875, 1.427001953125, 1.5738525390625, 1.720703125, 1.8675537109375, 2.014404296875, 2.1612548828125, 2.30810546875, 2.4549560546875, 2.601806640625, 2.7486572265625, 2.8955078125, 3.0423583984375, 3.189208984375, 3.3360595703125, 3.48291015625, 3.6297607421875, 3.776611328125, 3.9234619140625, 4.0703125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 10.0, 19.0, 28.0, 35.0, 46.0, 72.0, 124.0, 158.0, 242.0, 402.0, 624.0, 1100.0, 1971.0, 3667.0, 6948.0, 13978.0, 29783.0, 73312.0, 241721.0, 429067.0, 149839.0, 50317.0, 22101.0, 10703.0, 5576.0, 2844.0, 1579.0, 840.0, 453.0, 347.0, 184.0, 134.0, 101.0, 65.0, 38.0, 35.0, 24.0, 16.0, 11.0, 12.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.748046875, -2.647430419921875, -2.54681396484375, -2.446197509765625, -2.3455810546875, -2.244964599609375, -2.14434814453125, -2.043731689453125, -1.943115234375, -1.842498779296875, -1.74188232421875, -1.641265869140625, -1.5406494140625, -1.440032958984375, -1.33941650390625, -1.238800048828125, -1.13818359375, -1.037567138671875, -0.93695068359375, -0.836334228515625, -0.7357177734375, -0.635101318359375, -0.53448486328125, -0.433868408203125, -0.333251953125, -0.232635498046875, -0.13201904296875, -0.031402587890625, 0.0692138671875, 0.169830322265625, 0.27044677734375, 0.371063232421875, 0.4716796875, 0.572296142578125, 0.67291259765625, 0.773529052734375, 0.8741455078125, 0.974761962890625, 1.07537841796875, 1.175994873046875, 1.276611328125, 1.377227783203125, 1.47784423828125, 1.578460693359375, 1.6790771484375, 1.779693603515625, 1.88031005859375, 1.980926513671875, 2.08154296875, 2.182159423828125, 2.28277587890625, 2.383392333984375, 2.4840087890625, 2.584625244140625, 2.68524169921875, 2.785858154296875, 2.886474609375, 2.987091064453125, 3.08770751953125, 3.188323974609375, 3.2889404296875, 3.389556884765625, 3.49017333984375, 3.590789794921875, 3.69140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 8.0, 12.0, 13.0, 10.0, 18.0, 24.0, 24.0, 20.0, 30.0, 46.0, 41.0, 48.0, 40.0, 39.0, 39.0, 52.0, 1076.0, 49.0, 71.0, 39.0, 32.0, 49.0, 32.0, 32.0, 31.0, 16.0, 16.0, 23.0, 20.0, 15.0, 12.0, 4.0, 15.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.23358154296875, -4.1116943359375, -3.98980712890625, -3.867919921875, -3.74603271484375, -3.6241455078125, -3.50225830078125, -3.38037109375, -3.25848388671875, -3.1365966796875, -3.01470947265625, -2.892822265625, -2.77093505859375, -2.6490478515625, -2.52716064453125, -2.4052734375, -2.28338623046875, -2.1614990234375, -2.03961181640625, -1.917724609375, -1.79583740234375, -1.6739501953125, -1.55206298828125, -1.43017578125, -1.30828857421875, -1.1864013671875, -1.06451416015625, -0.942626953125, -0.82073974609375, -0.6988525390625, -0.57696533203125, -0.455078125, -0.33319091796875, -0.2113037109375, -0.08941650390625, 0.032470703125, 0.15435791015625, 0.2762451171875, 0.39813232421875, 0.52001953125, 0.64190673828125, 0.7637939453125, 0.88568115234375, 1.007568359375, 1.12945556640625, 1.2513427734375, 1.37322998046875, 1.4951171875, 1.61700439453125, 1.7388916015625, 1.86077880859375, 1.982666015625, 2.10455322265625, 2.2264404296875, 2.34832763671875, 2.47021484375, 2.59210205078125, 2.7139892578125, 2.83587646484375, 2.957763671875, 3.07965087890625, 3.2015380859375, 3.32342529296875, 3.4453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 13.0, 14.0, 16.0, 31.0, 42.0, 64.0, 85.0, 129.0, 181.0, 253.0, 411.0, 668.0, 1150.0, 2104.0, 3838.0, 7991.0, 18134.0, 49638.0, 193230.0, 1352950.0, 348160.0, 72358.0, 24405.0, 10134.0, 4816.0, 2538.0, 1425.0, 828.0, 499.0, 336.0, 233.0, 113.0, 89.0, 82.0, 51.0, 26.0, 27.0, 15.0, 7.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.180816650390625, -2.10968017578125, -2.038543701171875, -1.9674072265625, -1.896270751953125, -1.82513427734375, -1.753997802734375, -1.682861328125, -1.611724853515625, -1.54058837890625, -1.469451904296875, -1.3983154296875, -1.327178955078125, -1.25604248046875, -1.184906005859375, -1.11376953125, -1.042633056640625, -0.97149658203125, -0.900360107421875, -0.8292236328125, -0.758087158203125, -0.68695068359375, -0.615814208984375, -0.544677734375, -0.473541259765625, -0.40240478515625, -0.331268310546875, -0.2601318359375, -0.188995361328125, -0.11785888671875, -0.046722412109375, 0.0244140625, 0.095550537109375, 0.16668701171875, 0.237823486328125, 0.3089599609375, 0.380096435546875, 0.45123291015625, 0.522369384765625, 0.593505859375, 0.664642333984375, 0.73577880859375, 0.806915283203125, 0.8780517578125, 0.949188232421875, 1.02032470703125, 1.091461181640625, 1.16259765625, 1.233734130859375, 1.30487060546875, 1.376007080078125, 1.4471435546875, 1.518280029296875, 1.58941650390625, 1.660552978515625, 1.731689453125, 1.802825927734375, 1.87396240234375, 1.945098876953125, 2.0162353515625, 2.087371826171875, 2.15850830078125, 2.229644775390625, 2.30078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 1.0, 3.0, 5.0, 3.0, 9.0, 12.0, 16.0, 22.0, 27.0, 31.0, 26.0, 41.0, 37.0, 80.0, 168.0, 134.0, 89.0, 51.0, 53.0, 37.0, 34.0, 23.0, 22.0, 21.0, 9.0, 10.0, 10.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3830986022949219, -0.36702728271484375, -0.3509559631347656, -0.3348846435546875, -0.3188133239746094, -0.30274200439453125, -0.2866706848144531, -0.270599365234375, -0.2545280456542969, -0.23845672607421875, -0.22238540649414062, -0.2063140869140625, -0.19024276733398438, -0.17417144775390625, -0.15810012817382812, -0.14202880859375, -0.12595748901367188, -0.10988616943359375, -0.09381484985351562, -0.0777435302734375, -0.061672210693359375, -0.04560089111328125, -0.029529571533203125, -0.013458251953125, 0.002613067626953125, 0.01868438720703125, 0.034755706787109375, 0.0508270263671875, 0.06689834594726562, 0.08296966552734375, 0.09904098510742188, 0.1151123046875, 0.13118362426757812, 0.14725494384765625, 0.16332626342773438, 0.1793975830078125, 0.19546890258789062, 0.21154022216796875, 0.22761154174804688, 0.243682861328125, 0.2597541809082031, 0.27582550048828125, 0.2918968200683594, 0.3079681396484375, 0.3240394592285156, 0.34011077880859375, 0.3561820983886719, 0.37225341796875, 0.3883247375488281, 0.40439605712890625, 0.4204673767089844, 0.4365386962890625, 0.4526100158691406, 0.46868133544921875, 0.4847526550292969, 0.500823974609375, 0.5168952941894531, 0.5329666137695312, 0.5490379333496094, 0.5651092529296875, 0.5811805725097656, 0.5972518920898438, 0.6133232116699219, 0.62939453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 8.0, 9.0, 11.0, 21.0, 23.0, 36.0, 55.0, 80.0, 144.0, 297.0, 1672.0, 36873.0, 993717.0, 13996.0, 1042.0, 236.0, 110.0, 63.0, 52.0, 30.0, 15.0, 15.0, 13.0, 5.0, 5.0, 2.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2265625, -11.8905029296875, -11.554443359375, -11.2183837890625, -10.88232421875, -10.5462646484375, -10.210205078125, -9.8741455078125, -9.5380859375, -9.2020263671875, -8.865966796875, -8.5299072265625, -8.19384765625, -7.8577880859375, -7.521728515625, -7.1856689453125, -6.849609375, -6.5135498046875, -6.177490234375, -5.8414306640625, -5.50537109375, -5.1693115234375, -4.833251953125, -4.4971923828125, -4.1611328125, -3.8250732421875, -3.489013671875, -3.1529541015625, -2.81689453125, -2.4808349609375, -2.144775390625, -1.8087158203125, -1.47265625, -1.1365966796875, -0.800537109375, -0.4644775390625, -0.12841796875, 0.2076416015625, 0.543701171875, 0.8797607421875, 1.2158203125, 1.5518798828125, 1.887939453125, 2.2239990234375, 2.56005859375, 2.8961181640625, 3.232177734375, 3.5682373046875, 3.904296875, 4.2403564453125, 4.576416015625, 4.9124755859375, 5.24853515625, 5.5845947265625, 5.920654296875, 6.2567138671875, 6.5927734375, 6.9288330078125, 7.264892578125, 7.6009521484375, 7.93701171875, 8.2730712890625, 8.609130859375, 8.9451904296875, 9.28125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 23.0, 56.0, 80.0, 133.0, 162.0, 179.0, 149.0, 89.0, 60.0, 37.0, 14.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.265110492706299, -2.2206451892852783, -2.1761796474456787, -2.131714344024658, -2.0872488021850586, -2.042783498764038, -1.998318076133728, -1.953852653503418, -1.909387230873108, -1.8649218082427979, -1.8204563856124878, -1.7759909629821777, -1.7315256595611572, -1.6870602369308472, -1.642594814300537, -1.598129391670227, -1.553663969039917, -1.509198546409607, -1.4647331237792969, -1.4202678203582764, -1.3758023977279663, -1.3313369750976562, -1.2868715524673462, -1.2424061298370361, -1.1979408264160156, -1.1534754037857056, -1.1090099811553955, -1.064544677734375, -1.020079255104065, -0.9756138324737549, -0.9311484098434448, -0.8866829872131348, -0.8422176241874695, -0.7977522015571594, -0.7532868385314941, -0.7088214159011841, -0.664355993270874, -0.619890570640564, -0.5754252076148987, -0.5309597849845886, -0.48649439215660095, -0.4420289993286133, -0.3975635766983032, -0.35309818387031555, -0.3086327910423279, -0.2641673684120178, -0.21970197558403015, -0.1752365529537201, -0.13077116012573242, -0.08630575239658356, -0.04184035211801529, 0.0026250481605529785, 0.04709045588970184, 0.09155586361885071, 0.13602125644683838, 0.18048667907714844, 0.2249520719051361, 0.2694174647331238, 0.31388288736343384, 0.3583482801914215, 0.4028136730194092, 0.44727909564971924, 0.4917444884777069, 0.5362099409103394, 0.5806753039360046]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 16.0, 18.0, 13.0, 23.0, 23.0, 25.0, 32.0, 31.0, 24.0, 35.0, 38.0, 35.0, 33.0, 40.0, 39.0, 38.0, 59.0, 36.0, 43.0, 39.0, 35.0, 31.0, 39.0, 21.0, 26.0, 24.0, 19.0, 16.0, 22.0, 14.0, 14.0, 11.0, 15.0, 11.0, 4.0, 5.0, 8.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.4848117232322693, -0.4708484709262848, -0.4568852186203003, -0.4429219961166382, -0.4289587438106537, -0.4149954915046692, -0.4010322391986847, -0.3870689868927002, -0.3731057643890381, -0.3591425120830536, -0.3451792597770691, -0.331216037273407, -0.3172527849674225, -0.303289532661438, -0.2893262803554535, -0.275363028049469, -0.2613997757434845, -0.2474365234375, -0.2334732860326767, -0.2195100337266922, -0.2055467963218689, -0.1915835440158844, -0.1776202917098999, -0.1636570394039154, -0.1496938019990921, -0.1357305496931076, -0.1217673122882843, -0.1078040599822998, -0.0938408151268959, -0.079877570271492, -0.06591431796550751, -0.05195107311010361, -0.03798782825469971, -0.024024581536650658, -0.010061334818601608, 0.0039019137620925903, 0.01786515861749649, 0.03182840347290039, 0.04579165577888489, 0.05975490063428879, 0.07371814548969269, 0.08768139034509659, 0.10164463520050049, 0.11560788750648499, 0.12957113981246948, 0.14353437721729279, 0.15749762952327728, 0.17146086692810059, 0.18542411923408508, 0.19938737154006958, 0.21335060894489288, 0.22731386125087738, 0.24127709865570068, 0.2552403509616852, 0.2692036032676697, 0.2831668555736542, 0.29713010787963867, 0.31109336018562317, 0.32505661249160767, 0.3390198349952698, 0.3529830873012543, 0.36694633960723877, 0.38090959191322327, 0.39487284421920776, 0.4088360667228699]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 6.0, 10.0, 15.0, 16.0, 30.0, 28.0, 22.0, 37.0, 29.0, 31.0, 36.0, 35.0, 41.0, 54.0, 46.0, 49.0, 47.0, 38.0, 48.0, 37.0, 41.0, 39.0, 33.0, 28.0, 26.0, 32.0, 24.0, 18.0, 15.0, 18.0, 16.0, 11.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.93359375, -4.79193115234375, -4.6502685546875, -4.50860595703125, -4.366943359375, -4.22528076171875, -4.0836181640625, -3.94195556640625, -3.80029296875, -3.65863037109375, -3.5169677734375, -3.37530517578125, -3.233642578125, -3.09197998046875, -2.9503173828125, -2.80865478515625, -2.6669921875, -2.52532958984375, -2.3836669921875, -2.24200439453125, -2.100341796875, -1.95867919921875, -1.8170166015625, -1.67535400390625, -1.53369140625, -1.39202880859375, -1.2503662109375, -1.10870361328125, -0.967041015625, -0.82537841796875, -0.6837158203125, -0.54205322265625, -0.400390625, -0.25872802734375, -0.1170654296875, 0.02459716796875, 0.166259765625, 0.30792236328125, 0.4495849609375, 0.59124755859375, 0.73291015625, 0.87457275390625, 1.0162353515625, 1.15789794921875, 1.299560546875, 1.44122314453125, 1.5828857421875, 1.72454833984375, 1.8662109375, 2.00787353515625, 2.1495361328125, 2.29119873046875, 2.432861328125, 2.57452392578125, 2.7161865234375, 2.85784912109375, 2.99951171875, 3.14117431640625, 3.2828369140625, 3.42449951171875, 3.566162109375, 3.70782470703125, 3.8494873046875, 3.99114990234375, 4.1328125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 13.0, 16.0, 33.0, 35.0, 59.0, 101.0, 174.0, 270.0, 467.0, 787.0, 1333.0, 2291.0, 4680.0, 9321.0, 22070.0, 58717.0, 182570.0, 448346.0, 206004.0, 65764.0, 24290.0, 10304.0, 4910.0, 2524.0, 1456.0, 796.0, 425.0, 281.0, 162.0, 124.0, 79.0, 46.0, 32.0, 26.0, 12.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.69830322265625, -6.4552001953125, -6.21209716796875, -5.968994140625, -5.72589111328125, -5.4827880859375, -5.23968505859375, -4.99658203125, -4.75347900390625, -4.5103759765625, -4.26727294921875, -4.024169921875, -3.78106689453125, -3.5379638671875, -3.29486083984375, -3.0517578125, -2.80865478515625, -2.5655517578125, -2.32244873046875, -2.079345703125, -1.83624267578125, -1.5931396484375, -1.35003662109375, -1.10693359375, -0.86383056640625, -0.6207275390625, -0.37762451171875, -0.134521484375, 0.10858154296875, 0.3516845703125, 0.59478759765625, 0.837890625, 1.08099365234375, 1.3240966796875, 1.56719970703125, 1.810302734375, 2.05340576171875, 2.2965087890625, 2.53961181640625, 2.78271484375, 3.02581787109375, 3.2689208984375, 3.51202392578125, 3.755126953125, 3.99822998046875, 4.2413330078125, 4.48443603515625, 4.7275390625, 4.97064208984375, 5.2137451171875, 5.45684814453125, 5.699951171875, 5.94305419921875, 6.1861572265625, 6.42926025390625, 6.67236328125, 6.91546630859375, 7.1585693359375, 7.40167236328125, 7.644775390625, 7.88787841796875, 8.1309814453125, 8.37408447265625, 8.6171875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 14.0, 15.0, 15.0, 18.0, 23.0, 24.0, 25.0, 43.0, 49.0, 56.0, 61.0, 104.0, 116.0, 233.0, 1404.0, 217.0, 150.0, 94.0, 67.0, 56.0, 53.0, 38.0, 31.0, 20.0, 30.0, 17.0, 14.0, 11.0, 11.0, 6.0, 3.0, 6.0, 3.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.9638671875, -13.474609375, -12.9853515625, -12.49609375, -12.0068359375, -11.517578125, -11.0283203125, -10.5390625, -10.0498046875, -9.560546875, -9.0712890625, -8.58203125, -8.0927734375, -7.603515625, -7.1142578125, -6.625, -6.1357421875, -5.646484375, -5.1572265625, -4.66796875, -4.1787109375, -3.689453125, -3.2001953125, -2.7109375, -2.2216796875, -1.732421875, -1.2431640625, -0.75390625, -0.2646484375, 0.224609375, 0.7138671875, 1.203125, 1.6923828125, 2.181640625, 2.6708984375, 3.16015625, 3.6494140625, 4.138671875, 4.6279296875, 5.1171875, 5.6064453125, 6.095703125, 6.5849609375, 7.07421875, 7.5634765625, 8.052734375, 8.5419921875, 9.03125, 9.5205078125, 10.009765625, 10.4990234375, 10.98828125, 11.4775390625, 11.966796875, 12.4560546875, 12.9453125, 13.4345703125, 13.923828125, 14.4130859375, 14.90234375, 15.3916015625, 15.880859375, 16.3701171875, 16.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 4.0, 11.0, 9.0, 16.0, 27.0, 34.0, 46.0, 60.0, 94.0, 122.0, 164.0, 250.0, 465.0, 1416.0, 16743.0, 2833635.0, 286089.0, 4722.0, 729.0, 322.0, 213.0, 149.0, 116.0, 71.0, 42.0, 37.0, 26.0, 23.0, 16.0, 12.0, 9.0, 4.0, 1.0, 4.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.4375, -40.1337890625, -38.830078125, -37.5263671875, -36.22265625, -34.9189453125, -33.615234375, -32.3115234375, -31.0078125, -29.7041015625, -28.400390625, -27.0966796875, -25.79296875, -24.4892578125, -23.185546875, -21.8818359375, -20.578125, -19.2744140625, -17.970703125, -16.6669921875, -15.36328125, -14.0595703125, -12.755859375, -11.4521484375, -10.1484375, -8.8447265625, -7.541015625, -6.2373046875, -4.93359375, -3.6298828125, -2.326171875, -1.0224609375, 0.28125, 1.5849609375, 2.888671875, 4.1923828125, 5.49609375, 6.7998046875, 8.103515625, 9.4072265625, 10.7109375, 12.0146484375, 13.318359375, 14.6220703125, 15.92578125, 17.2294921875, 18.533203125, 19.8369140625, 21.140625, 22.4443359375, 23.748046875, 25.0517578125, 26.35546875, 27.6591796875, 28.962890625, 30.2666015625, 31.5703125, 32.8740234375, 34.177734375, 35.4814453125, 36.78515625, 38.0888671875, 39.392578125, 40.6962890625, 42.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 32.0, 427.0, 496.0, 58.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-313.26287841796875, -307.46685791015625, -301.67083740234375, -295.8748474121094, -290.0788269042969, -284.2828063964844, -278.4867858886719, -272.6907653808594, -266.894775390625, -261.0987548828125, -255.30274963378906, -249.50672912597656, -243.71072387695312, -237.91470336914062, -232.11868286132812, -226.32266235351562, -220.52664184570312, -214.73062133789062, -208.9346160888672, -203.1385955810547, -197.34259033203125, -191.54656982421875, -185.75054931640625, -179.95452880859375, -174.1585235595703, -168.3625030517578, -162.56649780273438, -156.77047729492188, -150.97445678710938, -145.17845153808594, -139.38243103027344, -133.58642578125, -127.79042053222656, -121.9944076538086, -116.19839477539062, -110.40237426757812, -104.60636138916016, -98.81034851074219, -93.01432800292969, -87.21831512451172, -81.42230224609375, -75.62628936767578, -69.83027648925781, -64.03425598144531, -58.238243103027344, -52.442230224609375, -46.64621353149414, -40.850196838378906, -35.05418014526367, -29.25816535949707, -23.46215057373047, -17.666135787963867, -11.870121002197266, -6.074106216430664, -0.2780914306640625, 5.517925262451172, 11.31393814086914, 17.109952926635742, 22.905967712402344, 28.701982498168945, 34.49799728393555, 40.29401397705078, 46.09002685546875, 51.886043548583984, 57.68205642700195]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 13.0, 12.0, 16.0, 17.0, 21.0, 20.0, 17.0, 25.0, 26.0, 30.0, 39.0, 38.0, 34.0, 30.0, 42.0, 48.0, 35.0, 48.0, 42.0, 33.0, 34.0, 44.0, 41.0, 37.0, 31.0, 34.0, 39.0, 24.0, 22.0, 12.0, 20.0, 12.0, 17.0, 11.0, 8.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.94347381591797, -33.786163330078125, -32.62885665893555, -31.471546173095703, -30.31423568725586, -29.15692710876465, -27.999618530273438, -26.842308044433594, -25.684999465942383, -24.527690887451172, -23.370380401611328, -22.213071823120117, -21.055763244628906, -19.898452758789062, -18.74114418029785, -17.58383560180664, -16.426525115966797, -15.26921558380127, -14.111906051635742, -12.954597473144531, -11.797287940979004, -10.639978408813477, -9.482669830322266, -8.325360298156738, -7.168050765991211, -6.010741233825684, -4.8534321784973145, -3.696122884750366, -2.538813591003418, -1.3815040588378906, -0.22419500350952148, 0.9331140518188477, 2.090423583984375, 3.2477328777313232, 4.4050421714782715, 5.562351226806641, 6.719660758972168, 7.876970291137695, 9.034278869628906, 10.191588401794434, 11.348897933959961, 12.506207466125488, 13.663516998291016, 14.820825576782227, 15.978135108947754, 17.13544464111328, 18.292753219604492, 19.450061798095703, 20.607372283935547, 21.764680862426758, 22.9219913482666, 24.079299926757812, 25.236610412597656, 26.393918991088867, 27.551227569580078, 28.708538055419922, 29.865846633911133, 31.023155212402344, 32.18046569824219, 33.33777618408203, 34.49508285522461, 35.65239334106445, 36.8097038269043, 37.967010498046875, 39.12432098388672]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 9.0, 2.0, 11.0, 14.0, 13.0, 18.0, 23.0, 19.0, 31.0, 29.0, 31.0, 29.0, 39.0, 29.0, 46.0, 37.0, 46.0, 39.0, 44.0, 49.0, 39.0, 42.0, 41.0, 34.0, 39.0, 28.0, 29.0, 26.0, 23.0, 30.0, 15.0, 19.0, 22.0, 17.0, 9.0, 8.0, 9.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.19921875, -5.05413818359375, -4.9090576171875, -4.76397705078125, -4.618896484375, -4.47381591796875, -4.3287353515625, -4.18365478515625, -4.03857421875, -3.89349365234375, -3.7484130859375, -3.60333251953125, -3.458251953125, -3.31317138671875, -3.1680908203125, -3.02301025390625, -2.8779296875, -2.73284912109375, -2.5877685546875, -2.44268798828125, -2.297607421875, -2.15252685546875, -2.0074462890625, -1.86236572265625, -1.71728515625, -1.57220458984375, -1.4271240234375, -1.28204345703125, -1.136962890625, -0.99188232421875, -0.8468017578125, -0.70172119140625, -0.556640625, -0.41156005859375, -0.2664794921875, -0.12139892578125, 0.023681640625, 0.16876220703125, 0.3138427734375, 0.45892333984375, 0.60400390625, 0.74908447265625, 0.8941650390625, 1.03924560546875, 1.184326171875, 1.32940673828125, 1.4744873046875, 1.61956787109375, 1.7646484375, 1.90972900390625, 2.0548095703125, 2.19989013671875, 2.344970703125, 2.49005126953125, 2.6351318359375, 2.78021240234375, 2.92529296875, 3.07037353515625, 3.2154541015625, 3.36053466796875, 3.505615234375, 3.65069580078125, 3.7957763671875, 3.94085693359375, 4.0859375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 8.0, 10.0, 18.0, 24.0, 33.0, 52.0, 66.0, 98.0, 134.0, 222.0, 324.0, 566.0, 907.0, 1666.0, 3140.0, 6252.0, 13841.0, 34172.0, 103363.0, 438878.0, 1691449.0, 1425717.0, 335697.0, 85355.0, 29061.0, 11745.0, 5475.0, 2633.0, 1377.0, 744.0, 463.0, 280.0, 150.0, 128.0, 67.0, 59.0, 27.0, 26.0, 17.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.77734375, -6.55078125, -6.32421875, -6.09765625, -5.87109375, -5.64453125, -5.41796875, -5.19140625, -4.96484375, -4.73828125, -4.51171875, -4.28515625, -4.05859375, -3.83203125, -3.60546875, -3.37890625, -3.15234375, -2.92578125, -2.69921875, -2.47265625, -2.24609375, -2.01953125, -1.79296875, -1.56640625, -1.33984375, -1.11328125, -0.88671875, -0.66015625, -0.43359375, -0.20703125, 0.01953125, 0.24609375, 0.47265625, 0.69921875, 0.92578125, 1.15234375, 1.37890625, 1.60546875, 1.83203125, 2.05859375, 2.28515625, 2.51171875, 2.73828125, 2.96484375, 3.19140625, 3.41796875, 3.64453125, 3.87109375, 4.09765625, 4.32421875, 4.55078125, 4.77734375, 5.00390625, 5.23046875, 5.45703125, 5.68359375, 5.91015625, 6.13671875, 6.36328125, 6.58984375, 6.81640625, 7.04296875, 7.26953125, 7.49609375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 10.0, 6.0, 12.0, 10.0, 22.0, 32.0, 33.0, 54.0, 60.0, 91.0, 95.0, 121.0, 196.0, 228.0, 308.0, 441.0, 482.0, 450.0, 385.0, 270.0, 194.0, 116.0, 108.0, 85.0, 56.0, 46.0, 31.0, 31.0, 23.0, 17.0, 11.0, 9.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.4921875, -8.23883056640625, -7.9854736328125, -7.73211669921875, -7.478759765625, -7.22540283203125, -6.9720458984375, -6.71868896484375, -6.46533203125, -6.21197509765625, -5.9586181640625, -5.70526123046875, -5.451904296875, -5.19854736328125, -4.9451904296875, -4.69183349609375, -4.4384765625, -4.18511962890625, -3.9317626953125, -3.67840576171875, -3.425048828125, -3.17169189453125, -2.9183349609375, -2.66497802734375, -2.41162109375, -2.15826416015625, -1.9049072265625, -1.65155029296875, -1.398193359375, -1.14483642578125, -0.8914794921875, -0.63812255859375, -0.384765625, -0.13140869140625, 0.1219482421875, 0.37530517578125, 0.628662109375, 0.88201904296875, 1.1353759765625, 1.38873291015625, 1.64208984375, 1.89544677734375, 2.1488037109375, 2.40216064453125, 2.655517578125, 2.90887451171875, 3.1622314453125, 3.41558837890625, 3.6689453125, 3.92230224609375, 4.1756591796875, 4.42901611328125, 4.682373046875, 4.93572998046875, 5.1890869140625, 5.44244384765625, 5.69580078125, 5.94915771484375, 6.2025146484375, 6.45587158203125, 6.709228515625, 6.96258544921875, 7.2159423828125, 7.46929931640625, 7.72265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 13.0, 9.0, 13.0, 20.0, 23.0, 29.0, 47.0, 69.0, 96.0, 119.0, 257.0, 511.0, 1436.0, 7801.0, 76318.0, 1853732.0, 2155746.0, 86861.0, 8484.0, 1490.0, 473.0, 229.0, 156.0, 90.0, 68.0, 44.0, 43.0, 26.0, 16.0, 17.0, 11.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.34375, -21.62353515625, -20.9033203125, -20.18310546875, -19.462890625, -18.74267578125, -18.0224609375, -17.30224609375, -16.58203125, -15.86181640625, -15.1416015625, -14.42138671875, -13.701171875, -12.98095703125, -12.2607421875, -11.54052734375, -10.8203125, -10.10009765625, -9.3798828125, -8.65966796875, -7.939453125, -7.21923828125, -6.4990234375, -5.77880859375, -5.05859375, -4.33837890625, -3.6181640625, -2.89794921875, -2.177734375, -1.45751953125, -0.7373046875, -0.01708984375, 0.703125, 1.42333984375, 2.1435546875, 2.86376953125, 3.583984375, 4.30419921875, 5.0244140625, 5.74462890625, 6.46484375, 7.18505859375, 7.9052734375, 8.62548828125, 9.345703125, 10.06591796875, 10.7861328125, 11.50634765625, 12.2265625, 12.94677734375, 13.6669921875, 14.38720703125, 15.107421875, 15.82763671875, 16.5478515625, 17.26806640625, 17.98828125, 18.70849609375, 19.4287109375, 20.14892578125, 20.869140625, 21.58935546875, 22.3095703125, 23.02978515625, 23.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 40.0, 125.0, 270.0, 298.0, 176.0, 77.0, 18.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-220.17422485351562, -216.18434143066406, -212.19444274902344, -208.20455932617188, -204.2146759033203, -200.2247772216797, -196.23489379882812, -192.24501037597656, -188.25511169433594, -184.26522827148438, -180.27532958984375, -176.2854461669922, -172.29556274414062, -168.3056640625, -164.31578063964844, -160.32589721679688, -156.3360137939453, -152.34613037109375, -148.35623168945312, -144.36634826660156, -140.37646484375, -136.38656616210938, -132.3966827392578, -128.40679931640625, -124.41690063476562, -120.42700958251953, -116.43712615966797, -112.44723510742188, -108.45734405517578, -104.46746063232422, -100.47756958007812, -96.48768615722656, -92.497802734375, -88.5079116821289, -84.51802825927734, -80.52813720703125, -76.53824615478516, -72.5483627319336, -68.5584716796875, -64.56858825683594, -60.57868957519531, -56.588802337646484, -52.59891128540039, -48.60902404785156, -44.619136810302734, -40.629249572753906, -36.63935852050781, -32.649471282958984, -28.659584045410156, -24.669694900512695, -20.679807662963867, -16.689918518066406, -12.700030326843262, -8.710142135620117, -4.720252990722656, -0.7303657531738281, 3.259523391723633, 7.249411582946777, 11.239299774169922, 15.229188919067383, 19.219078063964844, 23.208965301513672, 27.198854446411133, 31.18874168395996, 35.17863082885742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 14.0, 15.0, 9.0, 14.0, 12.0, 14.0, 20.0, 19.0, 17.0, 25.0, 32.0, 29.0, 32.0, 28.0, 29.0, 28.0, 29.0, 45.0, 41.0, 37.0, 41.0, 34.0, 48.0, 32.0, 37.0, 28.0, 37.0, 28.0, 26.0, 22.0, 19.0, 32.0, 15.0, 17.0, 14.0, 8.0, 10.0, 12.0, 7.0, 2.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-27.830181121826172, -27.027921676635742, -26.225662231445312, -25.423404693603516, -24.621145248413086, -23.818885803222656, -23.016626358032227, -22.214366912841797, -21.412109375, -20.60984992980957, -19.80759048461914, -19.005332946777344, -18.203073501586914, -17.400814056396484, -16.598554611206055, -15.796295166015625, -14.994035720825195, -14.191776275634766, -13.389517784118652, -12.587258338928223, -11.78499984741211, -10.98274040222168, -10.18048095703125, -9.37822151184082, -8.575963020324707, -7.7737040519714355, -6.971445083618164, -6.169185638427734, -5.366926670074463, -4.564667701721191, -3.7624082565307617, -2.9601492881774902, -2.1578922271728516, -1.3556331396102905, -0.5533740520477295, 0.2488851547241211, 1.0511441230773926, 1.853403091430664, 2.6556625366210938, 3.4579215049743652, 4.260180473327637, 5.062439441680908, 5.86469841003418, 6.666957855224609, 7.469216823577881, 8.271475791931152, 9.073735237121582, 9.875993728637695, 10.678253173828125, 11.480512619018555, 12.282771110534668, 13.085030555725098, 13.887289047241211, 14.68954849243164, 15.49180793762207, 16.2940673828125, 17.096324920654297, 17.898584365844727, 18.700843811035156, 19.503101348876953, 20.305360794067383, 21.107620239257812, 21.909879684448242, 22.712139129638672, 23.5143985748291]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 5.0, 6.0, 6.0, 8.0, 10.0, 15.0, 14.0, 19.0, 31.0, 24.0, 30.0, 22.0, 37.0, 23.0, 36.0, 49.0, 41.0, 53.0, 41.0, 39.0, 44.0, 40.0, 40.0, 37.0, 33.0, 32.0, 28.0, 30.0, 23.0, 32.0, 34.0, 18.0, 17.0, 18.0, 10.0, 11.0, 7.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.2752685546875, -4.140380859375, -4.0054931640625, -3.87060546875, -3.7357177734375, -3.600830078125, -3.4659423828125, -3.3310546875, -3.1961669921875, -3.061279296875, -2.9263916015625, -2.79150390625, -2.6566162109375, -2.521728515625, -2.3868408203125, -2.251953125, -2.1170654296875, -1.982177734375, -1.8472900390625, -1.71240234375, -1.5775146484375, -1.442626953125, -1.3077392578125, -1.1728515625, -1.0379638671875, -0.903076171875, -0.7681884765625, -0.63330078125, -0.4984130859375, -0.363525390625, -0.2286376953125, -0.09375, 0.0411376953125, 0.176025390625, 0.3109130859375, 0.44580078125, 0.5806884765625, 0.715576171875, 0.8504638671875, 0.9853515625, 1.1202392578125, 1.255126953125, 1.3900146484375, 1.52490234375, 1.6597900390625, 1.794677734375, 1.9295654296875, 2.064453125, 2.1993408203125, 2.334228515625, 2.4691162109375, 2.60400390625, 2.7388916015625, 2.873779296875, 3.0086669921875, 3.1435546875, 3.2784423828125, 3.413330078125, 3.5482177734375, 3.68310546875, 3.8179931640625, 3.952880859375, 4.0877685546875, 4.22265625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 9.0, 21.0, 40.0, 67.0, 85.0, 156.0, 216.0, 409.0, 723.0, 1288.0, 2413.0, 4393.0, 8369.0, 16647.0, 34049.0, 75076.0, 224133.0, 432133.0, 140062.0, 55109.0, 25848.0, 12875.0, 6598.0, 3494.0, 1916.0, 1015.0, 584.0, 331.0, 181.0, 112.0, 64.0, 47.0, 37.0, 13.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.770172119140625, -3.63214111328125, -3.494110107421875, -3.3560791015625, -3.218048095703125, -3.08001708984375, -2.941986083984375, -2.803955078125, -2.665924072265625, -2.52789306640625, -2.389862060546875, -2.2518310546875, -2.113800048828125, -1.97576904296875, -1.837738037109375, -1.69970703125, -1.561676025390625, -1.42364501953125, -1.285614013671875, -1.1475830078125, -1.009552001953125, -0.87152099609375, -0.733489990234375, -0.595458984375, -0.457427978515625, -0.31939697265625, -0.181365966796875, -0.0433349609375, 0.094696044921875, 0.23272705078125, 0.370758056640625, 0.5087890625, 0.646820068359375, 0.78485107421875, 0.922882080078125, 1.0609130859375, 1.198944091796875, 1.33697509765625, 1.475006103515625, 1.613037109375, 1.751068115234375, 1.88909912109375, 2.027130126953125, 2.1651611328125, 2.303192138671875, 2.44122314453125, 2.579254150390625, 2.71728515625, 2.855316162109375, 2.99334716796875, 3.131378173828125, 3.2694091796875, 3.407440185546875, 3.54547119140625, 3.683502197265625, 3.821533203125, 3.959564208984375, 4.09759521484375, 4.235626220703125, 4.3736572265625, 4.511688232421875, 4.64971923828125, 4.787750244140625, 4.92578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 9.0, 13.0, 9.0, 10.0, 14.0, 20.0, 23.0, 24.0, 26.0, 30.0, 33.0, 34.0, 28.0, 36.0, 42.0, 41.0, 30.0, 48.0, 1061.0, 41.0, 45.0, 28.0, 26.0, 31.0, 31.0, 34.0, 20.0, 31.0, 22.0, 29.0, 20.0, 21.0, 12.0, 16.0, 12.0, 7.0, 6.0, 8.0, 4.0, 4.0, 6.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-3.287109375, -3.1925048828125, -3.097900390625, -3.0032958984375, -2.90869140625, -2.8140869140625, -2.719482421875, -2.6248779296875, -2.5302734375, -2.4356689453125, -2.341064453125, -2.2464599609375, -2.15185546875, -2.0572509765625, -1.962646484375, -1.8680419921875, -1.7734375, -1.6788330078125, -1.584228515625, -1.4896240234375, -1.39501953125, -1.3004150390625, -1.205810546875, -1.1112060546875, -1.0166015625, -0.9219970703125, -0.827392578125, -0.7327880859375, -0.63818359375, -0.5435791015625, -0.448974609375, -0.3543701171875, -0.259765625, -0.1651611328125, -0.070556640625, 0.0240478515625, 0.11865234375, 0.2132568359375, 0.307861328125, 0.4024658203125, 0.4970703125, 0.5916748046875, 0.686279296875, 0.7808837890625, 0.87548828125, 0.9700927734375, 1.064697265625, 1.1593017578125, 1.25390625, 1.3485107421875, 1.443115234375, 1.5377197265625, 1.63232421875, 1.7269287109375, 1.821533203125, 1.9161376953125, 2.0107421875, 2.1053466796875, 2.199951171875, 2.2945556640625, 2.38916015625, 2.4837646484375, 2.578369140625, 2.6729736328125, 2.767578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 0.0, 8.0, 11.0, 24.0, 26.0, 46.0, 47.0, 88.0, 146.0, 218.0, 384.0, 613.0, 1154.0, 2115.0, 4426.0, 10161.0, 26996.0, 96095.0, 1271199.0, 576029.0, 69629.0, 21118.0, 8524.0, 3694.0, 1876.0, 979.0, 551.0, 346.0, 208.0, 140.0, 81.0, 53.0, 34.0, 32.0, 20.0, 15.0, 15.0, 9.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.48046875, -4.34423828125, -4.2080078125, -4.07177734375, -3.935546875, -3.79931640625, -3.6630859375, -3.52685546875, -3.390625, -3.25439453125, -3.1181640625, -2.98193359375, -2.845703125, -2.70947265625, -2.5732421875, -2.43701171875, -2.30078125, -2.16455078125, -2.0283203125, -1.89208984375, -1.755859375, -1.61962890625, -1.4833984375, -1.34716796875, -1.2109375, -1.07470703125, -0.9384765625, -0.80224609375, -0.666015625, -0.52978515625, -0.3935546875, -0.25732421875, -0.12109375, 0.01513671875, 0.1513671875, 0.28759765625, 0.423828125, 0.56005859375, 0.6962890625, 0.83251953125, 0.96875, 1.10498046875, 1.2412109375, 1.37744140625, 1.513671875, 1.64990234375, 1.7861328125, 1.92236328125, 2.05859375, 2.19482421875, 2.3310546875, 2.46728515625, 2.603515625, 2.73974609375, 2.8759765625, 3.01220703125, 3.1484375, 3.28466796875, 3.4208984375, 3.55712890625, 3.693359375, 3.82958984375, 3.9658203125, 4.10205078125, 4.23828125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 8.0, 12.0, 14.0, 24.0, 21.0, 41.0, 71.0, 107.0, 205.0, 183.0, 94.0, 60.0, 33.0, 27.0, 26.0, 24.0, 10.0, 11.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.9979095458984375, -0.964569091796875, -0.9312286376953125, -0.89788818359375, -0.8645477294921875, -0.831207275390625, -0.7978668212890625, -0.7645263671875, -0.7311859130859375, -0.697845458984375, -0.6645050048828125, -0.63116455078125, -0.5978240966796875, -0.564483642578125, -0.5311431884765625, -0.497802734375, -0.4644622802734375, -0.431121826171875, -0.3977813720703125, -0.36444091796875, -0.3311004638671875, -0.297760009765625, -0.2644195556640625, -0.2310791015625, -0.1977386474609375, -0.164398193359375, -0.1310577392578125, -0.09771728515625, -0.0643768310546875, -0.031036376953125, 0.0023040771484375, 0.03564453125, 0.0689849853515625, 0.102325439453125, 0.1356658935546875, 0.16900634765625, 0.2023468017578125, 0.235687255859375, 0.2690277099609375, 0.3023681640625, 0.3357086181640625, 0.369049072265625, 0.4023895263671875, 0.43572998046875, 0.4690704345703125, 0.502410888671875, 0.5357513427734375, 0.569091796875, 0.6024322509765625, 0.635772705078125, 0.6691131591796875, 0.70245361328125, 0.7357940673828125, 0.769134521484375, 0.8024749755859375, 0.8358154296875, 0.8691558837890625, 0.902496337890625, 0.9358367919921875, 0.96917724609375, 1.0025177001953125, 1.035858154296875, 1.0691986083984375, 1.1025390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 5.0, 15.0, 12.0, 30.0, 27.0, 49.0, 60.0, 122.0, 293.0, 2357.0, 923098.0, 120810.0, 1164.0, 219.0, 98.0, 50.0, 38.0, 30.0, 18.0, 12.0, 6.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.828125, -18.25537109375, -17.6826171875, -17.10986328125, -16.537109375, -15.96435546875, -15.3916015625, -14.81884765625, -14.24609375, -13.67333984375, -13.1005859375, -12.52783203125, -11.955078125, -11.38232421875, -10.8095703125, -10.23681640625, -9.6640625, -9.09130859375, -8.5185546875, -7.94580078125, -7.373046875, -6.80029296875, -6.2275390625, -5.65478515625, -5.08203125, -4.50927734375, -3.9365234375, -3.36376953125, -2.791015625, -2.21826171875, -1.6455078125, -1.07275390625, -0.5, 0.07275390625, 0.6455078125, 1.21826171875, 1.791015625, 2.36376953125, 2.9365234375, 3.50927734375, 4.08203125, 4.65478515625, 5.2275390625, 5.80029296875, 6.373046875, 6.94580078125, 7.5185546875, 8.09130859375, 8.6640625, 9.23681640625, 9.8095703125, 10.38232421875, 10.955078125, 11.52783203125, 12.1005859375, 12.67333984375, 13.24609375, 13.81884765625, 14.3916015625, 14.96435546875, 15.537109375, 16.10986328125, 16.6826171875, 17.25537109375, 17.828125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 25.0, 337.0, 592.0, 63.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.474925994873047, -12.25655746459961, -12.038189888000488, -11.81982135772705, -11.601452827453613, -11.383085250854492, -11.164716720581055, -10.946348190307617, -10.72797966003418, -10.509611129760742, -10.291243553161621, -10.072875022888184, -9.854506492614746, -9.636138916015625, -9.417770385742188, -9.19940185546875, -8.981034278869629, -8.762665748596191, -8.54429817199707, -8.325929641723633, -8.107561111450195, -7.889193058013916, -7.670825004577637, -7.452456474304199, -7.234087944030762, -7.015719890594482, -6.797351360321045, -6.578983306884766, -6.360614776611328, -6.142246723175049, -5.9238786697387695, -5.705510139465332, -5.487142086029053, -5.268774032592773, -5.050405502319336, -4.832037448883057, -4.613668918609619, -4.39530086517334, -4.176932334899902, -3.958564281463623, -3.7401959896087646, -3.5218276977539062, -3.303459405899048, -3.0850911140441895, -2.86672306060791, -2.6483547687530518, -2.4299864768981934, -2.211618423461914, -1.9932500123977661, -1.7748817205429077, -1.5565135478973389, -1.3381452560424805, -1.119776964187622, -0.9014087915420532, -0.6830404996871948, -0.464672327041626, -0.24630403518676758, -0.02793578803539276, 0.19043245911598206, 0.40880072116851807, 0.6271689534187317, 0.8455371856689453, 1.0639054775238037, 1.2822736501693726, 1.500641942024231]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 11.0, 4.0, 8.0, 5.0, 4.0, 8.0, 14.0, 12.0, 15.0, 14.0, 26.0, 21.0, 12.0, 27.0, 19.0, 26.0, 26.0, 28.0, 30.0, 31.0, 36.0, 30.0, 44.0, 41.0, 32.0, 42.0, 38.0, 37.0, 29.0, 32.0, 32.0, 34.0, 26.0, 33.0, 27.0, 29.0, 24.0, 11.0, 13.0, 9.0, 15.0, 8.0, 7.0, 10.0, 5.0, 2.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5432991981506348, -0.5236790180206299, -0.5040588974952698, -0.4844387173652649, -0.46481853723526, -0.4451983869075775, -0.425578236579895, -0.40595805644989014, -0.38633787631988525, -0.36671772599220276, -0.3470975458621979, -0.3274773955345154, -0.3078572154045105, -0.288237065076828, -0.2686169147491455, -0.24899673461914062, -0.22937658429145813, -0.20975641906261444, -0.19013625383377075, -0.17051610350608826, -0.15089592337608337, -0.13127577304840088, -0.11165560781955719, -0.0920354425907135, -0.07241527736186981, -0.05279511213302612, -0.03317495062947273, -0.013554789125919342, 0.006065376102924347, 0.025685541331768036, 0.04530569911003113, 0.06492586433887482, 0.0845460295677185, 0.1041661947965622, 0.12378636002540588, 0.14340651035308838, 0.16302669048309326, 0.18264684081077576, 0.20226700603961945, 0.22188717126846313, 0.24150733649730682, 0.2611275017261505, 0.280747652053833, 0.3003678321838379, 0.3199879825115204, 0.33960816264152527, 0.35922831296920776, 0.37884849309921265, 0.39846864342689514, 0.41808879375457764, 0.4377089738845825, 0.457329124212265, 0.4769493043422699, 0.4965694546699524, 0.5161896347999573, 0.5358097553253174, 0.5554299354553223, 0.5750501155853271, 0.5946702361106873, 0.6142904162406921, 0.633910596370697, 0.6535307765007019, 0.673150897026062, 0.6927710771560669, 0.7123912572860718]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 10.0, 16.0, 13.0, 8.0, 18.0, 24.0, 29.0, 19.0, 28.0, 34.0, 30.0, 34.0, 35.0, 56.0, 33.0, 48.0, 44.0, 35.0, 43.0, 35.0, 34.0, 33.0, 36.0, 33.0, 39.0, 42.0, 23.0, 24.0, 17.0, 15.0, 19.0, 21.0, 10.0, 13.0, 9.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.1405029296875, -4.007568359375, -3.8746337890625, -3.74169921875, -3.6087646484375, -3.475830078125, -3.3428955078125, -3.2099609375, -3.0770263671875, -2.944091796875, -2.8111572265625, -2.67822265625, -2.5452880859375, -2.412353515625, -2.2794189453125, -2.146484375, -2.0135498046875, -1.880615234375, -1.7476806640625, -1.61474609375, -1.4818115234375, -1.348876953125, -1.2159423828125, -1.0830078125, -0.9500732421875, -0.817138671875, -0.6842041015625, -0.55126953125, -0.4183349609375, -0.285400390625, -0.1524658203125, -0.01953125, 0.1134033203125, 0.246337890625, 0.3792724609375, 0.51220703125, 0.6451416015625, 0.778076171875, 0.9110107421875, 1.0439453125, 1.1768798828125, 1.309814453125, 1.4427490234375, 1.57568359375, 1.7086181640625, 1.841552734375, 1.9744873046875, 2.107421875, 2.2403564453125, 2.373291015625, 2.5062255859375, 2.63916015625, 2.7720947265625, 2.905029296875, 3.0379638671875, 3.1708984375, 3.3038330078125, 3.436767578125, 3.5697021484375, 3.70263671875, 3.8355712890625, 3.968505859375, 4.1014404296875, 4.234375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 9.0, 8.0, 12.0, 25.0, 27.0, 44.0, 51.0, 73.0, 115.0, 170.0, 257.0, 399.0, 527.0, 881.0, 1287.0, 2044.0, 3232.0, 5953.0, 12328.0, 29265.0, 79223.0, 240252.0, 439728.0, 142659.0, 49588.0, 19653.0, 8681.0, 4622.0, 2556.0, 1640.0, 1110.0, 671.0, 455.0, 298.0, 215.0, 177.0, 105.0, 64.0, 49.0, 35.0, 23.0, 12.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0], "bins": [-6.48046875, -6.2967529296875, -6.113037109375, -5.9293212890625, -5.74560546875, -5.5618896484375, -5.378173828125, -5.1944580078125, -5.0107421875, -4.8270263671875, -4.643310546875, -4.4595947265625, -4.27587890625, -4.0921630859375, -3.908447265625, -3.7247314453125, -3.541015625, -3.3572998046875, -3.173583984375, -2.9898681640625, -2.80615234375, -2.6224365234375, -2.438720703125, -2.2550048828125, -2.0712890625, -1.8875732421875, -1.703857421875, -1.5201416015625, -1.33642578125, -1.1527099609375, -0.968994140625, -0.7852783203125, -0.6015625, -0.4178466796875, -0.234130859375, -0.0504150390625, 0.13330078125, 0.3170166015625, 0.500732421875, 0.6844482421875, 0.8681640625, 1.0518798828125, 1.235595703125, 1.4193115234375, 1.60302734375, 1.7867431640625, 1.970458984375, 2.1541748046875, 2.337890625, 2.5216064453125, 2.705322265625, 2.8890380859375, 3.07275390625, 3.2564697265625, 3.440185546875, 3.6239013671875, 3.8076171875, 3.9913330078125, 4.175048828125, 4.3587646484375, 4.54248046875, 4.7261962890625, 4.909912109375, 5.0936279296875, 5.27734375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 5.0, 16.0, 18.0, 13.0, 13.0, 16.0, 27.0, 28.0, 17.0, 18.0, 31.0, 41.0, 38.0, 60.0, 58.0, 99.0, 132.0, 267.0, 1400.0, 172.0, 92.0, 63.0, 56.0, 48.0, 45.0, 40.0, 34.0, 28.0, 31.0, 18.0, 18.0, 18.0, 11.0, 11.0, 10.0, 6.0, 3.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.5703125, -12.1915283203125, -11.812744140625, -11.4339599609375, -11.05517578125, -10.6763916015625, -10.297607421875, -9.9188232421875, -9.5400390625, -9.1612548828125, -8.782470703125, -8.4036865234375, -8.02490234375, -7.6461181640625, -7.267333984375, -6.8885498046875, -6.509765625, -6.1309814453125, -5.752197265625, -5.3734130859375, -4.99462890625, -4.6158447265625, -4.237060546875, -3.8582763671875, -3.4794921875, -3.1007080078125, -2.721923828125, -2.3431396484375, -1.96435546875, -1.5855712890625, -1.206787109375, -0.8280029296875, -0.44921875, -0.0704345703125, 0.308349609375, 0.6871337890625, 1.06591796875, 1.4447021484375, 1.823486328125, 2.2022705078125, 2.5810546875, 2.9598388671875, 3.338623046875, 3.7174072265625, 4.09619140625, 4.4749755859375, 4.853759765625, 5.2325439453125, 5.611328125, 5.9901123046875, 6.368896484375, 6.7476806640625, 7.12646484375, 7.5052490234375, 7.884033203125, 8.2628173828125, 8.6416015625, 9.0203857421875, 9.399169921875, 9.7779541015625, 10.15673828125, 10.5355224609375, 10.914306640625, 11.2930908203125, 11.671875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 13.0, 7.0, 10.0, 14.0, 27.0, 33.0, 36.0, 44.0, 71.0, 84.0, 139.0, 227.0, 422.0, 842.0, 2468.0, 14258.0, 1099528.0, 2005964.0, 16698.0, 2766.0, 870.0, 405.0, 227.0, 132.0, 96.0, 78.0, 54.0, 32.0, 31.0, 20.0, 21.0, 13.0, 12.0, 11.0, 8.0, 4.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.671875, -30.617431640625, -29.56298828125, -28.508544921875, -27.4541015625, -26.399658203125, -25.34521484375, -24.290771484375, -23.236328125, -22.181884765625, -21.12744140625, -20.072998046875, -19.0185546875, -17.964111328125, -16.90966796875, -15.855224609375, -14.80078125, -13.746337890625, -12.69189453125, -11.637451171875, -10.5830078125, -9.528564453125, -8.47412109375, -7.419677734375, -6.365234375, -5.310791015625, -4.25634765625, -3.201904296875, -2.1474609375, -1.093017578125, -0.03857421875, 1.015869140625, 2.0703125, 3.124755859375, 4.17919921875, 5.233642578125, 6.2880859375, 7.342529296875, 8.39697265625, 9.451416015625, 10.505859375, 11.560302734375, 12.61474609375, 13.669189453125, 14.7236328125, 15.778076171875, 16.83251953125, 17.886962890625, 18.94140625, 19.995849609375, 21.05029296875, 22.104736328125, 23.1591796875, 24.213623046875, 25.26806640625, 26.322509765625, 27.376953125, 28.431396484375, 29.48583984375, 30.540283203125, 31.5947265625, 32.649169921875, 33.70361328125, 34.758056640625, 35.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 15.0, 27.0, 50.0, 74.0, 118.0, 156.0, 155.0, 150.0, 111.0, 71.0, 36.0, 21.0, 12.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.981853485107422, -17.898008346557617, -16.814165115356445, -15.73031997680664, -14.646474838256836, -13.562630653381348, -12.47878646850586, -11.394941329956055, -10.311097145080566, -9.227252960205078, -8.143407821655273, -7.059563636779785, -5.975718975067139, -4.891874313354492, -3.808030128479004, -2.7241854667663574, -1.640340805053711, -0.556496262550354, 0.5273482799530029, 1.6111927032470703, 2.695037364959717, 3.7788820266723633, 4.862726211547852, 5.946570873260498, 7.0304155349731445, 8.114259719848633, 9.198104858398438, 10.281949043273926, 11.365793228149414, 12.449638366699219, 13.533482551574707, 14.617326736450195, 15.701171875, 16.785017013549805, 17.868860244750977, 18.95270538330078, 20.036550521850586, 21.12039566040039, 22.204238891601562, 23.288084030151367, 24.371929168701172, 25.455774307250977, 26.53961753845215, 27.623462677001953, 28.707307815551758, 29.791152954101562, 30.874996185302734, 31.95884132385254, 33.042686462402344, 34.126529693603516, 35.21037673950195, 36.294219970703125, 37.3780632019043, 38.461910247802734, 39.545753479003906, 40.62959671020508, 41.71343994140625, 42.79728317260742, 43.88113021850586, 44.96497344970703, 46.0488166809082, 47.13266372680664, 48.21650695800781, 49.300350189208984, 50.38419723510742]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 4.0, 9.0, 5.0, 13.0, 7.0, 15.0, 24.0, 12.0, 13.0, 25.0, 26.0, 39.0, 20.0, 41.0, 30.0, 31.0, 45.0, 45.0, 39.0, 43.0, 34.0, 46.0, 32.0, 31.0, 33.0, 25.0, 32.0, 33.0, 24.0, 26.0, 26.0, 20.0, 28.0, 11.0, 19.0, 12.0, 13.0, 15.0, 6.0, 8.0, 4.0, 10.0, 4.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.297121047973633, -29.283266067504883, -28.2694091796875, -27.25555419921875, -26.24169921875, -25.22784423828125, -24.2139892578125, -23.200132369995117, -22.186277389526367, -21.172422409057617, -20.158565521240234, -19.144710540771484, -18.130855560302734, -17.117000579833984, -16.103145599365234, -15.089288711547852, -14.075433731079102, -13.061578750610352, -12.047722816467285, -11.033866882324219, -10.020011901855469, -9.006156921386719, -7.992300987243652, -6.978445529937744, -5.964590072631836, -4.950734615325928, -3.9368791580200195, -2.9230237007141113, -1.9091682434082031, -0.8953127861022949, 0.11854267120361328, 1.1323981285095215, 2.1462554931640625, 3.1601109504699707, 4.173966407775879, 5.187821865081787, 6.201677322387695, 7.2155327796936035, 8.229388236999512, 9.243244171142578, 10.257099151611328, 11.270954132080078, 12.284810066223145, 13.298666000366211, 14.312520980834961, 15.326375961303711, 16.340232849121094, 17.354087829589844, 18.367942810058594, 19.381797790527344, 20.395652770996094, 21.409509658813477, 22.423364639282227, 23.437219619750977, 24.45107650756836, 25.46493148803711, 26.47878646850586, 27.49264144897461, 28.50649642944336, 29.520353317260742, 30.534208297729492, 31.548063278198242, 32.561920166015625, 33.575775146484375, 34.589630126953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 10.0, 4.0, 9.0, 9.0, 11.0, 15.0, 13.0, 13.0, 27.0, 18.0, 37.0, 35.0, 25.0, 33.0, 33.0, 29.0, 39.0, 42.0, 36.0, 49.0, 42.0, 43.0, 48.0, 42.0, 39.0, 28.0, 41.0, 24.0, 27.0, 18.0, 21.0, 24.0, 19.0, 19.0, 17.0, 17.0, 11.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.390625, -4.2490234375, -4.107421875, -3.9658203125, -3.82421875, -3.6826171875, -3.541015625, -3.3994140625, -3.2578125, -3.1162109375, -2.974609375, -2.8330078125, -2.69140625, -2.5498046875, -2.408203125, -2.2666015625, -2.125, -1.9833984375, -1.841796875, -1.7001953125, -1.55859375, -1.4169921875, -1.275390625, -1.1337890625, -0.9921875, -0.8505859375, -0.708984375, -0.5673828125, -0.42578125, -0.2841796875, -0.142578125, -0.0009765625, 0.140625, 0.2822265625, 0.423828125, 0.5654296875, 0.70703125, 0.8486328125, 0.990234375, 1.1318359375, 1.2734375, 1.4150390625, 1.556640625, 1.6982421875, 1.83984375, 1.9814453125, 2.123046875, 2.2646484375, 2.40625, 2.5478515625, 2.689453125, 2.8310546875, 2.97265625, 3.1142578125, 3.255859375, 3.3974609375, 3.5390625, 3.6806640625, 3.822265625, 3.9638671875, 4.10546875, 4.2470703125, 4.388671875, 4.5302734375, 4.671875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 15.0, 14.0, 14.0, 18.0, 20.0, 42.0, 56.0, 54.0, 70.0, 141.0, 247.0, 319.0, 587.0, 932.0, 1738.0, 3371.0, 6832.0, 14789.0, 37395.0, 114260.0, 482565.0, 1728734.0, 1341330.0, 325815.0, 83115.0, 28393.0, 11854.0, 5290.0, 2717.0, 1384.0, 764.0, 485.0, 282.0, 192.0, 121.0, 104.0, 64.0, 34.0, 34.0, 23.0, 20.0, 16.0, 10.0, 9.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.093505859375, -5.86669921875, -5.639892578125, -5.4130859375, -5.186279296875, -4.95947265625, -4.732666015625, -4.505859375, -4.279052734375, -4.05224609375, -3.825439453125, -3.5986328125, -3.371826171875, -3.14501953125, -2.918212890625, -2.69140625, -2.464599609375, -2.23779296875, -2.010986328125, -1.7841796875, -1.557373046875, -1.33056640625, -1.103759765625, -0.876953125, -0.650146484375, -0.42333984375, -0.196533203125, 0.0302734375, 0.257080078125, 0.48388671875, 0.710693359375, 0.9375, 1.164306640625, 1.39111328125, 1.617919921875, 1.8447265625, 2.071533203125, 2.29833984375, 2.525146484375, 2.751953125, 2.978759765625, 3.20556640625, 3.432373046875, 3.6591796875, 3.885986328125, 4.11279296875, 4.339599609375, 4.56640625, 4.793212890625, 5.02001953125, 5.246826171875, 5.4736328125, 5.700439453125, 5.92724609375, 6.154052734375, 6.380859375, 6.607666015625, 6.83447265625, 7.061279296875, 7.2880859375, 7.514892578125, 7.74169921875, 7.968505859375, 8.1953125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 11.0, 10.0, 11.0, 19.0, 21.0, 23.0, 41.0, 42.0, 49.0, 63.0, 92.0, 122.0, 190.0, 209.0, 286.0, 349.0, 444.0, 410.0, 397.0, 335.0, 233.0, 167.0, 122.0, 89.0, 76.0, 53.0, 55.0, 30.0, 31.0, 14.0, 17.0, 14.0, 11.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-8.2734375, -8.0306396484375, -7.787841796875, -7.5450439453125, -7.30224609375, -7.0594482421875, -6.816650390625, -6.5738525390625, -6.3310546875, -6.0882568359375, -5.845458984375, -5.6026611328125, -5.35986328125, -5.1170654296875, -4.874267578125, -4.6314697265625, -4.388671875, -4.1458740234375, -3.903076171875, -3.6602783203125, -3.41748046875, -3.1746826171875, -2.931884765625, -2.6890869140625, -2.4462890625, -2.2034912109375, -1.960693359375, -1.7178955078125, -1.47509765625, -1.2322998046875, -0.989501953125, -0.7467041015625, -0.50390625, -0.2611083984375, -0.018310546875, 0.2244873046875, 0.46728515625, 0.7100830078125, 0.952880859375, 1.1956787109375, 1.4384765625, 1.6812744140625, 1.924072265625, 2.1668701171875, 2.40966796875, 2.6524658203125, 2.895263671875, 3.1380615234375, 3.380859375, 3.6236572265625, 3.866455078125, 4.1092529296875, 4.35205078125, 4.5948486328125, 4.837646484375, 5.0804443359375, 5.3232421875, 5.5660400390625, 5.808837890625, 6.0516357421875, 6.29443359375, 6.5372314453125, 6.780029296875, 7.0228271484375, 7.265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 2.0, 13.0, 9.0, 13.0, 19.0, 37.0, 38.0, 55.0, 66.0, 93.0, 163.0, 212.0, 473.0, 2535.0, 44718.0, 3067586.0, 1056674.0, 19010.0, 1471.0, 389.0, 220.0, 133.0, 77.0, 69.0, 39.0, 37.0, 33.0, 21.0, 19.0, 12.0, 10.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.4169921875, -30.365234375, -29.3134765625, -28.26171875, -27.2099609375, -26.158203125, -25.1064453125, -24.0546875, -23.0029296875, -21.951171875, -20.8994140625, -19.84765625, -18.7958984375, -17.744140625, -16.6923828125, -15.640625, -14.5888671875, -13.537109375, -12.4853515625, -11.43359375, -10.3818359375, -9.330078125, -8.2783203125, -7.2265625, -6.1748046875, -5.123046875, -4.0712890625, -3.01953125, -1.9677734375, -0.916015625, 0.1357421875, 1.1875, 2.2392578125, 3.291015625, 4.3427734375, 5.39453125, 6.4462890625, 7.498046875, 8.5498046875, 9.6015625, 10.6533203125, 11.705078125, 12.7568359375, 13.80859375, 14.8603515625, 15.912109375, 16.9638671875, 18.015625, 19.0673828125, 20.119140625, 21.1708984375, 22.22265625, 23.2744140625, 24.326171875, 25.3779296875, 26.4296875, 27.4814453125, 28.533203125, 29.5849609375, 30.63671875, 31.6884765625, 32.740234375, 33.7919921875, 34.84375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 14.0, 25.0, 23.0, 57.0, 88.0, 127.0, 186.0, 155.0, 113.0, 92.0, 54.0, 33.0, 26.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.3377456665039, -67.4644775390625, -65.59121704101562, -63.717952728271484, -61.844688415527344, -59.9714241027832, -58.09815979003906, -56.22489547729492, -54.35163116455078, -52.47836685180664, -50.6051025390625, -48.73183822631836, -46.85857391357422, -44.98530960083008, -43.11204528808594, -41.2387809753418, -39.365516662597656, -37.492252349853516, -35.618988037109375, -33.745723724365234, -31.872459411621094, -29.999195098876953, -28.125930786132812, -26.252666473388672, -24.37940216064453, -22.50613784790039, -20.63287353515625, -18.75960922241211, -16.88634490966797, -15.013080596923828, -13.139816284179688, -11.266551971435547, -9.393291473388672, -7.520027160644531, -5.646762847900391, -3.77349853515625, -1.9002342224121094, -0.02696990966796875, 1.8462944030761719, 3.7195587158203125, 5.592823028564453, 7.466087341308594, 9.339351654052734, 11.212615966796875, 13.085880279541016, 14.959144592285156, 16.832408905029297, 18.705673217773438, 20.578937530517578, 22.45220184326172, 24.32546615600586, 26.19873046875, 28.07199478149414, 29.94525909423828, 31.818523406982422, 33.69178771972656, 35.5650520324707, 37.438316345214844, 39.311580657958984, 41.184844970703125, 43.058109283447266, 44.931373596191406, 46.80463790893555, 48.67790222167969, 50.55116653442383]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 8.0, 7.0, 7.0, 4.0, 7.0, 17.0, 19.0, 20.0, 17.0, 23.0, 22.0, 30.0, 35.0, 37.0, 49.0, 44.0, 35.0, 46.0, 30.0, 37.0, 38.0, 32.0, 47.0, 45.0, 31.0, 38.0, 29.0, 32.0, 34.0, 29.0, 16.0, 19.0, 19.0, 19.0, 17.0, 14.0, 11.0, 5.0, 5.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.34471321105957, -26.487995147705078, -25.631275177001953, -24.77455711364746, -23.917837142944336, -23.061119079589844, -22.20439910888672, -21.347681045532227, -20.4909610748291, -19.63424301147461, -18.777523040771484, -17.920804977416992, -17.064085006713867, -16.207366943359375, -15.35064697265625, -14.493928909301758, -13.63720989227295, -12.78049087524414, -11.923771858215332, -11.067052841186523, -10.210333824157715, -9.353614807128906, -8.496896743774414, -7.640177249908447, -6.783458232879639, -5.92673921585083, -5.0700201988220215, -4.213301658630371, -3.3565824031829834, -2.499863624572754, -1.6431446075439453, -0.7864255905151367, 0.07029342651367188, 0.9270123839378357, 1.7837313413619995, 2.6404502391815186, 3.497169256210327, 4.353888034820557, 5.210607051849365, 6.067326068878174, 6.924045085906982, 7.780764102935791, 8.637482643127441, 9.49420166015625, 10.350920677185059, 11.207639694213867, 12.064358711242676, 12.921077728271484, 13.777796745300293, 14.634515762329102, 15.49123477935791, 16.34795379638672, 17.20467185974121, 18.061391830444336, 18.918109893798828, 19.774829864501953, 20.631547927856445, 21.488265991210938, 22.344985961914062, 23.201704025268555, 24.05842399597168, 24.915142059326172, 25.771862030029297, 26.62858009338379, 27.485300064086914]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 8.0, 7.0, 12.0, 12.0, 18.0, 12.0, 13.0, 15.0, 18.0, 26.0, 35.0, 21.0, 37.0, 44.0, 34.0, 37.0, 35.0, 32.0, 45.0, 43.0, 41.0, 39.0, 30.0, 34.0, 42.0, 41.0, 35.0, 26.0, 24.0, 14.0, 17.0, 21.0, 14.0, 15.0, 17.0, 12.0, 15.0, 13.0, 7.0, 4.0, 2.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.515625, -4.388092041015625, -4.26055908203125, -4.133026123046875, -4.0054931640625, -3.877960205078125, -3.75042724609375, -3.622894287109375, -3.495361328125, -3.367828369140625, -3.24029541015625, -3.112762451171875, -2.9852294921875, -2.857696533203125, -2.73016357421875, -2.602630615234375, -2.47509765625, -2.347564697265625, -2.22003173828125, -2.092498779296875, -1.9649658203125, -1.837432861328125, -1.70989990234375, -1.582366943359375, -1.454833984375, -1.327301025390625, -1.19976806640625, -1.072235107421875, -0.9447021484375, -0.817169189453125, -0.68963623046875, -0.562103271484375, -0.4345703125, -0.307037353515625, -0.17950439453125, -0.051971435546875, 0.0755615234375, 0.203094482421875, 0.33062744140625, 0.458160400390625, 0.585693359375, 0.713226318359375, 0.84075927734375, 0.968292236328125, 1.0958251953125, 1.223358154296875, 1.35089111328125, 1.478424072265625, 1.60595703125, 1.733489990234375, 1.86102294921875, 1.988555908203125, 2.1160888671875, 2.243621826171875, 2.37115478515625, 2.498687744140625, 2.626220703125, 2.753753662109375, 2.88128662109375, 3.008819580078125, 3.1363525390625, 3.263885498046875, 3.39141845703125, 3.518951416015625, 3.646484375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 7.0, 11.0, 17.0, 15.0, 44.0, 69.0, 81.0, 140.0, 178.0, 269.0, 401.0, 616.0, 955.0, 1571.0, 2441.0, 4202.0, 7509.0, 16096.0, 41797.0, 200931.0, 592019.0, 119549.0, 30542.0, 12874.0, 6549.0, 3591.0, 2171.0, 1323.0, 884.0, 550.0, 374.0, 247.0, 182.0, 117.0, 66.0, 55.0, 30.0, 19.0, 12.0, 10.0, 14.0, 3.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.8409423828125, -5.635009765625, -5.4290771484375, -5.22314453125, -5.0172119140625, -4.811279296875, -4.6053466796875, -4.3994140625, -4.1934814453125, -3.987548828125, -3.7816162109375, -3.57568359375, -3.3697509765625, -3.163818359375, -2.9578857421875, -2.751953125, -2.5460205078125, -2.340087890625, -2.1341552734375, -1.92822265625, -1.7222900390625, -1.516357421875, -1.3104248046875, -1.1044921875, -0.8985595703125, -0.692626953125, -0.4866943359375, -0.28076171875, -0.0748291015625, 0.131103515625, 0.3370361328125, 0.54296875, 0.7489013671875, 0.954833984375, 1.1607666015625, 1.36669921875, 1.5726318359375, 1.778564453125, 1.9844970703125, 2.1904296875, 2.3963623046875, 2.602294921875, 2.8082275390625, 3.01416015625, 3.2200927734375, 3.426025390625, 3.6319580078125, 3.837890625, 4.0438232421875, 4.249755859375, 4.4556884765625, 4.66162109375, 4.8675537109375, 5.073486328125, 5.2794189453125, 5.4853515625, 5.6912841796875, 5.897216796875, 6.1031494140625, 6.30908203125, 6.5150146484375, 6.720947265625, 6.9268798828125, 7.1328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 7.0, 13.0, 3.0, 9.0, 6.0, 14.0, 9.0, 11.0, 16.0, 22.0, 25.0, 15.0, 23.0, 31.0, 26.0, 40.0, 41.0, 39.0, 31.0, 47.0, 32.0, 33.0, 1058.0, 33.0, 37.0, 45.0, 37.0, 37.0, 31.0, 30.0, 37.0, 26.0, 19.0, 15.0, 18.0, 15.0, 9.0, 15.0, 7.0, 11.0, 11.0, 9.0, 7.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.939453125, -2.84259033203125, -2.7457275390625, -2.64886474609375, -2.552001953125, -2.45513916015625, -2.3582763671875, -2.26141357421875, -2.16455078125, -2.06768798828125, -1.9708251953125, -1.87396240234375, -1.777099609375, -1.68023681640625, -1.5833740234375, -1.48651123046875, -1.3896484375, -1.29278564453125, -1.1959228515625, -1.09906005859375, -1.002197265625, -0.90533447265625, -0.8084716796875, -0.71160888671875, -0.61474609375, -0.51788330078125, -0.4210205078125, -0.32415771484375, -0.227294921875, -0.13043212890625, -0.0335693359375, 0.06329345703125, 0.16015625, 0.25701904296875, 0.3538818359375, 0.45074462890625, 0.547607421875, 0.64447021484375, 0.7413330078125, 0.83819580078125, 0.93505859375, 1.03192138671875, 1.1287841796875, 1.22564697265625, 1.322509765625, 1.41937255859375, 1.5162353515625, 1.61309814453125, 1.7099609375, 1.80682373046875, 1.9036865234375, 2.00054931640625, 2.097412109375, 2.19427490234375, 2.2911376953125, 2.38800048828125, 2.48486328125, 2.58172607421875, 2.6785888671875, 2.77545166015625, 2.872314453125, 2.96917724609375, 3.0660400390625, 3.16290283203125, 3.259765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 10.0, 5.0, 21.0, 27.0, 34.0, 44.0, 81.0, 95.0, 163.0, 221.0, 304.0, 463.0, 667.0, 1142.0, 1857.0, 3281.0, 6505.0, 15230.0, 49602.0, 468380.0, 1424751.0, 84772.0, 21021.0, 8384.0, 3971.0, 2220.0, 1282.0, 865.0, 515.0, 360.0, 244.0, 179.0, 104.0, 82.0, 69.0, 51.0, 26.0, 30.0, 22.0, 11.0, 12.0, 6.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.33795166015625, -5.1719970703125, -5.00604248046875, -4.840087890625, -4.67413330078125, -4.5081787109375, -4.34222412109375, -4.17626953125, -4.01031494140625, -3.8443603515625, -3.67840576171875, -3.512451171875, -3.34649658203125, -3.1805419921875, -3.01458740234375, -2.8486328125, -2.68267822265625, -2.5167236328125, -2.35076904296875, -2.184814453125, -2.01885986328125, -1.8529052734375, -1.68695068359375, -1.52099609375, -1.35504150390625, -1.1890869140625, -1.02313232421875, -0.857177734375, -0.69122314453125, -0.5252685546875, -0.35931396484375, -0.193359375, -0.02740478515625, 0.1385498046875, 0.30450439453125, 0.470458984375, 0.63641357421875, 0.8023681640625, 0.96832275390625, 1.13427734375, 1.30023193359375, 1.4661865234375, 1.63214111328125, 1.798095703125, 1.96405029296875, 2.1300048828125, 2.29595947265625, 2.4619140625, 2.62786865234375, 2.7938232421875, 2.95977783203125, 3.125732421875, 3.29168701171875, 3.4576416015625, 3.62359619140625, 3.78955078125, 3.95550537109375, 4.1214599609375, 4.28741455078125, 4.453369140625, 4.61932373046875, 4.7852783203125, 4.95123291015625, 5.1171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 8.0, 16.0, 16.0, 23.0, 34.0, 35.0, 52.0, 66.0, 82.0, 94.0, 129.0, 95.0, 74.0, 39.0, 40.0, 44.0, 22.0, 19.0, 18.0, 15.0, 8.0, 7.0, 7.0, 5.0, 9.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.84814453125, -0.8253021240234375, -0.802459716796875, -0.7796173095703125, -0.75677490234375, -0.7339324951171875, -0.711090087890625, -0.6882476806640625, -0.6654052734375, -0.6425628662109375, -0.619720458984375, -0.5968780517578125, -0.57403564453125, -0.5511932373046875, -0.528350830078125, -0.5055084228515625, -0.482666015625, -0.4598236083984375, -0.436981201171875, -0.4141387939453125, -0.39129638671875, -0.3684539794921875, -0.345611572265625, -0.3227691650390625, -0.2999267578125, -0.2770843505859375, -0.254241943359375, -0.2313995361328125, -0.20855712890625, -0.1857147216796875, -0.162872314453125, -0.1400299072265625, -0.1171875, -0.0943450927734375, -0.071502685546875, -0.0486602783203125, -0.02581787109375, -0.0029754638671875, 0.019866943359375, 0.0427093505859375, 0.0655517578125, 0.0883941650390625, 0.111236572265625, 0.1340789794921875, 0.15692138671875, 0.1797637939453125, 0.202606201171875, 0.2254486083984375, 0.248291015625, 0.2711334228515625, 0.293975830078125, 0.3168182373046875, 0.33966064453125, 0.3625030517578125, 0.385345458984375, 0.4081878662109375, 0.4310302734375, 0.4538726806640625, 0.476715087890625, 0.4995574951171875, 0.52239990234375, 0.5452423095703125, 0.568084716796875, 0.5909271240234375, 0.61376953125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 10.0, 6.0, 8.0, 7.0, 7.0, 14.0, 13.0, 28.0, 31.0, 46.0, 62.0, 136.0, 283.0, 1594.0, 32960.0, 999510.0, 12363.0, 943.0, 218.0, 89.0, 70.0, 46.0, 20.0, 19.0, 19.0, 10.0, 14.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4891357421875, -12.032958984375, -11.5767822265625, -11.12060546875, -10.6644287109375, -10.208251953125, -9.7520751953125, -9.2958984375, -8.8397216796875, -8.383544921875, -7.9273681640625, -7.47119140625, -7.0150146484375, -6.558837890625, -6.1026611328125, -5.646484375, -5.1903076171875, -4.734130859375, -4.2779541015625, -3.82177734375, -3.3656005859375, -2.909423828125, -2.4532470703125, -1.9970703125, -1.5408935546875, -1.084716796875, -0.6285400390625, -0.17236328125, 0.2838134765625, 0.739990234375, 1.1961669921875, 1.65234375, 2.1085205078125, 2.564697265625, 3.0208740234375, 3.47705078125, 3.9332275390625, 4.389404296875, 4.8455810546875, 5.3017578125, 5.7579345703125, 6.214111328125, 6.6702880859375, 7.12646484375, 7.5826416015625, 8.038818359375, 8.4949951171875, 8.951171875, 9.4073486328125, 9.863525390625, 10.3197021484375, 10.77587890625, 11.2320556640625, 11.688232421875, 12.1444091796875, 12.6005859375, 13.0567626953125, 13.512939453125, 13.9691162109375, 14.42529296875, 14.8814697265625, 15.337646484375, 15.7938232421875, 16.25]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 43.0, 176.0, 289.0, 297.0, 136.0, 37.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.868434429168701, -4.772968769073486, -4.6775031089782715, -4.582037448883057, -4.486571788787842, -4.391106605529785, -4.29564094543457, -4.2001752853393555, -4.104709625244141, -4.009243965148926, -3.913778305053711, -3.818312883377075, -3.7228472232818604, -3.6273815631866455, -3.5319159030914307, -3.436450481414795, -3.34098482131958, -3.2455191612243652, -3.1500535011291504, -3.0545880794525146, -2.9591224193573, -2.863656759262085, -2.76819109916687, -2.6727256774902344, -2.5772597789764404, -2.4817941188812256, -2.3863284587860107, -2.290863037109375, -2.19539737701416, -2.0999317169189453, -2.0044660568237305, -1.9090005159378052, -1.8135349750518799, -1.718069314956665, -1.6226037740707397, -1.527138113975525, -1.4316725730895996, -1.3362069129943848, -1.24074125289917, -1.1452757120132446, -1.0498101711273193, -0.9543445706367493, -0.8588789701461792, -0.7634133100509644, -0.6679477691650391, -0.5724821090698242, -0.47701650857925415, -0.3815509080886841, -0.28608524799346924, -0.19061964750289917, -0.09515403211116791, 0.0003115832805633545, 0.09577718377113342, 0.1912427842617035, 0.28670841455459595, 0.382174015045166, 0.4776396155357361, 0.5731052160263062, 0.6685708165168762, 0.7640364170074463, 0.8595020771026611, 0.9549676179885864, 1.0504332780838013, 1.1458988189697266, 1.2413644790649414]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 11.0, 3.0, 6.0, 9.0, 11.0, 7.0, 14.0, 24.0, 13.0, 25.0, 17.0, 24.0, 33.0, 25.0, 28.0, 30.0, 34.0, 32.0, 44.0, 55.0, 41.0, 42.0, 41.0, 37.0, 36.0, 32.0, 39.0, 25.0, 24.0, 24.0, 27.0, 32.0, 24.0, 21.0, 16.0, 13.0, 15.0, 14.0, 14.0, 10.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.692436158657074, -0.672741174697876, -0.6530461311340332, -0.6333511471748352, -0.6136561632156372, -0.5939611792564392, -0.5742661952972412, -0.5545711517333984, -0.5348761677742004, -0.5151811838150024, -0.49548617005348206, -0.47579115629196167, -0.45609617233276367, -0.4364011883735657, -0.4167061746120453, -0.3970111608505249, -0.3773161768913269, -0.3576211929321289, -0.3379261791706085, -0.31823116540908813, -0.29853618144989014, -0.27884119749069214, -0.25914618372917175, -0.23945118486881256, -0.21975618600845337, -0.20006118714809418, -0.18036618828773499, -0.1606711894273758, -0.1409761905670166, -0.12128119170665741, -0.10158619284629822, -0.08189119398593903, -0.06219625473022461, -0.04250125586986542, -0.022806257009506226, -0.0031112581491470337, 0.016583740711212158, 0.03627873957157135, 0.05597373843193054, 0.07566873729228973, 0.09536373615264893, 0.11505873501300812, 0.1347537338733673, 0.1544487327337265, 0.1741437315940857, 0.19383873045444489, 0.21353372931480408, 0.23322872817516327, 0.25292372703552246, 0.27261871099472046, 0.29231372475624084, 0.31200873851776123, 0.33170372247695923, 0.3513987064361572, 0.3710937201976776, 0.390788733959198, 0.410483717918396, 0.430178701877594, 0.4498737156391144, 0.46956872940063477, 0.48926371335983276, 0.5089586973190308, 0.5286537408828735, 0.5483487248420715, 0.5680437088012695]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 7.0, 4.0, 5.0, 8.0, 13.0, 14.0, 13.0, 25.0, 22.0, 24.0, 22.0, 25.0, 29.0, 36.0, 24.0, 45.0, 40.0, 41.0, 36.0, 37.0, 46.0, 40.0, 39.0, 49.0, 40.0, 34.0, 36.0, 30.0, 33.0, 25.0, 20.0, 25.0, 19.0, 19.0, 13.0, 16.0, 9.0, 11.0, 11.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-5.0234375, -4.88629150390625, -4.7491455078125, -4.61199951171875, -4.474853515625, -4.33770751953125, -4.2005615234375, -4.06341552734375, -3.92626953125, -3.78912353515625, -3.6519775390625, -3.51483154296875, -3.377685546875, -3.24053955078125, -3.1033935546875, -2.96624755859375, -2.8291015625, -2.69195556640625, -2.5548095703125, -2.41766357421875, -2.280517578125, -2.14337158203125, -2.0062255859375, -1.86907958984375, -1.73193359375, -1.59478759765625, -1.4576416015625, -1.32049560546875, -1.183349609375, -1.04620361328125, -0.9090576171875, -0.77191162109375, -0.634765625, -0.49761962890625, -0.3604736328125, -0.22332763671875, -0.086181640625, 0.05096435546875, 0.1881103515625, 0.32525634765625, 0.46240234375, 0.59954833984375, 0.7366943359375, 0.87384033203125, 1.010986328125, 1.14813232421875, 1.2852783203125, 1.42242431640625, 1.5595703125, 1.69671630859375, 1.8338623046875, 1.97100830078125, 2.108154296875, 2.24530029296875, 2.3824462890625, 2.51959228515625, 2.65673828125, 2.79388427734375, 2.9310302734375, 3.06817626953125, 3.205322265625, 3.34246826171875, 3.4796142578125, 3.61676025390625, 3.75390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 8.0, 8.0, 19.0, 22.0, 26.0, 39.0, 44.0, 86.0, 111.0, 149.0, 181.0, 319.0, 440.0, 660.0, 1160.0, 1853.0, 3232.0, 6371.0, 12656.0, 25858.0, 55610.0, 136954.0, 410598.0, 234544.0, 83050.0, 37226.0, 17625.0, 8758.0, 4579.0, 2399.0, 1416.0, 810.0, 513.0, 363.0, 251.0, 182.0, 112.0, 85.0, 58.0, 39.0, 35.0, 22.0, 16.0, 15.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.38909912109375, -5.2078857421875, -5.02667236328125, -4.845458984375, -4.66424560546875, -4.4830322265625, -4.30181884765625, -4.12060546875, -3.93939208984375, -3.7581787109375, -3.57696533203125, -3.395751953125, -3.21453857421875, -3.0333251953125, -2.85211181640625, -2.6708984375, -2.48968505859375, -2.3084716796875, -2.12725830078125, -1.946044921875, -1.76483154296875, -1.5836181640625, -1.40240478515625, -1.22119140625, -1.03997802734375, -0.8587646484375, -0.67755126953125, -0.496337890625, -0.31512451171875, -0.1339111328125, 0.04730224609375, 0.228515625, 0.40972900390625, 0.5909423828125, 0.77215576171875, 0.953369140625, 1.13458251953125, 1.3157958984375, 1.49700927734375, 1.67822265625, 1.85943603515625, 2.0406494140625, 2.22186279296875, 2.403076171875, 2.58428955078125, 2.7655029296875, 2.94671630859375, 3.1279296875, 3.30914306640625, 3.4903564453125, 3.67156982421875, 3.852783203125, 4.03399658203125, 4.2152099609375, 4.39642333984375, 4.57763671875, 4.75885009765625, 4.9400634765625, 5.12127685546875, 5.302490234375, 5.48370361328125, 5.6649169921875, 5.84613037109375, 6.02734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 4.0, 5.0, 8.0, 10.0, 18.0, 18.0, 17.0, 19.0, 20.0, 30.0, 23.0, 35.0, 47.0, 42.0, 63.0, 85.0, 157.0, 1406.0, 336.0, 171.0, 98.0, 65.0, 42.0, 41.0, 46.0, 26.0, 26.0, 29.0, 28.0, 25.0, 20.0, 14.0, 9.0, 10.0, 12.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.734375, -13.29052734375, -12.8466796875, -12.40283203125, -11.958984375, -11.51513671875, -11.0712890625, -10.62744140625, -10.18359375, -9.73974609375, -9.2958984375, -8.85205078125, -8.408203125, -7.96435546875, -7.5205078125, -7.07666015625, -6.6328125, -6.18896484375, -5.7451171875, -5.30126953125, -4.857421875, -4.41357421875, -3.9697265625, -3.52587890625, -3.08203125, -2.63818359375, -2.1943359375, -1.75048828125, -1.306640625, -0.86279296875, -0.4189453125, 0.02490234375, 0.46875, 0.91259765625, 1.3564453125, 1.80029296875, 2.244140625, 2.68798828125, 3.1318359375, 3.57568359375, 4.01953125, 4.46337890625, 4.9072265625, 5.35107421875, 5.794921875, 6.23876953125, 6.6826171875, 7.12646484375, 7.5703125, 8.01416015625, 8.4580078125, 8.90185546875, 9.345703125, 9.78955078125, 10.2333984375, 10.67724609375, 11.12109375, 11.56494140625, 12.0087890625, 12.45263671875, 12.896484375, 13.34033203125, 13.7841796875, 14.22802734375, 14.671875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 8.0, 3.0, 4.0, 2.0, 7.0, 10.0, 4.0, 14.0, 12.0, 22.0, 18.0, 25.0, 55.0, 45.0, 69.0, 91.0, 110.0, 133.0, 198.0, 295.0, 583.0, 2453.0, 33593.0, 2724695.0, 372634.0, 8246.0, 1124.0, 358.0, 209.0, 170.0, 107.0, 105.0, 63.0, 55.0, 42.0, 34.0, 26.0, 27.0, 15.0, 6.0, 6.0, 8.0, 7.0, 8.0, 3.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.625, -27.72412109375, -26.8232421875, -25.92236328125, -25.021484375, -24.12060546875, -23.2197265625, -22.31884765625, -21.41796875, -20.51708984375, -19.6162109375, -18.71533203125, -17.814453125, -16.91357421875, -16.0126953125, -15.11181640625, -14.2109375, -13.31005859375, -12.4091796875, -11.50830078125, -10.607421875, -9.70654296875, -8.8056640625, -7.90478515625, -7.00390625, -6.10302734375, -5.2021484375, -4.30126953125, -3.400390625, -2.49951171875, -1.5986328125, -0.69775390625, 0.203125, 1.10400390625, 2.0048828125, 2.90576171875, 3.806640625, 4.70751953125, 5.6083984375, 6.50927734375, 7.41015625, 8.31103515625, 9.2119140625, 10.11279296875, 11.013671875, 11.91455078125, 12.8154296875, 13.71630859375, 14.6171875, 15.51806640625, 16.4189453125, 17.31982421875, 18.220703125, 19.12158203125, 20.0224609375, 20.92333984375, 21.82421875, 22.72509765625, 23.6259765625, 24.52685546875, 25.427734375, 26.32861328125, 27.2294921875, 28.13037109375, 29.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 271.0, 617.0, 104.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-245.40943908691406, -240.8939666748047, -236.37847900390625, -231.86300659179688, -227.3475341796875, -222.83206176757812, -218.31658935546875, -213.8011016845703, -209.28562927246094, -204.77015686035156, -200.25466918945312, -195.73919677734375, -191.22372436523438, -186.708251953125, -182.19277954101562, -177.6772918701172, -173.1618194580078, -168.64634704589844, -164.130859375, -159.61538696289062, -155.09991455078125, -150.58444213867188, -146.0689697265625, -141.55348205566406, -137.0380096435547, -132.5225372314453, -128.00704956054688, -123.4915771484375, -118.97610473632812, -114.46063232421875, -109.94515228271484, -105.42967224121094, -100.91419982910156, -96.39872741699219, -91.88324737548828, -87.36776733398438, -82.852294921875, -78.33682250976562, -73.82134246826172, -69.30586242675781, -64.79039001464844, -60.2749137878418, -55.759437561035156, -51.243961334228516, -46.728485107421875, -42.213008880615234, -37.697532653808594, -33.18205642700195, -28.666584014892578, -24.151107788085938, -19.635631561279297, -15.120155334472656, -10.604679107666016, -6.089202880859375, -1.5737266540527344, 2.9417495727539062, 7.457225799560547, 11.972702026367188, 16.488178253173828, 21.00365447998047, 25.51913070678711, 30.03460693359375, 34.55008316040039, 39.06555938720703, 43.58103561401367]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 6.0, 5.0, 13.0, 17.0, 20.0, 19.0, 18.0, 26.0, 23.0, 25.0, 34.0, 45.0, 40.0, 39.0, 37.0, 44.0, 52.0, 42.0, 57.0, 45.0, 32.0, 35.0, 27.0, 38.0, 47.0, 24.0, 29.0, 22.0, 22.0, 19.0, 15.0, 17.0, 11.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-41.92202377319336, -40.76006317138672, -39.59810256958008, -38.43613815307617, -37.27417755126953, -36.11221694946289, -34.95025634765625, -33.788291931152344, -32.6263313293457, -31.464370727539062, -30.30240821838379, -29.14044761657715, -27.978485107421875, -26.816524505615234, -25.654563903808594, -24.49260139465332, -23.33064079284668, -22.16868019104004, -21.006717681884766, -19.844757080078125, -18.68279457092285, -17.52083396911621, -16.358871459960938, -15.196910858154297, -14.03494930267334, -12.872987747192383, -11.711026191711426, -10.549064636230469, -9.387104034423828, -8.225141525268555, -7.063180923461914, -5.901219367980957, -4.7392578125, -3.577296257019043, -2.415334939956665, -1.253373622894287, -0.09141206741333008, 1.070549488067627, 2.232510566711426, 3.394472122192383, 4.55643367767334, 5.718395233154297, 6.880356788635254, 8.042318344116211, 9.204278945922852, 10.366241455078125, 11.528202056884766, 12.690163612365723, 13.85212516784668, 15.014086723327637, 16.176048278808594, 17.338008880615234, 18.499971389770508, 19.66193199157715, 20.823894500732422, 21.985855102539062, 23.147815704345703, 24.309776306152344, 25.471738815307617, 26.633699417114258, 27.79566192626953, 28.957622528076172, 30.119583129882812, 31.281545639038086, 32.44350814819336]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 3.0, 8.0, 13.0, 18.0, 13.0, 24.0, 23.0, 23.0, 28.0, 30.0, 33.0, 33.0, 31.0, 45.0, 41.0, 47.0, 54.0, 42.0, 42.0, 34.0, 40.0, 36.0, 41.0, 38.0, 40.0, 24.0, 25.0, 29.0, 16.0, 23.0, 16.0, 13.0, 12.0, 19.0, 8.0, 5.0, 7.0, 2.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.94378662109375, -4.7938232421875, -4.64385986328125, -4.493896484375, -4.34393310546875, -4.1939697265625, -4.04400634765625, -3.89404296875, -3.74407958984375, -3.5941162109375, -3.44415283203125, -3.294189453125, -3.14422607421875, -2.9942626953125, -2.84429931640625, -2.6943359375, -2.54437255859375, -2.3944091796875, -2.24444580078125, -2.094482421875, -1.94451904296875, -1.7945556640625, -1.64459228515625, -1.49462890625, -1.34466552734375, -1.1947021484375, -1.04473876953125, -0.894775390625, -0.74481201171875, -0.5948486328125, -0.44488525390625, -0.294921875, -0.14495849609375, 0.0050048828125, 0.15496826171875, 0.304931640625, 0.45489501953125, 0.6048583984375, 0.75482177734375, 0.90478515625, 1.05474853515625, 1.2047119140625, 1.35467529296875, 1.504638671875, 1.65460205078125, 1.8045654296875, 1.95452880859375, 2.1044921875, 2.25445556640625, 2.4044189453125, 2.55438232421875, 2.704345703125, 2.85430908203125, 3.0042724609375, 3.15423583984375, 3.30419921875, 3.45416259765625, 3.6041259765625, 3.75408935546875, 3.904052734375, 4.05401611328125, 4.2039794921875, 4.35394287109375, 4.50390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 9.0, 20.0, 14.0, 24.0, 40.0, 67.0, 72.0, 103.0, 204.0, 298.0, 491.0, 948.0, 1818.0, 3925.0, 9242.0, 25707.0, 91208.0, 491434.0, 2169956.0, 1144657.0, 185041.0, 43577.0, 14110.0, 5677.0, 2544.0, 1276.0, 685.0, 361.0, 248.0, 155.0, 103.0, 64.0, 46.0, 43.0, 32.0, 15.0, 16.0, 6.0, 8.0, 11.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.2734375, -8.9901123046875, -8.706787109375, -8.4234619140625, -8.14013671875, -7.8568115234375, -7.573486328125, -7.2901611328125, -7.0068359375, -6.7235107421875, -6.440185546875, -6.1568603515625, -5.87353515625, -5.5902099609375, -5.306884765625, -5.0235595703125, -4.740234375, -4.4569091796875, -4.173583984375, -3.8902587890625, -3.60693359375, -3.3236083984375, -3.040283203125, -2.7569580078125, -2.4736328125, -2.1903076171875, -1.906982421875, -1.6236572265625, -1.34033203125, -1.0570068359375, -0.773681640625, -0.4903564453125, -0.20703125, 0.0762939453125, 0.359619140625, 0.6429443359375, 0.92626953125, 1.2095947265625, 1.492919921875, 1.7762451171875, 2.0595703125, 2.3428955078125, 2.626220703125, 2.9095458984375, 3.19287109375, 3.4761962890625, 3.759521484375, 4.0428466796875, 4.326171875, 4.6094970703125, 4.892822265625, 5.1761474609375, 5.45947265625, 5.7427978515625, 6.026123046875, 6.3094482421875, 6.5927734375, 6.8760986328125, 7.159423828125, 7.4427490234375, 7.72607421875, 8.0093994140625, 8.292724609375, 8.5760498046875, 8.859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 16.0, 15.0, 26.0, 20.0, 29.0, 40.0, 60.0, 96.0, 76.0, 123.0, 150.0, 202.0, 262.0, 369.0, 446.0, 445.0, 392.0, 302.0, 228.0, 166.0, 123.0, 110.0, 83.0, 72.0, 52.0, 31.0, 26.0, 24.0, 18.0, 8.0, 5.0, 11.0, 3.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.28985595703125, -7.0562744140625, -6.82269287109375, -6.589111328125, -6.35552978515625, -6.1219482421875, -5.88836669921875, -5.65478515625, -5.42120361328125, -5.1876220703125, -4.95404052734375, -4.720458984375, -4.48687744140625, -4.2532958984375, -4.01971435546875, -3.7861328125, -3.55255126953125, -3.3189697265625, -3.08538818359375, -2.851806640625, -2.61822509765625, -2.3846435546875, -2.15106201171875, -1.91748046875, -1.68389892578125, -1.4503173828125, -1.21673583984375, -0.983154296875, -0.74957275390625, -0.5159912109375, -0.28240966796875, -0.048828125, 0.18475341796875, 0.4183349609375, 0.65191650390625, 0.885498046875, 1.11907958984375, 1.3526611328125, 1.58624267578125, 1.81982421875, 2.05340576171875, 2.2869873046875, 2.52056884765625, 2.754150390625, 2.98773193359375, 3.2213134765625, 3.45489501953125, 3.6884765625, 3.92205810546875, 4.1556396484375, 4.38922119140625, 4.622802734375, 4.85638427734375, 5.0899658203125, 5.32354736328125, 5.55712890625, 5.79071044921875, 6.0242919921875, 6.25787353515625, 6.491455078125, 6.72503662109375, 6.9586181640625, 7.19219970703125, 7.42578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 11.0, 14.0, 14.0, 18.0, 26.0, 22.0, 50.0, 54.0, 78.0, 93.0, 127.0, 180.0, 332.0, 898.0, 5193.0, 68954.0, 2946318.0, 1135619.0, 31727.0, 2980.0, 623.0, 276.0, 164.0, 112.0, 92.0, 63.0, 60.0, 37.0, 27.0, 28.0, 23.0, 12.0, 14.0, 6.0, 8.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.078125, -26.200927734375, -25.32373046875, -24.446533203125, -23.5693359375, -22.692138671875, -21.81494140625, -20.937744140625, -20.060546875, -19.183349609375, -18.30615234375, -17.428955078125, -16.5517578125, -15.674560546875, -14.79736328125, -13.920166015625, -13.04296875, -12.165771484375, -11.28857421875, -10.411376953125, -9.5341796875, -8.656982421875, -7.77978515625, -6.902587890625, -6.025390625, -5.148193359375, -4.27099609375, -3.393798828125, -2.5166015625, -1.639404296875, -0.76220703125, 0.114990234375, 0.9921875, 1.869384765625, 2.74658203125, 3.623779296875, 4.5009765625, 5.378173828125, 6.25537109375, 7.132568359375, 8.009765625, 8.886962890625, 9.76416015625, 10.641357421875, 11.5185546875, 12.395751953125, 13.27294921875, 14.150146484375, 15.02734375, 15.904541015625, 16.78173828125, 17.658935546875, 18.5361328125, 19.413330078125, 20.29052734375, 21.167724609375, 22.044921875, 22.922119140625, 23.79931640625, 24.676513671875, 25.5537109375, 26.430908203125, 27.30810546875, 28.185302734375, 29.0625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 12.0, 27.0, 48.0, 111.0, 136.0, 184.0, 173.0, 146.0, 71.0, 59.0, 26.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.47271728515625, -57.340023040771484, -55.20732879638672, -53.07463073730469, -50.94193649291992, -48.809242248535156, -46.676544189453125, -44.54384994506836, -42.411155700683594, -40.27846145629883, -38.14576721191406, -36.01306915283203, -33.880374908447266, -31.7476806640625, -29.6149845123291, -27.482288360595703, -25.349594116210938, -23.216899871826172, -21.084203720092773, -18.951507568359375, -16.81881332397461, -14.686118125915527, -12.553422927856445, -10.420727729797363, -8.288032531738281, -6.155337333679199, -4.022642135620117, -1.8899469375610352, 0.24274826049804688, 2.375443458557129, 4.508138656616211, 6.640833854675293, 8.773521423339844, 10.906216621398926, 13.038911819458008, 15.17160701751709, 17.304302215576172, 19.436996459960938, 21.569692611694336, 23.702388763427734, 25.8350830078125, 27.967777252197266, 30.100473403930664, 32.23316955566406, 34.36586380004883, 36.498558044433594, 38.631256103515625, 40.76395034790039, 42.896644592285156, 45.02933883666992, 47.16203308105469, 49.29473114013672, 51.427425384521484, 53.56011962890625, 55.69281768798828, 57.82551193237305, 59.95820617675781, 62.09090042114258, 64.22359466552734, 66.35629272460938, 68.48898315429688, 70.6216812133789, 72.75437927246094, 74.88706970214844, 77.01976776123047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 8.0, 5.0, 12.0, 14.0, 18.0, 24.0, 23.0, 30.0, 24.0, 19.0, 36.0, 30.0, 34.0, 39.0, 32.0, 41.0, 36.0, 39.0, 39.0, 34.0, 26.0, 43.0, 39.0, 26.0, 33.0, 32.0, 37.0, 37.0, 18.0, 17.0, 23.0, 25.0, 12.0, 10.0, 19.0, 8.0, 6.0, 7.0, 8.0, 6.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.44509506225586, -21.629261016845703, -20.813426971435547, -19.997594833374023, -19.181760787963867, -18.36592674255371, -17.550094604492188, -16.73426055908203, -15.918426513671875, -15.102592468261719, -14.286759376525879, -13.470926284790039, -12.655092239379883, -11.839258193969727, -11.023425102233887, -10.207592010498047, -9.39175796508789, -8.575923919677734, -7.7600908279418945, -6.9442572593688965, -6.128423690795898, -5.3125901222229, -4.496756553649902, -3.6809229850769043, -2.8650894165039062, -2.049255847930908, -1.2334222793579102, -0.4175887107849121, 0.39824485778808594, 1.214078426361084, 2.029911994934082, 2.84574556350708, 3.661579132080078, 4.477412700653076, 5.293246269226074, 6.109079837799072, 6.92491340637207, 7.740746974945068, 8.556580543518066, 9.372413635253906, 10.188247680664062, 11.004081726074219, 11.819914817810059, 12.635747909545898, 13.451581954956055, 14.267416000366211, 15.08324909210205, 15.89908218383789, 16.714916229248047, 17.530750274658203, 18.34658432006836, 19.162416458129883, 19.97825050354004, 20.794084548950195, 21.60991668701172, 22.425750732421875, 23.24158477783203, 24.057418823242188, 24.873252868652344, 25.689085006713867, 26.504919052124023, 27.32075309753418, 28.136585235595703, 28.95241928100586, 29.768253326416016]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 8.0, 7.0, 14.0, 15.0, 20.0, 16.0, 16.0, 28.0, 17.0, 24.0, 20.0, 28.0, 24.0, 38.0, 34.0, 25.0, 39.0, 40.0, 44.0, 46.0, 34.0, 27.0, 29.0, 30.0, 26.0, 36.0, 42.0, 28.0, 21.0, 25.0, 18.0, 20.0, 20.0, 12.0, 15.0, 12.0, 11.0, 15.0, 15.0, 6.0, 5.0, 6.0, 3.0, 11.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.7421875, -3.624114990234375, -3.50604248046875, -3.387969970703125, -3.2698974609375, -3.151824951171875, -3.03375244140625, -2.915679931640625, -2.797607421875, -2.679534912109375, -2.56146240234375, -2.443389892578125, -2.3253173828125, -2.207244873046875, -2.08917236328125, -1.971099853515625, -1.85302734375, -1.734954833984375, -1.61688232421875, -1.498809814453125, -1.3807373046875, -1.262664794921875, -1.14459228515625, -1.026519775390625, -0.908447265625, -0.790374755859375, -0.67230224609375, -0.554229736328125, -0.4361572265625, -0.318084716796875, -0.20001220703125, -0.081939697265625, 0.0361328125, 0.154205322265625, 0.27227783203125, 0.390350341796875, 0.5084228515625, 0.626495361328125, 0.74456787109375, 0.862640380859375, 0.980712890625, 1.098785400390625, 1.21685791015625, 1.334930419921875, 1.4530029296875, 1.571075439453125, 1.68914794921875, 1.807220458984375, 1.92529296875, 2.043365478515625, 2.16143798828125, 2.279510498046875, 2.3975830078125, 2.515655517578125, 2.63372802734375, 2.751800537109375, 2.869873046875, 2.987945556640625, 3.10601806640625, 3.224090576171875, 3.3421630859375, 3.460235595703125, 3.57830810546875, 3.696380615234375, 3.814453125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 13.0, 20.0, 31.0, 46.0, 84.0, 127.0, 182.0, 346.0, 539.0, 918.0, 1628.0, 2824.0, 5560.0, 11834.0, 27219.0, 70670.0, 197513.0, 377673.0, 218444.0, 77423.0, 29557.0, 12740.0, 6022.0, 3065.0, 1658.0, 930.0, 571.0, 337.0, 201.0, 128.0, 86.0, 62.0, 43.0, 19.0, 12.0, 7.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.775390625, -1.7254486083984375, -1.675506591796875, -1.6255645751953125, -1.57562255859375, -1.5256805419921875, -1.475738525390625, -1.4257965087890625, -1.3758544921875, -1.3259124755859375, -1.275970458984375, -1.2260284423828125, -1.17608642578125, -1.1261444091796875, -1.076202392578125, -1.0262603759765625, -0.976318359375, -0.9263763427734375, -0.876434326171875, -0.8264923095703125, -0.77655029296875, -0.7266082763671875, -0.676666259765625, -0.6267242431640625, -0.5767822265625, -0.5268402099609375, -0.476898193359375, -0.4269561767578125, -0.37701416015625, -0.3270721435546875, -0.277130126953125, -0.2271881103515625, -0.17724609375, -0.1273040771484375, -0.077362060546875, -0.0274200439453125, 0.02252197265625, 0.0724639892578125, 0.122406005859375, 0.1723480224609375, 0.2222900390625, 0.2722320556640625, 0.322174072265625, 0.3721160888671875, 0.42205810546875, 0.4720001220703125, 0.521942138671875, 0.5718841552734375, 0.621826171875, 0.6717681884765625, 0.721710205078125, 0.7716522216796875, 0.82159423828125, 0.8715362548828125, 0.921478271484375, 0.9714202880859375, 1.0213623046875, 1.0713043212890625, 1.121246337890625, 1.1711883544921875, 1.22113037109375, 1.2710723876953125, 1.321014404296875, 1.3709564208984375, 1.4208984375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 15.0, 15.0, 11.0, 12.0, 21.0, 22.0, 28.0, 31.0, 25.0, 29.0, 38.0, 37.0, 38.0, 42.0, 36.0, 41.0, 1076.0, 37.0, 50.0, 38.0, 43.0, 41.0, 21.0, 33.0, 33.0, 30.0, 31.0, 20.0, 23.0, 14.0, 16.0, 10.0, 13.0, 9.0, 9.0, 8.0, 2.0, 0.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1796875, -4.06561279296875, -3.9515380859375, -3.83746337890625, -3.723388671875, -3.60931396484375, -3.4952392578125, -3.38116455078125, -3.26708984375, -3.15301513671875, -3.0389404296875, -2.92486572265625, -2.810791015625, -2.69671630859375, -2.5826416015625, -2.46856689453125, -2.3544921875, -2.24041748046875, -2.1263427734375, -2.01226806640625, -1.898193359375, -1.78411865234375, -1.6700439453125, -1.55596923828125, -1.44189453125, -1.32781982421875, -1.2137451171875, -1.09967041015625, -0.985595703125, -0.87152099609375, -0.7574462890625, -0.64337158203125, -0.529296875, -0.41522216796875, -0.3011474609375, -0.18707275390625, -0.072998046875, 0.04107666015625, 0.1551513671875, 0.26922607421875, 0.38330078125, 0.49737548828125, 0.6114501953125, 0.72552490234375, 0.839599609375, 0.95367431640625, 1.0677490234375, 1.18182373046875, 1.2958984375, 1.40997314453125, 1.5240478515625, 1.63812255859375, 1.752197265625, 1.86627197265625, 1.9803466796875, 2.09442138671875, 2.20849609375, 2.32257080078125, 2.4366455078125, 2.55072021484375, 2.664794921875, 2.77886962890625, 2.8929443359375, 3.00701904296875, 3.12109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 19.0, 12.0, 28.0, 40.0, 68.0, 75.0, 115.0, 141.0, 212.0, 309.0, 426.0, 600.0, 866.0, 1336.0, 2113.0, 3664.0, 6868.0, 14045.0, 33734.0, 95462.0, 351619.0, 1170336.0, 278327.0, 80269.0, 28941.0, 12344.0, 5997.0, 3249.0, 1954.0, 1253.0, 845.0, 535.0, 373.0, 251.0, 220.0, 145.0, 109.0, 53.0, 60.0, 40.0, 31.0, 13.0, 7.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9248046875, -0.8971328735351562, -0.8694610595703125, -0.8417892456054688, -0.814117431640625, -0.7864456176757812, -0.7587738037109375, -0.7311019897460938, -0.70343017578125, -0.6757583618164062, -0.6480865478515625, -0.6204147338867188, -0.592742919921875, -0.5650711059570312, -0.5373992919921875, -0.5097274780273438, -0.4820556640625, -0.45438385009765625, -0.4267120361328125, -0.39904022216796875, -0.371368408203125, -0.34369659423828125, -0.3160247802734375, -0.28835296630859375, -0.26068115234375, -0.23300933837890625, -0.2053375244140625, -0.17766571044921875, -0.149993896484375, -0.12232208251953125, -0.0946502685546875, -0.06697845458984375, -0.039306640625, -0.01163482666015625, 0.0160369873046875, 0.04370880126953125, 0.071380615234375, 0.09905242919921875, 0.1267242431640625, 0.15439605712890625, 0.18206787109375, 0.20973968505859375, 0.2374114990234375, 0.26508331298828125, 0.292755126953125, 0.32042694091796875, 0.3480987548828125, 0.37577056884765625, 0.4034423828125, 0.43111419677734375, 0.4587860107421875, 0.48645782470703125, 0.514129638671875, 0.5418014526367188, 0.5694732666015625, 0.5971450805664062, 0.62481689453125, 0.6524887084960938, 0.6801605224609375, 0.7078323364257812, 0.735504150390625, 0.7631759643554688, 0.7908477783203125, 0.8185195922851562, 0.84619140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 11.0, 10.0, 11.0, 25.0, 19.0, 26.0, 28.0, 35.0, 48.0, 40.0, 59.0, 102.0, 109.0, 106.0, 68.0, 59.0, 39.0, 34.0, 40.0, 15.0, 22.0, 19.0, 10.0, 8.0, 5.0, 5.0, 11.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.191162109375, -0.18487930297851562, -0.17859649658203125, -0.17231369018554688, -0.1660308837890625, -0.15974807739257812, -0.15346527099609375, -0.14718246459960938, -0.140899658203125, -0.13461685180664062, -0.12833404541015625, -0.12205123901367188, -0.1157684326171875, -0.10948562622070312, -0.10320281982421875, -0.09692001342773438, -0.09063720703125, -0.08435440063476562, -0.07807159423828125, -0.07178878784179688, -0.0655059814453125, -0.059223175048828125, -0.05294036865234375, -0.046657562255859375, -0.040374755859375, -0.034091949462890625, -0.02780914306640625, -0.021526336669921875, -0.0152435302734375, -0.008960723876953125, -0.00267791748046875, 0.003604888916015625, 0.0098876953125, 0.016170501708984375, 0.02245330810546875, 0.028736114501953125, 0.0350189208984375, 0.041301727294921875, 0.04758453369140625, 0.053867340087890625, 0.060150146484375, 0.06643295288085938, 0.07271575927734375, 0.07899856567382812, 0.0852813720703125, 0.09156417846679688, 0.09784698486328125, 0.10412979125976562, 0.11041259765625, 0.11669540405273438, 0.12297821044921875, 0.12926101684570312, 0.1355438232421875, 0.14182662963867188, 0.14810943603515625, 0.15439224243164062, 0.160675048828125, 0.16695785522460938, 0.17324066162109375, 0.17952346801757812, 0.1858062744140625, 0.19208908081054688, 0.19837188720703125, 0.20465469360351562, 0.2109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 7.0, 6.0, 5.0, 11.0, 12.0, 21.0, 19.0, 32.0, 38.0, 61.0, 82.0, 198.0, 693.0, 7079.0, 923917.0, 112385.0, 3113.0, 451.0, 142.0, 69.0, 47.0, 38.0, 26.0, 26.0, 17.0, 15.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15625, -5.01239013671875, -4.8685302734375, -4.72467041015625, -4.580810546875, -4.43695068359375, -4.2930908203125, -4.14923095703125, -4.00537109375, -3.86151123046875, -3.7176513671875, -3.57379150390625, -3.429931640625, -3.28607177734375, -3.1422119140625, -2.99835205078125, -2.8544921875, -2.71063232421875, -2.5667724609375, -2.42291259765625, -2.279052734375, -2.13519287109375, -1.9913330078125, -1.84747314453125, -1.70361328125, -1.55975341796875, -1.4158935546875, -1.27203369140625, -1.128173828125, -0.98431396484375, -0.8404541015625, -0.69659423828125, -0.552734375, -0.40887451171875, -0.2650146484375, -0.12115478515625, 0.022705078125, 0.16656494140625, 0.3104248046875, 0.45428466796875, 0.59814453125, 0.74200439453125, 0.8858642578125, 1.02972412109375, 1.173583984375, 1.31744384765625, 1.4613037109375, 1.60516357421875, 1.7490234375, 1.89288330078125, 2.0367431640625, 2.18060302734375, 2.324462890625, 2.46832275390625, 2.6121826171875, 2.75604248046875, 2.89990234375, 3.04376220703125, 3.1876220703125, 3.33148193359375, 3.475341796875, 3.61920166015625, 3.7630615234375, 3.90692138671875, 4.05078125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 37.0, 147.0, 399.0, 332.0, 69.0, 15.0, 9.0], "bins": [-3.2481863498687744, -3.193763494491577, -3.139340877532959, -3.0849180221557617, -3.0304951667785645, -2.976072311401367, -2.921649694442749, -2.8672268390655518, -2.8128039836883545, -2.7583811283111572, -2.703958511352539, -2.649535655975342, -2.5951128005981445, -2.5406899452209473, -2.486267328262329, -2.431844472885132, -2.3774218559265137, -2.3229990005493164, -2.2685763835906982, -2.214153528213501, -2.1597306728363037, -2.1053078174591064, -2.0508852005004883, -1.996462345123291, -1.9420394897460938, -1.887616753578186, -1.8331938982009888, -1.778771162033081, -1.7243483066558838, -1.669925570487976, -1.6155028343200684, -1.561079978942871, -1.5066571235656738, -1.4522343873977661, -1.3978115320205688, -1.3433887958526611, -1.2889659404754639, -1.2345432043075562, -1.1801204681396484, -1.1256976127624512, -1.071274757385254, -1.0168520212173462, -0.9624291658401489, -0.9080064296722412, -0.853583574295044, -0.7991608381271362, -0.7447380423545837, -0.6903152465820312, -0.6358924508094788, -0.5814696550369263, -0.5270468592643738, -0.4726240932941437, -0.4182012975215912, -0.3637785017490387, -0.3093557357788086, -0.2549329400062561, -0.2005101591348648, -0.1460873782634735, -0.09166458249092102, -0.037241801619529724, 0.017180994153022766, 0.07160378992557526, 0.12602655589580536, 0.18044935166835785, 0.23487214744091034]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 3.0, 4.0, 10.0, 5.0, 13.0, 21.0, 14.0, 14.0, 18.0, 28.0, 30.0, 16.0, 29.0, 26.0, 39.0, 38.0, 32.0, 39.0, 31.0, 44.0, 36.0, 29.0, 31.0, 35.0, 55.0, 37.0, 40.0, 31.0, 33.0, 23.0, 29.0, 26.0, 18.0, 13.0, 15.0, 15.0, 11.0, 13.0, 12.0, 8.0, 17.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.34127140045166016, -0.3313886225223541, -0.3215058445930481, -0.31162306666374207, -0.30174028873443604, -0.2918574810028076, -0.2819747030735016, -0.27209192514419556, -0.2622091472148895, -0.2523263692855835, -0.24244359135627747, -0.23256079852581024, -0.2226780205965042, -0.21279524266719818, -0.20291244983673096, -0.19302967190742493, -0.1831468939781189, -0.17326411604881287, -0.16338133811950684, -0.1534985452890396, -0.14361576735973358, -0.13373298943042755, -0.12385020405054092, -0.1139674186706543, -0.10408464074134827, -0.09420186281204224, -0.08431907743215561, -0.07443629205226898, -0.06455351412296295, -0.05467073246836662, -0.044787950813770294, -0.03490516543388367, -0.025022387504577637, -0.015139605849981308, -0.005256824195384979, 0.0046259574592113495, 0.014508739113807678, 0.024391520768404007, 0.034274302423000336, 0.04415708780288696, 0.05403986573219299, 0.06392264366149902, 0.07380542904138565, 0.08368821442127228, 0.09357099235057831, 0.10345377027988434, 0.11333655565977097, 0.12321934103965759, 0.13310211896896362, 0.14298489689826965, 0.15286767482757568, 0.1627504676580429, 0.17263324558734894, 0.18251602351665497, 0.1923988163471222, 0.20228159427642822, 0.21216437220573425, 0.22204715013504028, 0.2319299280643463, 0.24181272089481354, 0.25169551372528076, 0.2615782916545868, 0.2714610695838928, 0.28134384751319885, 0.2912266254425049]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 8.0, 17.0, 11.0, 11.0, 10.0, 18.0, 30.0, 23.0, 28.0, 12.0, 25.0, 28.0, 25.0, 33.0, 43.0, 36.0, 42.0, 36.0, 50.0, 45.0, 46.0, 27.0, 37.0, 30.0, 32.0, 37.0, 29.0, 27.0, 18.0, 17.0, 16.0, 21.0, 15.0, 15.0, 13.0, 15.0, 7.0, 8.0, 8.0, 6.0, 6.0, 9.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.881561279296875, -3.75921630859375, -3.636871337890625, -3.5145263671875, -3.392181396484375, -3.26983642578125, -3.147491455078125, -3.025146484375, -2.902801513671875, -2.78045654296875, -2.658111572265625, -2.5357666015625, -2.413421630859375, -2.29107666015625, -2.168731689453125, -2.04638671875, -1.924041748046875, -1.80169677734375, -1.679351806640625, -1.5570068359375, -1.434661865234375, -1.31231689453125, -1.189971923828125, -1.067626953125, -0.945281982421875, -0.82293701171875, -0.700592041015625, -0.5782470703125, -0.455902099609375, -0.33355712890625, -0.211212158203125, -0.0888671875, 0.033477783203125, 0.15582275390625, 0.278167724609375, 0.4005126953125, 0.522857666015625, 0.64520263671875, 0.767547607421875, 0.889892578125, 1.012237548828125, 1.13458251953125, 1.256927490234375, 1.3792724609375, 1.501617431640625, 1.62396240234375, 1.746307373046875, 1.86865234375, 1.990997314453125, 2.11334228515625, 2.235687255859375, 2.3580322265625, 2.480377197265625, 2.60272216796875, 2.725067138671875, 2.847412109375, 2.969757080078125, 3.09210205078125, 3.214447021484375, 3.3367919921875, 3.459136962890625, 3.58148193359375, 3.703826904296875, 3.826171875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 8.0, 10.0, 14.0, 20.0, 26.0, 28.0, 48.0, 64.0, 97.0, 157.0, 231.0, 344.0, 568.0, 964.0, 1691.0, 3348.0, 7069.0, 16882.0, 45842.0, 150375.0, 493558.0, 221901.0, 64754.0, 22273.0, 8960.0, 4185.0, 2096.0, 1159.0, 630.0, 416.0, 243.0, 173.0, 121.0, 91.0, 58.0, 33.0, 25.0, 19.0, 13.0, 15.0, 11.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-8.9375, -8.6795654296875, -8.421630859375, -8.1636962890625, -7.90576171875, -7.6478271484375, -7.389892578125, -7.1319580078125, -6.8740234375, -6.6160888671875, -6.358154296875, -6.1002197265625, -5.84228515625, -5.5843505859375, -5.326416015625, -5.0684814453125, -4.810546875, -4.5526123046875, -4.294677734375, -4.0367431640625, -3.77880859375, -3.5208740234375, -3.262939453125, -3.0050048828125, -2.7470703125, -2.4891357421875, -2.231201171875, -1.9732666015625, -1.71533203125, -1.4573974609375, -1.199462890625, -0.9415283203125, -0.68359375, -0.4256591796875, -0.167724609375, 0.0902099609375, 0.34814453125, 0.6060791015625, 0.864013671875, 1.1219482421875, 1.3798828125, 1.6378173828125, 1.895751953125, 2.1536865234375, 2.41162109375, 2.6695556640625, 2.927490234375, 3.1854248046875, 3.443359375, 3.7012939453125, 3.959228515625, 4.2171630859375, 4.47509765625, 4.7330322265625, 4.990966796875, 5.2489013671875, 5.5068359375, 5.7647705078125, 6.022705078125, 6.2806396484375, 6.53857421875, 6.7965087890625, 7.054443359375, 7.3123779296875, 7.5703125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 4.0, 11.0, 10.0, 7.0, 7.0, 9.0, 14.0, 14.0, 17.0, 18.0, 26.0, 30.0, 30.0, 24.0, 27.0, 32.0, 51.0, 48.0, 85.0, 117.0, 231.0, 1430.0, 218.0, 110.0, 74.0, 47.0, 46.0, 38.0, 42.0, 30.0, 22.0, 22.0, 12.0, 21.0, 14.0, 14.0, 15.0, 16.0, 9.0, 10.0, 10.0, 7.0, 7.0, 4.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.7890625, -10.435546875, -10.08203125, -9.728515625, -9.375, -9.021484375, -8.66796875, -8.314453125, -7.9609375, -7.607421875, -7.25390625, -6.900390625, -6.546875, -6.193359375, -5.83984375, -5.486328125, -5.1328125, -4.779296875, -4.42578125, -4.072265625, -3.71875, -3.365234375, -3.01171875, -2.658203125, -2.3046875, -1.951171875, -1.59765625, -1.244140625, -0.890625, -0.537109375, -0.18359375, 0.169921875, 0.5234375, 0.876953125, 1.23046875, 1.583984375, 1.9375, 2.291015625, 2.64453125, 2.998046875, 3.3515625, 3.705078125, 4.05859375, 4.412109375, 4.765625, 5.119140625, 5.47265625, 5.826171875, 6.1796875, 6.533203125, 6.88671875, 7.240234375, 7.59375, 7.947265625, 8.30078125, 8.654296875, 9.0078125, 9.361328125, 9.71484375, 10.068359375, 10.421875, 10.775390625, 11.12890625, 11.482421875, 11.8359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 4.0, 12.0, 17.0, 6.0, 16.0, 24.0, 28.0, 43.0, 53.0, 72.0, 76.0, 97.0, 145.0, 263.0, 509.0, 1513.0, 9453.0, 945566.0, 2171779.0, 12725.0, 1785.0, 584.0, 270.0, 180.0, 111.0, 85.0, 71.0, 49.0, 37.0, 33.0, 24.0, 18.0, 13.0, 8.0, 11.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.71875, -33.6357421875, -32.552734375, -31.4697265625, -30.38671875, -29.3037109375, -28.220703125, -27.1376953125, -26.0546875, -24.9716796875, -23.888671875, -22.8056640625, -21.72265625, -20.6396484375, -19.556640625, -18.4736328125, -17.390625, -16.3076171875, -15.224609375, -14.1416015625, -13.05859375, -11.9755859375, -10.892578125, -9.8095703125, -8.7265625, -7.6435546875, -6.560546875, -5.4775390625, -4.39453125, -3.3115234375, -2.228515625, -1.1455078125, -0.0625, 1.0205078125, 2.103515625, 3.1865234375, 4.26953125, 5.3525390625, 6.435546875, 7.5185546875, 8.6015625, 9.6845703125, 10.767578125, 11.8505859375, 12.93359375, 14.0166015625, 15.099609375, 16.1826171875, 17.265625, 18.3486328125, 19.431640625, 20.5146484375, 21.59765625, 22.6806640625, 23.763671875, 24.8466796875, 25.9296875, 27.0126953125, 28.095703125, 29.1787109375, 30.26171875, 31.3447265625, 32.427734375, 33.5107421875, 34.59375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 15.0, 37.0, 60.0, 103.0, 140.0, 152.0, 155.0, 111.0, 99.0, 74.0, 32.0, 15.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.83727264404297, -36.88913345336914, -35.94099426269531, -34.992855072021484, -34.044715881347656, -33.096580505371094, -32.1484375, -31.200300216674805, -30.25216293334961, -29.30402374267578, -28.355884552001953, -27.407745361328125, -26.45960807800293, -25.5114688873291, -24.563329696655273, -23.615190505981445, -22.667051315307617, -21.71891212463379, -20.77077293395996, -19.822635650634766, -18.874496459960938, -17.92635726928711, -16.97821807861328, -16.030078887939453, -15.081940650939941, -14.133801460266113, -13.185663223266602, -12.237524032592773, -11.289384841918945, -10.341246604919434, -9.393107414245605, -8.444969177246094, -7.496828079223633, -6.548689365386963, -5.600550651550293, -4.652411460876465, -3.704272747039795, -2.756134033203125, -1.8079948425292969, -0.859856128692627, 0.08828258514404297, 1.0364214181900024, 1.984560251235962, 2.932699203491211, 3.880837917327881, 4.828976631164551, 5.777115821838379, 6.725254535675049, 7.673393249511719, 8.621532440185547, 9.569670677185059, 10.517809867858887, 11.465948104858398, 12.414087295532227, 13.362226486206055, 14.310365676879883, 15.258503913879395, 16.206642150878906, 17.154781341552734, 18.102920532226562, 19.05105972290039, 19.99919891357422, 20.947338104248047, 21.895475387573242, 22.84361457824707]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 9.0, 1.0, 2.0, 4.0, 1.0, 10.0, 10.0, 7.0, 9.0, 13.0, 22.0, 24.0, 24.0, 22.0, 27.0, 26.0, 34.0, 37.0, 35.0, 39.0, 38.0, 39.0, 34.0, 45.0, 54.0, 39.0, 35.0, 56.0, 40.0, 28.0, 36.0, 23.0, 29.0, 23.0, 26.0, 24.0, 8.0, 19.0, 10.0, 7.0, 11.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.1062126159668, -37.94628143310547, -36.78635025024414, -35.62642288208008, -34.46649169921875, -33.30656051635742, -32.146629333496094, -30.986698150634766, -29.82676887512207, -28.666837692260742, -27.506908416748047, -26.34697723388672, -25.18704605102539, -24.027116775512695, -22.867185592651367, -21.707256317138672, -20.547325134277344, -19.387393951416016, -18.22746467590332, -17.067533493041992, -15.90760326385498, -14.747673034667969, -13.58774185180664, -12.427811622619629, -11.267881393432617, -10.107951164245605, -8.948020935058594, -7.788089752197266, -6.628159523010254, -5.468229293823242, -4.308298587799072, -3.1483678817749023, -1.988433837890625, -0.8285033702850342, 0.33142709732055664, 1.4913575649261475, 2.6512880325317383, 3.81121826171875, 4.97114896774292, 6.13107967376709, 7.291009902954102, 8.450940132141113, 9.610870361328125, 10.770801544189453, 11.930731773376465, 13.090662002563477, 14.250593185424805, 15.410523414611816, 16.570453643798828, 17.730384826660156, 18.89031410217285, 20.05024528503418, 21.210174560546875, 22.370105743408203, 23.53003692626953, 24.68996810913086, 25.849897384643555, 27.009828567504883, 28.169757843017578, 29.329689025878906, 30.489620208740234, 31.64954948425293, 32.809478759765625, 33.96940994262695, 35.12934112548828]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 8.0, 6.0, 5.0, 9.0, 15.0, 14.0, 18.0, 18.0, 19.0, 26.0, 19.0, 28.0, 30.0, 29.0, 32.0, 47.0, 51.0, 28.0, 52.0, 39.0, 45.0, 34.0, 45.0, 51.0, 32.0, 31.0, 34.0, 35.0, 22.0, 24.0, 25.0, 25.0, 19.0, 17.0, 11.0, 13.0, 9.0, 15.0, 5.0, 9.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.15625, -5.00469970703125, -4.8531494140625, -4.70159912109375, -4.550048828125, -4.39849853515625, -4.2469482421875, -4.09539794921875, -3.94384765625, -3.79229736328125, -3.6407470703125, -3.48919677734375, -3.337646484375, -3.18609619140625, -3.0345458984375, -2.88299560546875, -2.7314453125, -2.57989501953125, -2.4283447265625, -2.27679443359375, -2.125244140625, -1.97369384765625, -1.8221435546875, -1.67059326171875, -1.51904296875, -1.36749267578125, -1.2159423828125, -1.06439208984375, -0.912841796875, -0.76129150390625, -0.6097412109375, -0.45819091796875, -0.306640625, -0.15509033203125, -0.0035400390625, 0.14801025390625, 0.299560546875, 0.45111083984375, 0.6026611328125, 0.75421142578125, 0.90576171875, 1.05731201171875, 1.2088623046875, 1.36041259765625, 1.511962890625, 1.66351318359375, 1.8150634765625, 1.96661376953125, 2.1181640625, 2.26971435546875, 2.4212646484375, 2.57281494140625, 2.724365234375, 2.87591552734375, 3.0274658203125, 3.17901611328125, 3.33056640625, 3.48211669921875, 3.6336669921875, 3.78521728515625, 3.936767578125, 4.08831787109375, 4.2398681640625, 4.39141845703125, 4.54296875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 3.0, 9.0, 9.0, 12.0, 17.0, 21.0, 23.0, 48.0, 66.0, 126.0, 187.0, 372.0, 762.0, 1572.0, 3885.0, 11164.0, 42119.0, 241674.0, 1792776.0, 1794843.0, 243886.0, 41917.0, 11373.0, 3968.0, 1683.0, 809.0, 396.0, 203.0, 117.0, 59.0, 49.0, 36.0, 26.0, 26.0, 10.0, 11.0, 9.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.304931640625, -9.99267578125, -9.680419921875, -9.3681640625, -9.055908203125, -8.74365234375, -8.431396484375, -8.119140625, -7.806884765625, -7.49462890625, -7.182373046875, -6.8701171875, -6.557861328125, -6.24560546875, -5.933349609375, -5.62109375, -5.308837890625, -4.99658203125, -4.684326171875, -4.3720703125, -4.059814453125, -3.74755859375, -3.435302734375, -3.123046875, -2.810791015625, -2.49853515625, -2.186279296875, -1.8740234375, -1.561767578125, -1.24951171875, -0.937255859375, -0.625, -0.312744140625, -0.00048828125, 0.311767578125, 0.6240234375, 0.936279296875, 1.24853515625, 1.560791015625, 1.873046875, 2.185302734375, 2.49755859375, 2.809814453125, 3.1220703125, 3.434326171875, 3.74658203125, 4.058837890625, 4.37109375, 4.683349609375, 4.99560546875, 5.307861328125, 5.6201171875, 5.932373046875, 6.24462890625, 6.556884765625, 6.869140625, 7.181396484375, 7.49365234375, 7.805908203125, 8.1181640625, 8.430419921875, 8.74267578125, 9.054931640625, 9.3671875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 4.0, 8.0, 4.0, 4.0, 5.0, 13.0, 27.0, 26.0, 23.0, 42.0, 45.0, 78.0, 95.0, 124.0, 167.0, 249.0, 360.0, 443.0, 507.0, 475.0, 368.0, 237.0, 185.0, 145.0, 104.0, 82.0, 71.0, 49.0, 31.0, 22.0, 22.0, 14.0, 10.0, 5.0, 6.0, 4.0, 7.0, 1.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.0546875, -8.80718994140625, -8.5596923828125, -8.31219482421875, -8.064697265625, -7.81719970703125, -7.5697021484375, -7.32220458984375, -7.07470703125, -6.82720947265625, -6.5797119140625, -6.33221435546875, -6.084716796875, -5.83721923828125, -5.5897216796875, -5.34222412109375, -5.0947265625, -4.84722900390625, -4.5997314453125, -4.35223388671875, -4.104736328125, -3.85723876953125, -3.6097412109375, -3.36224365234375, -3.11474609375, -2.86724853515625, -2.6197509765625, -2.37225341796875, -2.124755859375, -1.87725830078125, -1.6297607421875, -1.38226318359375, -1.134765625, -0.88726806640625, -0.6397705078125, -0.39227294921875, -0.144775390625, 0.10272216796875, 0.3502197265625, 0.59771728515625, 0.84521484375, 1.09271240234375, 1.3402099609375, 1.58770751953125, 1.835205078125, 2.08270263671875, 2.3302001953125, 2.57769775390625, 2.8251953125, 3.07269287109375, 3.3201904296875, 3.56768798828125, 3.815185546875, 4.06268310546875, 4.3101806640625, 4.55767822265625, 4.80517578125, 5.05267333984375, 5.3001708984375, 5.54766845703125, 5.795166015625, 6.04266357421875, 6.2901611328125, 6.53765869140625, 6.78515625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 1.0, 6.0, 14.0, 17.0, 15.0, 27.0, 25.0, 59.0, 44.0, 72.0, 114.0, 138.0, 193.0, 331.0, 872.0, 9757.0, 726916.0, 3417983.0, 34801.0, 1687.0, 429.0, 208.0, 135.0, 105.0, 73.0, 62.0, 41.0, 32.0, 18.0, 25.0, 16.0, 14.0, 6.0, 3.0, 9.0, 4.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.875, -30.74365234375, -29.6123046875, -28.48095703125, -27.349609375, -26.21826171875, -25.0869140625, -23.95556640625, -22.82421875, -21.69287109375, -20.5615234375, -19.43017578125, -18.298828125, -17.16748046875, -16.0361328125, -14.90478515625, -13.7734375, -12.64208984375, -11.5107421875, -10.37939453125, -9.248046875, -8.11669921875, -6.9853515625, -5.85400390625, -4.72265625, -3.59130859375, -2.4599609375, -1.32861328125, -0.197265625, 0.93408203125, 2.0654296875, 3.19677734375, 4.328125, 5.45947265625, 6.5908203125, 7.72216796875, 8.853515625, 9.98486328125, 11.1162109375, 12.24755859375, 13.37890625, 14.51025390625, 15.6416015625, 16.77294921875, 17.904296875, 19.03564453125, 20.1669921875, 21.29833984375, 22.4296875, 23.56103515625, 24.6923828125, 25.82373046875, 26.955078125, 28.08642578125, 29.2177734375, 30.34912109375, 31.48046875, 32.61181640625, 33.7431640625, 34.87451171875, 36.005859375, 37.13720703125, 38.2685546875, 39.39990234375, 40.53125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 7.0, 11.0, 18.0, 40.0, 36.0, 62.0, 88.0, 84.0, 102.0, 124.0, 118.0, 93.0, 79.0, 40.0, 44.0, 25.0, 18.0, 9.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.58208084106445, -42.439292907714844, -41.2965087890625, -40.153724670410156, -39.01093673706055, -37.86814880371094, -36.725364685058594, -35.58258056640625, -34.43979263305664, -33.29700469970703, -32.15422058105469, -31.01143455505371, -29.868648529052734, -28.725862503051758, -27.58307647705078, -26.440290451049805, -25.297504425048828, -24.15471839904785, -23.011932373046875, -21.8691463470459, -20.726360321044922, -19.583574295043945, -18.44078826904297, -17.298002243041992, -16.155216217041016, -15.012430191040039, -13.869644165039062, -12.726858139038086, -11.58407211303711, -10.441286087036133, -9.298500061035156, -8.15571403503418, -7.012929916381836, -5.870143890380859, -4.727357864379883, -3.5845718383789062, -2.4417858123779297, -1.2989997863769531, -0.15621376037597656, 0.986572265625, 2.1293582916259766, 3.272144317626953, 4.41493034362793, 5.557716369628906, 6.700502395629883, 7.843288421630859, 8.986074447631836, 10.128860473632812, 11.271646499633789, 12.414432525634766, 13.557218551635742, 14.700004577636719, 15.842790603637695, 16.985576629638672, 18.12836265563965, 19.271148681640625, 20.4139347076416, 21.556720733642578, 22.699506759643555, 23.84229278564453, 24.985078811645508, 26.127864837646484, 27.27065086364746, 28.413436889648438, 29.556222915649414]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 10.0, 5.0, 10.0, 10.0, 11.0, 18.0, 20.0, 18.0, 18.0, 30.0, 23.0, 38.0, 37.0, 30.0, 35.0, 35.0, 30.0, 48.0, 34.0, 31.0, 39.0, 46.0, 40.0, 47.0, 35.0, 40.0, 37.0, 28.0, 27.0, 26.0, 19.0, 14.0, 18.0, 13.0, 15.0, 17.0, 10.0, 9.0, 5.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.35515594482422, -25.532716751098633, -24.710277557373047, -23.887836456298828, -23.065397262573242, -22.242958068847656, -21.420516967773438, -20.59807777404785, -19.775638580322266, -18.95319938659668, -18.130760192871094, -17.308319091796875, -16.48587989807129, -15.663440704345703, -14.8410005569458, -14.018560409545898, -13.196121215820312, -12.373682022094727, -11.551241874694824, -10.728801727294922, -9.906362533569336, -9.08392333984375, -8.261483192443848, -7.4390435218811035, -6.616603851318359, -5.794164180755615, -4.971724510192871, -4.149284839630127, -3.326845169067383, -2.5044054985046387, -1.6819658279418945, -0.8595261573791504, -0.03708457946777344, 0.7853550910949707, 1.6077947616577148, 2.430234432220459, 3.252674102783203, 4.075113773345947, 4.897553443908691, 5.7199931144714355, 6.54243278503418, 7.364872455596924, 8.187312126159668, 9.00975227355957, 9.832191467285156, 10.654630661010742, 11.477070808410645, 12.299510955810547, 13.121950149536133, 13.944389343261719, 14.766829490661621, 15.589269638061523, 16.41170883178711, 17.234148025512695, 18.05658721923828, 18.8790283203125, 19.701467514038086, 20.523906707763672, 21.34634780883789, 22.168787002563477, 22.991226196289062, 23.81366539001465, 24.636104583740234, 25.458545684814453, 26.28098487854004]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 7.0, 8.0, 4.0, 16.0, 3.0, 14.0, 14.0, 19.0, 18.0, 22.0, 25.0, 35.0, 25.0, 38.0, 29.0, 26.0, 34.0, 30.0, 44.0, 44.0, 39.0, 35.0, 46.0, 38.0, 42.0, 29.0, 32.0, 23.0, 31.0, 22.0, 28.0, 29.0, 20.0, 26.0, 15.0, 11.0, 16.0, 15.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-4.484375, -4.3515625, -4.21875, -4.0859375, -3.953125, -3.8203125, -3.6875, -3.5546875, -3.421875, -3.2890625, -3.15625, -3.0234375, -2.890625, -2.7578125, -2.625, -2.4921875, -2.359375, -2.2265625, -2.09375, -1.9609375, -1.828125, -1.6953125, -1.5625, -1.4296875, -1.296875, -1.1640625, -1.03125, -0.8984375, -0.765625, -0.6328125, -0.5, -0.3671875, -0.234375, -0.1015625, 0.03125, 0.1640625, 0.296875, 0.4296875, 0.5625, 0.6953125, 0.828125, 0.9609375, 1.09375, 1.2265625, 1.359375, 1.4921875, 1.625, 1.7578125, 1.890625, 2.0234375, 2.15625, 2.2890625, 2.421875, 2.5546875, 2.6875, 2.8203125, 2.953125, 3.0859375, 3.21875, 3.3515625, 3.484375, 3.6171875, 3.75, 3.8828125, 4.015625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 10.0, 9.0, 26.0, 34.0, 51.0, 72.0, 88.0, 150.0, 205.0, 351.0, 525.0, 840.0, 1254.0, 2178.0, 3505.0, 5879.0, 9995.0, 17492.0, 33263.0, 67839.0, 175972.0, 370713.0, 201228.0, 74881.0, 35948.0, 19324.0, 10707.0, 6244.0, 3663.0, 2213.0, 1399.0, 856.0, 545.0, 361.0, 249.0, 152.0, 111.0, 76.0, 58.0, 32.0, 23.0, 15.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.4296875, -2.3650054931640625, -2.300323486328125, -2.2356414794921875, -2.17095947265625, -2.1062774658203125, -2.041595458984375, -1.9769134521484375, -1.9122314453125, -1.8475494384765625, -1.782867431640625, -1.7181854248046875, -1.65350341796875, -1.5888214111328125, -1.524139404296875, -1.4594573974609375, -1.394775390625, -1.3300933837890625, -1.265411376953125, -1.2007293701171875, -1.13604736328125, -1.0713653564453125, -1.006683349609375, -0.9420013427734375, -0.8773193359375, -0.8126373291015625, -0.747955322265625, -0.6832733154296875, -0.61859130859375, -0.5539093017578125, -0.489227294921875, -0.4245452880859375, -0.35986328125, -0.2951812744140625, -0.230499267578125, -0.1658172607421875, -0.10113525390625, -0.0364532470703125, 0.028228759765625, 0.0929107666015625, 0.1575927734375, 0.2222747802734375, 0.286956787109375, 0.3516387939453125, 0.41632080078125, 0.4810028076171875, 0.545684814453125, 0.6103668212890625, 0.675048828125, 0.7397308349609375, 0.804412841796875, 0.8690948486328125, 0.93377685546875, 0.9984588623046875, 1.063140869140625, 1.1278228759765625, 1.1925048828125, 1.2571868896484375, 1.321868896484375, 1.3865509033203125, 1.45123291015625, 1.5159149169921875, 1.580596923828125, 1.6452789306640625, 1.7099609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 3.0, 6.0, 7.0, 2.0, 10.0, 5.0, 10.0, 15.0, 14.0, 19.0, 16.0, 19.0, 20.0, 21.0, 22.0, 25.0, 30.0, 38.0, 31.0, 39.0, 40.0, 30.0, 48.0, 33.0, 1060.0, 44.0, 30.0, 30.0, 33.0, 36.0, 42.0, 37.0, 30.0, 25.0, 18.0, 22.0, 16.0, 11.0, 17.0, 14.0, 13.0, 8.0, 6.0, 13.0, 6.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.9619140625, -2.86328125, -2.7646484375, -2.666015625, -2.5673828125, -2.46875, -2.3701171875, -2.271484375, -2.1728515625, -2.07421875, -1.9755859375, -1.876953125, -1.7783203125, -1.6796875, -1.5810546875, -1.482421875, -1.3837890625, -1.28515625, -1.1865234375, -1.087890625, -0.9892578125, -0.890625, -0.7919921875, -0.693359375, -0.5947265625, -0.49609375, -0.3974609375, -0.298828125, -0.2001953125, -0.1015625, -0.0029296875, 0.095703125, 0.1943359375, 0.29296875, 0.3916015625, 0.490234375, 0.5888671875, 0.6875, 0.7861328125, 0.884765625, 0.9833984375, 1.08203125, 1.1806640625, 1.279296875, 1.3779296875, 1.4765625, 1.5751953125, 1.673828125, 1.7724609375, 1.87109375, 1.9697265625, 2.068359375, 2.1669921875, 2.265625, 2.3642578125, 2.462890625, 2.5615234375, 2.66015625, 2.7587890625, 2.857421875, 2.9560546875, 3.0546875, 3.1533203125, 3.251953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 16.0, 13.0, 20.0, 34.0, 53.0, 85.0, 120.0, 168.0, 285.0, 417.0, 681.0, 1178.0, 1949.0, 3494.0, 6816.0, 14660.0, 37556.0, 130494.0, 1060434.0, 673521.0, 105523.0, 32283.0, 13088.0, 6215.0, 3291.0, 1899.0, 1085.0, 633.0, 360.0, 264.0, 148.0, 114.0, 81.0, 43.0, 27.0, 21.0, 11.0, 13.0, 7.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.9941253662109375, -1.933563232421875, -1.8730010986328125, -1.81243896484375, -1.7518768310546875, -1.691314697265625, -1.6307525634765625, -1.5701904296875, -1.5096282958984375, -1.449066162109375, -1.3885040283203125, -1.32794189453125, -1.2673797607421875, -1.206817626953125, -1.1462554931640625, -1.085693359375, -1.0251312255859375, -0.964569091796875, -0.9040069580078125, -0.84344482421875, -0.7828826904296875, -0.722320556640625, -0.6617584228515625, -0.6011962890625, -0.5406341552734375, -0.480072021484375, -0.4195098876953125, -0.35894775390625, -0.2983856201171875, -0.237823486328125, -0.1772613525390625, -0.11669921875, -0.0561370849609375, 0.004425048828125, 0.0649871826171875, 0.12554931640625, 0.1861114501953125, 0.246673583984375, 0.3072357177734375, 0.3677978515625, 0.4283599853515625, 0.488922119140625, 0.5494842529296875, 0.61004638671875, 0.6706085205078125, 0.731170654296875, 0.7917327880859375, 0.852294921875, 0.9128570556640625, 0.973419189453125, 1.0339813232421875, 1.09454345703125, 1.1551055908203125, 1.215667724609375, 1.2762298583984375, 1.3367919921875, 1.3973541259765625, 1.457916259765625, 1.5184783935546875, 1.57904052734375, 1.6396026611328125, 1.700164794921875, 1.7607269287109375, 1.8212890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 1.0, 6.0, 4.0, 6.0, 6.0, 12.0, 8.0, 18.0, 13.0, 13.0, 20.0, 23.0, 21.0, 28.0, 36.0, 58.0, 84.0, 132.0, 141.0, 90.0, 51.0, 41.0, 33.0, 19.0, 18.0, 13.0, 10.0, 15.0, 15.0, 9.0, 5.0, 7.0, 8.0, 6.0, 5.0, 6.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.6279296875, -0.6094512939453125, -0.590972900390625, -0.5724945068359375, -0.55401611328125, -0.5355377197265625, -0.517059326171875, -0.4985809326171875, -0.4801025390625, -0.4616241455078125, -0.443145751953125, -0.4246673583984375, -0.40618896484375, -0.3877105712890625, -0.369232177734375, -0.3507537841796875, -0.332275390625, -0.3137969970703125, -0.295318603515625, -0.2768402099609375, -0.25836181640625, -0.2398834228515625, -0.221405029296875, -0.2029266357421875, -0.1844482421875, -0.1659698486328125, -0.147491455078125, -0.1290130615234375, -0.11053466796875, -0.0920562744140625, -0.073577880859375, -0.0550994873046875, -0.03662109375, -0.0181427001953125, 0.000335693359375, 0.0188140869140625, 0.03729248046875, 0.0557708740234375, 0.074249267578125, 0.0927276611328125, 0.1112060546875, 0.1296844482421875, 0.148162841796875, 0.1666412353515625, 0.18511962890625, 0.2035980224609375, 0.222076416015625, 0.2405548095703125, 0.259033203125, 0.2775115966796875, 0.295989990234375, 0.3144683837890625, 0.33294677734375, 0.3514251708984375, 0.369903564453125, 0.3883819580078125, 0.4068603515625, 0.4253387451171875, 0.443817138671875, 0.4622955322265625, 0.48077392578125, 0.4992523193359375, 0.517730712890625, 0.5362091064453125, 0.5546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 6.0, 8.0, 9.0, 7.0, 7.0, 16.0, 13.0, 25.0, 24.0, 33.0, 49.0, 83.0, 140.0, 207.0, 553.0, 8583.0, 1024691.0, 12768.0, 669.0, 220.0, 127.0, 68.0, 56.0, 39.0, 31.0, 21.0, 21.0, 16.0, 8.0, 5.0, 14.0, 7.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.640625, -11.2593994140625, -10.878173828125, -10.4969482421875, -10.11572265625, -9.7344970703125, -9.353271484375, -8.9720458984375, -8.5908203125, -8.2095947265625, -7.828369140625, -7.4471435546875, -7.06591796875, -6.6846923828125, -6.303466796875, -5.9222412109375, -5.541015625, -5.1597900390625, -4.778564453125, -4.3973388671875, -4.01611328125, -3.6348876953125, -3.253662109375, -2.8724365234375, -2.4912109375, -2.1099853515625, -1.728759765625, -1.3475341796875, -0.96630859375, -0.5850830078125, -0.203857421875, 0.1773681640625, 0.55859375, 0.9398193359375, 1.321044921875, 1.7022705078125, 2.08349609375, 2.4647216796875, 2.845947265625, 3.2271728515625, 3.6083984375, 3.9896240234375, 4.370849609375, 4.7520751953125, 5.13330078125, 5.5145263671875, 5.895751953125, 6.2769775390625, 6.658203125, 7.0394287109375, 7.420654296875, 7.8018798828125, 8.18310546875, 8.5643310546875, 8.945556640625, 9.3267822265625, 9.7080078125, 10.0892333984375, 10.470458984375, 10.8516845703125, 11.23291015625, 11.6141357421875, 11.995361328125, 12.3765869140625, 12.7578125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 34.0, 516.0, 426.0, 28.0, 3.0], "bins": [-9.861793518066406, -9.699729919433594, -9.537667274475098, -9.375603675842285, -9.213540077209473, -9.051477432250977, -8.889413833618164, -8.727350234985352, -8.565286636352539, -8.403223037719727, -8.24116039276123, -8.079096794128418, -7.9170331954956055, -7.754970073699951, -7.592906951904297, -7.430843353271484, -7.268780708312988, -7.106717586517334, -6.9446539878845215, -6.782590866088867, -6.620527267456055, -6.4584641456604, -6.296401023864746, -6.134337425231934, -5.972274303436279, -5.810211181640625, -5.6481475830078125, -5.486084461212158, -5.324021339416504, -5.161957740783691, -4.999894618988037, -4.837831497192383, -4.6757683753967285, -4.513705253601074, -4.351641654968262, -4.189578533172607, -4.027515411376953, -3.8654518127441406, -3.7033886909484863, -3.541325330734253, -3.3792617321014404, -3.217198371887207, -3.0551352500915527, -2.8930718898773193, -2.731008529663086, -2.5689451694488525, -2.406881809234619, -2.244818687438965, -2.0827553272247314, -1.920691967010498, -1.7586287260055542, -1.5965654850006104, -1.434502124786377, -1.2724387645721436, -1.1103755235671997, -0.9483122825622559, -0.7862489819526672, -0.6241856813430786, -0.46212238073349, -0.30005908012390137, -0.13799577951431274, 0.02406752109527588, 0.1861308217048645, 0.34819406270980835, 0.5102574229240417]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 12.0, 9.0, 8.0, 13.0, 27.0, 19.0, 27.0, 22.0, 22.0, 38.0, 44.0, 50.0, 44.0, 47.0, 42.0, 48.0, 42.0, 40.0, 44.0, 54.0, 37.0, 40.0, 34.0, 30.0, 29.0, 20.0, 20.0, 18.0, 21.0, 21.0, 12.0, 8.0, 6.0, 6.0, 3.0, 1.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7374405264854431, -0.7134808897972107, -0.6895212531089783, -0.6655616164207458, -0.6416019201278687, -0.6176422834396362, -0.5936826467514038, -0.5697230100631714, -0.545763373374939, -0.5218037366867065, -0.4978440999984741, -0.4738844335079193, -0.4499247968196869, -0.42596516013145447, -0.40200549364089966, -0.37804585695266724, -0.3540862202644348, -0.3301265835762024, -0.30616694688796997, -0.28220728039741516, -0.25824764370918274, -0.23428800702095032, -0.2103283554315567, -0.18636870384216309, -0.16240906715393066, -0.13844943046569824, -0.11448977887630463, -0.09053013473749161, -0.06657049059867859, -0.04261084645986557, -0.01865120232105255, 0.0053084492683410645, 0.02926802635192871, 0.05322767049074173, 0.07718731462955475, 0.10114695876836777, 0.1251066029071808, 0.1490662395954132, 0.17302589118480682, 0.19698554277420044, 0.22094517946243286, 0.24490481615066528, 0.2688644528388977, 0.2928241193294525, 0.31678375601768494, 0.34074339270591736, 0.36470305919647217, 0.3886626958847046, 0.412622332572937, 0.43658196926116943, 0.46054160594940186, 0.48450127243995667, 0.5084608793258667, 0.5324205756187439, 0.5563802123069763, 0.5803398489952087, 0.6042994856834412, 0.6282591223716736, 0.652218759059906, 0.6761783957481384, 0.7001380920410156, 0.724097728729248, 0.7480573654174805, 0.7720170021057129, 0.7959766387939453]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 9.0, 14.0, 5.0, 2.0, 12.0, 4.0, 17.0, 12.0, 13.0, 11.0, 19.0, 23.0, 31.0, 21.0, 30.0, 28.0, 15.0, 37.0, 34.0, 32.0, 42.0, 39.0, 39.0, 46.0, 42.0, 31.0, 37.0, 32.0, 30.0, 31.0, 24.0, 18.0, 21.0, 20.0, 20.0, 20.0, 24.0, 20.0, 19.0, 17.0, 12.0, 7.0, 9.0, 9.0, 9.0, 2.0, 5.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.859375, -3.7364501953125, -3.613525390625, -3.4906005859375, -3.36767578125, -3.2447509765625, -3.121826171875, -2.9989013671875, -2.8759765625, -2.7530517578125, -2.630126953125, -2.5072021484375, -2.38427734375, -2.2613525390625, -2.138427734375, -2.0155029296875, -1.892578125, -1.7696533203125, -1.646728515625, -1.5238037109375, -1.40087890625, -1.2779541015625, -1.155029296875, -1.0321044921875, -0.9091796875, -0.7862548828125, -0.663330078125, -0.5404052734375, -0.41748046875, -0.2945556640625, -0.171630859375, -0.0487060546875, 0.07421875, 0.1971435546875, 0.320068359375, 0.4429931640625, 0.56591796875, 0.6888427734375, 0.811767578125, 0.9346923828125, 1.0576171875, 1.1805419921875, 1.303466796875, 1.4263916015625, 1.54931640625, 1.6722412109375, 1.795166015625, 1.9180908203125, 2.041015625, 2.1639404296875, 2.286865234375, 2.4097900390625, 2.53271484375, 2.6556396484375, 2.778564453125, 2.9014892578125, 3.0244140625, 3.1473388671875, 3.270263671875, 3.3931884765625, 3.51611328125, 3.6390380859375, 3.761962890625, 3.8848876953125, 4.0078125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 12.0, 20.0, 19.0, 29.0, 27.0, 57.0, 69.0, 106.0, 171.0, 259.0, 341.0, 555.0, 927.0, 1402.0, 2484.0, 4183.0, 7339.0, 13213.0, 23808.0, 42996.0, 84355.0, 194132.0, 359533.0, 155559.0, 71658.0, 37617.0, 20248.0, 11565.0, 6442.0, 3623.0, 2154.0, 1286.0, 796.0, 497.0, 340.0, 223.0, 134.0, 97.0, 78.0, 54.0, 27.0, 27.0, 17.0, 15.0, 16.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-4.15625, -4.0238037109375, -3.891357421875, -3.7589111328125, -3.62646484375, -3.4940185546875, -3.361572265625, -3.2291259765625, -3.0966796875, -2.9642333984375, -2.831787109375, -2.6993408203125, -2.56689453125, -2.4344482421875, -2.302001953125, -2.1695556640625, -2.037109375, -1.9046630859375, -1.772216796875, -1.6397705078125, -1.50732421875, -1.3748779296875, -1.242431640625, -1.1099853515625, -0.9775390625, -0.8450927734375, -0.712646484375, -0.5802001953125, -0.44775390625, -0.3153076171875, -0.182861328125, -0.0504150390625, 0.08203125, 0.2144775390625, 0.346923828125, 0.4793701171875, 0.61181640625, 0.7442626953125, 0.876708984375, 1.0091552734375, 1.1416015625, 1.2740478515625, 1.406494140625, 1.5389404296875, 1.67138671875, 1.8038330078125, 1.936279296875, 2.0687255859375, 2.201171875, 2.3336181640625, 2.466064453125, 2.5985107421875, 2.73095703125, 2.8634033203125, 2.995849609375, 3.1282958984375, 3.2607421875, 3.3931884765625, 3.525634765625, 3.6580810546875, 3.79052734375, 3.9229736328125, 4.055419921875, 4.1878662109375, 4.3203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 1.0, 4.0, 5.0, 6.0, 8.0, 9.0, 10.0, 9.0, 12.0, 19.0, 12.0, 25.0, 24.0, 29.0, 40.0, 33.0, 32.0, 48.0, 44.0, 75.0, 118.0, 225.0, 1496.0, 241.0, 116.0, 55.0, 54.0, 43.0, 23.0, 30.0, 36.0, 21.0, 17.0, 21.0, 20.0, 16.0, 14.0, 9.0, 9.0, 9.0, 13.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.438720703125, -13.99462890625, -13.550537109375, -13.1064453125, -12.662353515625, -12.21826171875, -11.774169921875, -11.330078125, -10.885986328125, -10.44189453125, -9.997802734375, -9.5537109375, -9.109619140625, -8.66552734375, -8.221435546875, -7.77734375, -7.333251953125, -6.88916015625, -6.445068359375, -6.0009765625, -5.556884765625, -5.11279296875, -4.668701171875, -4.224609375, -3.780517578125, -3.33642578125, -2.892333984375, -2.4482421875, -2.004150390625, -1.56005859375, -1.115966796875, -0.671875, -0.227783203125, 0.21630859375, 0.660400390625, 1.1044921875, 1.548583984375, 1.99267578125, 2.436767578125, 2.880859375, 3.324951171875, 3.76904296875, 4.213134765625, 4.6572265625, 5.101318359375, 5.54541015625, 5.989501953125, 6.43359375, 6.877685546875, 7.32177734375, 7.765869140625, 8.2099609375, 8.654052734375, 9.09814453125, 9.542236328125, 9.986328125, 10.430419921875, 10.87451171875, 11.318603515625, 11.7626953125, 12.206787109375, 12.65087890625, 13.094970703125, 13.5390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 11.0, 7.0, 16.0, 12.0, 13.0, 15.0, 23.0, 31.0, 37.0, 48.0, 56.0, 83.0, 115.0, 167.0, 278.0, 556.0, 2419.0, 41363.0, 2948010.0, 146422.0, 4158.0, 820.0, 323.0, 188.0, 138.0, 96.0, 66.0, 59.0, 34.0, 20.0, 24.0, 24.0, 14.0, 12.0, 14.0, 6.0, 6.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-30.734375, -29.7626953125, -28.791015625, -27.8193359375, -26.84765625, -25.8759765625, -24.904296875, -23.9326171875, -22.9609375, -21.9892578125, -21.017578125, -20.0458984375, -19.07421875, -18.1025390625, -17.130859375, -16.1591796875, -15.1875, -14.2158203125, -13.244140625, -12.2724609375, -11.30078125, -10.3291015625, -9.357421875, -8.3857421875, -7.4140625, -6.4423828125, -5.470703125, -4.4990234375, -3.52734375, -2.5556640625, -1.583984375, -0.6123046875, 0.359375, 1.3310546875, 2.302734375, 3.2744140625, 4.24609375, 5.2177734375, 6.189453125, 7.1611328125, 8.1328125, 9.1044921875, 10.076171875, 11.0478515625, 12.01953125, 12.9912109375, 13.962890625, 14.9345703125, 15.90625, 16.8779296875, 17.849609375, 18.8212890625, 19.79296875, 20.7646484375, 21.736328125, 22.7080078125, 23.6796875, 24.6513671875, 25.623046875, 26.5947265625, 27.56640625, 28.5380859375, 29.509765625, 30.4814453125, 31.453125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 40.0, 192.0, 383.0, 292.0, 87.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.348018646240234, -13.059656143188477, -10.771293640136719, -8.482930183410645, -6.194567680358887, -3.906205177307129, -1.6178417205810547, 0.6705207824707031, 2.958883285522461, 5.247245788574219, 7.535608768463135, 9.82397174835205, 12.112334251403809, 14.400696754455566, 16.68906021118164, 18.9774227142334, 21.265785217285156, 23.554147720336914, 25.842510223388672, 28.130874633789062, 30.419235229492188, 32.70759963989258, 34.99596405029297, 37.284324645996094, 39.57268524169922, 41.86104965209961, 44.149410247802734, 46.437774658203125, 48.72613525390625, 51.01449966430664, 53.30286407470703, 55.591224670410156, 57.87958526611328, 60.16794967651367, 62.4563102722168, 64.74467468261719, 67.03303527832031, 69.32139587402344, 71.6097640991211, 73.89812469482422, 76.18648529052734, 78.47484588623047, 80.76321411132812, 83.05157470703125, 85.33993530273438, 87.6282958984375, 89.91666412353516, 92.20502471923828, 94.49339294433594, 96.78175354003906, 99.07012176513672, 101.35848236083984, 103.64684295654297, 105.9352035522461, 108.22357177734375, 110.51193237304688, 112.80029296875, 115.08865356445312, 117.37702178955078, 119.6653823852539, 121.95374298095703, 124.24210357666016, 126.53047180175781, 128.81883239746094, 131.10719299316406]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 12.0, 9.0, 13.0, 12.0, 17.0, 14.0, 20.0, 27.0, 21.0, 23.0, 23.0, 26.0, 28.0, 38.0, 34.0, 41.0, 33.0, 36.0, 35.0, 28.0, 51.0, 37.0, 40.0, 33.0, 30.0, 24.0, 38.0, 36.0, 27.0, 21.0, 23.0, 20.0, 12.0, 23.0, 15.0, 13.0, 11.0, 7.0, 8.0, 3.0, 2.0, 6.0, 3.0, 6.0, 9.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-38.676422119140625, -37.43272399902344, -36.18902587890625, -34.94532775878906, -33.701629638671875, -32.45793151855469, -31.2142333984375, -29.970535278320312, -28.726837158203125, -27.483139038085938, -26.23944091796875, -24.995742797851562, -23.752044677734375, -22.508346557617188, -21.2646484375, -20.020950317382812, -18.777252197265625, -17.533554077148438, -16.28985595703125, -15.046157836914062, -13.802459716796875, -12.558761596679688, -11.3150634765625, -10.071365356445312, -8.827667236328125, -7.5839691162109375, -6.34027099609375, -5.0965728759765625, -3.852874755859375, -2.6091766357421875, -1.365478515625, -0.1217803955078125, 1.121917724609375, 2.3656158447265625, 3.60931396484375, 4.8530120849609375, 6.096710205078125, 7.3404083251953125, 8.5841064453125, 9.827804565429688, 11.071502685546875, 12.315200805664062, 13.55889892578125, 14.802597045898438, 16.046295166015625, 17.289993286132812, 18.53369140625, 19.777389526367188, 21.021087646484375, 22.264785766601562, 23.50848388671875, 24.752182006835938, 25.995880126953125, 27.239578247070312, 28.4832763671875, 29.726974487304688, 30.970672607421875, 32.21437072753906, 33.45806884765625, 34.70176696777344, 35.945465087890625, 37.18916320800781, 38.432861328125, 39.67655944824219, 40.920257568359375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 4.0, 9.0, 10.0, 5.0, 5.0, 12.0, 13.0, 22.0, 9.0, 28.0, 22.0, 24.0, 29.0, 19.0, 38.0, 31.0, 32.0, 39.0, 26.0, 40.0, 35.0, 29.0, 41.0, 35.0, 33.0, 42.0, 35.0, 34.0, 27.0, 31.0, 21.0, 33.0, 21.0, 25.0, 18.0, 25.0, 20.0, 18.0, 12.0, 13.0, 6.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.70703125, -4.56591796875, -4.4248046875, -4.28369140625, -4.142578125, -4.00146484375, -3.8603515625, -3.71923828125, -3.578125, -3.43701171875, -3.2958984375, -3.15478515625, -3.013671875, -2.87255859375, -2.7314453125, -2.59033203125, -2.44921875, -2.30810546875, -2.1669921875, -2.02587890625, -1.884765625, -1.74365234375, -1.6025390625, -1.46142578125, -1.3203125, -1.17919921875, -1.0380859375, -0.89697265625, -0.755859375, -0.61474609375, -0.4736328125, -0.33251953125, -0.19140625, -0.05029296875, 0.0908203125, 0.23193359375, 0.373046875, 0.51416015625, 0.6552734375, 0.79638671875, 0.9375, 1.07861328125, 1.2197265625, 1.36083984375, 1.501953125, 1.64306640625, 1.7841796875, 1.92529296875, 2.06640625, 2.20751953125, 2.3486328125, 2.48974609375, 2.630859375, 2.77197265625, 2.9130859375, 3.05419921875, 3.1953125, 3.33642578125, 3.4775390625, 3.61865234375, 3.759765625, 3.90087890625, 4.0419921875, 4.18310546875, 4.32421875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 18.0, 37.0, 43.0, 81.0, 85.0, 155.0, 258.0, 344.0, 521.0, 765.0, 1158.0, 1962.0, 3082.0, 5349.0, 9820.0, 19151.0, 42325.0, 109286.0, 331213.0, 956733.0, 1461316.0, 811439.0, 273450.0, 92164.0, 36417.0, 16560.0, 8551.0, 4542.0, 2597.0, 1728.0, 1012.0, 647.0, 463.0, 279.0, 219.0, 154.0, 106.0, 70.0, 46.0, 36.0, 19.0, 10.0, 8.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.427001953125, -5.24853515625, -5.070068359375, -4.8916015625, -4.713134765625, -4.53466796875, -4.356201171875, -4.177734375, -3.999267578125, -3.82080078125, -3.642333984375, -3.4638671875, -3.285400390625, -3.10693359375, -2.928466796875, -2.75, -2.571533203125, -2.39306640625, -2.214599609375, -2.0361328125, -1.857666015625, -1.67919921875, -1.500732421875, -1.322265625, -1.143798828125, -0.96533203125, -0.786865234375, -0.6083984375, -0.429931640625, -0.25146484375, -0.072998046875, 0.10546875, 0.283935546875, 0.46240234375, 0.640869140625, 0.8193359375, 0.997802734375, 1.17626953125, 1.354736328125, 1.533203125, 1.711669921875, 1.89013671875, 2.068603515625, 2.2470703125, 2.425537109375, 2.60400390625, 2.782470703125, 2.9609375, 3.139404296875, 3.31787109375, 3.496337890625, 3.6748046875, 3.853271484375, 4.03173828125, 4.210205078125, 4.388671875, 4.567138671875, 4.74560546875, 4.924072265625, 5.1025390625, 5.281005859375, 5.45947265625, 5.637939453125, 5.81640625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 10.0, 16.0, 21.0, 22.0, 25.0, 47.0, 81.0, 116.0, 166.0, 228.0, 382.0, 521.0, 673.0, 549.0, 390.0, 301.0, 172.0, 103.0, 68.0, 53.0, 38.0, 27.0, 24.0, 15.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.04931640625, -9.6845703125, -9.31982421875, -8.955078125, -8.59033203125, -8.2255859375, -7.86083984375, -7.49609375, -7.13134765625, -6.7666015625, -6.40185546875, -6.037109375, -5.67236328125, -5.3076171875, -4.94287109375, -4.578125, -4.21337890625, -3.8486328125, -3.48388671875, -3.119140625, -2.75439453125, -2.3896484375, -2.02490234375, -1.66015625, -1.29541015625, -0.9306640625, -0.56591796875, -0.201171875, 0.16357421875, 0.5283203125, 0.89306640625, 1.2578125, 1.62255859375, 1.9873046875, 2.35205078125, 2.716796875, 3.08154296875, 3.4462890625, 3.81103515625, 4.17578125, 4.54052734375, 4.9052734375, 5.27001953125, 5.634765625, 5.99951171875, 6.3642578125, 6.72900390625, 7.09375, 7.45849609375, 7.8232421875, 8.18798828125, 8.552734375, 8.91748046875, 9.2822265625, 9.64697265625, 10.01171875, 10.37646484375, 10.7412109375, 11.10595703125, 11.470703125, 11.83544921875, 12.2001953125, 12.56494140625, 12.9296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 9.0, 13.0, 26.0, 32.0, 41.0, 59.0, 104.0, 132.0, 220.0, 361.0, 785.0, 2430.0, 49284.0, 3880070.0, 253822.0, 4695.0, 985.0, 466.0, 260.0, 175.0, 106.0, 70.0, 43.0, 38.0, 22.0, 13.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -37.06298828125, -35.8134765625, -34.56396484375, -33.314453125, -32.06494140625, -30.8154296875, -29.56591796875, -28.31640625, -27.06689453125, -25.8173828125, -24.56787109375, -23.318359375, -22.06884765625, -20.8193359375, -19.56982421875, -18.3203125, -17.07080078125, -15.8212890625, -14.57177734375, -13.322265625, -12.07275390625, -10.8232421875, -9.57373046875, -8.32421875, -7.07470703125, -5.8251953125, -4.57568359375, -3.326171875, -2.07666015625, -0.8271484375, 0.42236328125, 1.671875, 2.92138671875, 4.1708984375, 5.42041015625, 6.669921875, 7.91943359375, 9.1689453125, 10.41845703125, 11.66796875, 12.91748046875, 14.1669921875, 15.41650390625, 16.666015625, 17.91552734375, 19.1650390625, 20.41455078125, 21.6640625, 22.91357421875, 24.1630859375, 25.41259765625, 26.662109375, 27.91162109375, 29.1611328125, 30.41064453125, 31.66015625, 32.90966796875, 34.1591796875, 35.40869140625, 36.658203125, 37.90771484375, 39.1572265625, 40.40673828125, 41.65625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 121.0, 492.0, 358.0, 33.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.4548797607422, -156.1623077392578, -149.86972045898438, -143.5771484375, -137.28457641601562, -130.99200439453125, -124.69941711425781, -118.40684509277344, -112.11426544189453, -105.82168579101562, -99.52911376953125, -93.23653411865234, -86.94395446777344, -80.65138244628906, -74.35880279541016, -68.06622314453125, -61.773651123046875, -55.481075286865234, -49.188499450683594, -42.89591979980469, -36.60334396362305, -30.310768127441406, -24.0181884765625, -17.72561264038086, -11.433036804199219, -5.140460014343262, 1.1521167755126953, 7.444694519042969, 13.73727035522461, 20.02984619140625, 26.322425842285156, 32.6150016784668, 38.907562255859375, 45.200138092041016, 51.492713928222656, 57.78529357910156, 64.07786560058594, 70.37044525146484, 76.66302490234375, 82.95559692382812, 89.24817657470703, 95.54075622558594, 101.83332824707031, 108.12590789794922, 114.41848754882812, 120.7110595703125, 127.0036392211914, 133.2962188720703, 139.5887908935547, 145.88136291503906, 152.1739501953125, 158.46652221679688, 164.75909423828125, 171.05166625976562, 177.34425354003906, 183.63682556152344, 189.92941284179688, 196.22198486328125, 202.5145721435547, 208.80714416503906, 215.09971618652344, 221.39230346679688, 227.68487548828125, 233.97744750976562, 240.27001953125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 6.0, 8.0, 5.0, 7.0, 14.0, 7.0, 9.0, 9.0, 15.0, 14.0, 16.0, 18.0, 22.0, 25.0, 27.0, 31.0, 33.0, 28.0, 34.0, 37.0, 33.0, 42.0, 45.0, 40.0, 33.0, 49.0, 35.0, 33.0, 38.0, 32.0, 31.0, 21.0, 26.0, 23.0, 25.0, 20.0, 21.0, 14.0, 15.0, 12.0, 11.0, 14.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.650732040405273, -25.792898178100586, -24.9350643157959, -24.07723045349121, -23.219398498535156, -22.36156463623047, -21.50373077392578, -20.645896911621094, -19.788063049316406, -18.93022918701172, -18.07239532470703, -17.214561462402344, -16.356727600097656, -15.498894691467285, -14.641061782836914, -13.783227920532227, -12.925394058227539, -12.067560195922852, -11.209726333618164, -10.351893424987793, -9.494059562683105, -8.636225700378418, -7.778392314910889, -6.920558929443359, -6.062725067138672, -5.204891204833984, -4.347057819366455, -3.4892241954803467, -2.6313905715942383, -1.7735567092895508, -0.9157233238220215, -0.05788993835449219, 0.7999420166015625, 1.657775640487671, 2.5156092643737793, 3.3734428882598877, 4.231276512145996, 5.089110374450684, 5.946943759918213, 6.804777145385742, 7.66261100769043, 8.520444869995117, 9.378278732299805, 10.236111640930176, 11.093945503234863, 11.95177936553955, 12.809612274169922, 13.66744613647461, 14.525279998779297, 15.383113861083984, 16.240947723388672, 17.09878158569336, 17.956615447998047, 18.814449310302734, 19.67228126525879, 20.530115127563477, 21.387948989868164, 22.24578285217285, 23.10361671447754, 23.961450576782227, 24.81928253173828, 25.67711639404297, 26.534950256347656, 27.392784118652344, 28.25061798095703]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 6.0, 14.0, 10.0, 14.0, 16.0, 26.0, 18.0, 20.0, 31.0, 29.0, 30.0, 22.0, 35.0, 35.0, 44.0, 34.0, 37.0, 35.0, 42.0, 37.0, 30.0, 41.0, 39.0, 38.0, 29.0, 41.0, 29.0, 27.0, 29.0, 24.0, 9.0, 19.0, 16.0, 14.0, 19.0, 11.0, 9.0, 6.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.85546875, -4.716552734375, -4.57763671875, -4.438720703125, -4.2998046875, -4.160888671875, -4.02197265625, -3.883056640625, -3.744140625, -3.605224609375, -3.46630859375, -3.327392578125, -3.1884765625, -3.049560546875, -2.91064453125, -2.771728515625, -2.6328125, -2.493896484375, -2.35498046875, -2.216064453125, -2.0771484375, -1.938232421875, -1.79931640625, -1.660400390625, -1.521484375, -1.382568359375, -1.24365234375, -1.104736328125, -0.9658203125, -0.826904296875, -0.68798828125, -0.549072265625, -0.41015625, -0.271240234375, -0.13232421875, 0.006591796875, 0.1455078125, 0.284423828125, 0.42333984375, 0.562255859375, 0.701171875, 0.840087890625, 0.97900390625, 1.117919921875, 1.2568359375, 1.395751953125, 1.53466796875, 1.673583984375, 1.8125, 1.951416015625, 2.09033203125, 2.229248046875, 2.3681640625, 2.507080078125, 2.64599609375, 2.784912109375, 2.923828125, 3.062744140625, 3.20166015625, 3.340576171875, 3.4794921875, 3.618408203125, 3.75732421875, 3.896240234375, 4.03515625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 17.0, 24.0, 29.0, 58.0, 54.0, 103.0, 111.0, 153.0, 254.0, 361.0, 464.0, 784.0, 1192.0, 1773.0, 2845.0, 4616.0, 7554.0, 13381.0, 24948.0, 50882.0, 113986.0, 250558.0, 291308.0, 147925.0, 64561.0, 30717.0, 16148.0, 9013.0, 5285.0, 3193.0, 2097.0, 1315.0, 910.0, 595.0, 383.0, 316.0, 170.0, 151.0, 101.0, 69.0, 30.0, 29.0, 24.0, 16.0, 10.0, 5.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4770050048828125, -1.429595947265625, -1.3821868896484375, -1.33477783203125, -1.2873687744140625, -1.239959716796875, -1.1925506591796875, -1.1451416015625, -1.0977325439453125, -1.050323486328125, -1.0029144287109375, -0.95550537109375, -0.9080963134765625, -0.860687255859375, -0.8132781982421875, -0.765869140625, -0.7184600830078125, -0.671051025390625, -0.6236419677734375, -0.57623291015625, -0.5288238525390625, -0.481414794921875, -0.4340057373046875, -0.3865966796875, -0.3391876220703125, -0.291778564453125, -0.2443695068359375, -0.19696044921875, -0.1495513916015625, -0.102142333984375, -0.0547332763671875, -0.00732421875, 0.0400848388671875, 0.087493896484375, 0.1349029541015625, 0.18231201171875, 0.2297210693359375, 0.277130126953125, 0.3245391845703125, 0.3719482421875, 0.4193572998046875, 0.466766357421875, 0.5141754150390625, 0.56158447265625, 0.6089935302734375, 0.656402587890625, 0.7038116455078125, 0.751220703125, 0.7986297607421875, 0.846038818359375, 0.8934478759765625, 0.94085693359375, 0.9882659912109375, 1.035675048828125, 1.0830841064453125, 1.1304931640625, 1.1779022216796875, 1.225311279296875, 1.2727203369140625, 1.32012939453125, 1.3675384521484375, 1.414947509765625, 1.4623565673828125, 1.509765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 9.0, 7.0, 13.0, 10.0, 24.0, 14.0, 19.0, 18.0, 18.0, 26.0, 21.0, 25.0, 28.0, 26.0, 29.0, 32.0, 36.0, 39.0, 49.0, 1053.0, 37.0, 44.0, 34.0, 33.0, 41.0, 35.0, 35.0, 18.0, 30.0, 28.0, 26.0, 22.0, 17.0, 15.0, 12.0, 13.0, 16.0, 7.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.14453125, -3.048828125, -2.953125, -2.857421875, -2.76171875, -2.666015625, -2.5703125, -2.474609375, -2.37890625, -2.283203125, -2.1875, -2.091796875, -1.99609375, -1.900390625, -1.8046875, -1.708984375, -1.61328125, -1.517578125, -1.421875, -1.326171875, -1.23046875, -1.134765625, -1.0390625, -0.943359375, -0.84765625, -0.751953125, -0.65625, -0.560546875, -0.46484375, -0.369140625, -0.2734375, -0.177734375, -0.08203125, 0.013671875, 0.109375, 0.205078125, 0.30078125, 0.396484375, 0.4921875, 0.587890625, 0.68359375, 0.779296875, 0.875, 0.970703125, 1.06640625, 1.162109375, 1.2578125, 1.353515625, 1.44921875, 1.544921875, 1.640625, 1.736328125, 1.83203125, 1.927734375, 2.0234375, 2.119140625, 2.21484375, 2.310546875, 2.40625, 2.501953125, 2.59765625, 2.693359375, 2.7890625, 2.884765625, 2.98046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 7.0, 6.0, 16.0, 25.0, 27.0, 26.0, 30.0, 64.0, 70.0, 82.0, 129.0, 169.0, 261.0, 393.0, 542.0, 829.0, 1363.0, 2243.0, 4321.0, 9131.0, 23796.0, 84990.0, 593910.0, 1198773.0, 122052.0, 30588.0, 10924.0, 5170.0, 2706.0, 1515.0, 925.0, 643.0, 384.0, 293.0, 194.0, 142.0, 84.0, 61.0, 67.0, 48.0, 32.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.748046875, -1.691864013671875, -1.63568115234375, -1.579498291015625, -1.5233154296875, -1.467132568359375, -1.41094970703125, -1.354766845703125, -1.298583984375, -1.242401123046875, -1.18621826171875, -1.130035400390625, -1.0738525390625, -1.017669677734375, -0.96148681640625, -0.905303955078125, -0.84912109375, -0.792938232421875, -0.73675537109375, -0.680572509765625, -0.6243896484375, -0.568206787109375, -0.51202392578125, -0.455841064453125, -0.399658203125, -0.343475341796875, -0.28729248046875, -0.231109619140625, -0.1749267578125, -0.118743896484375, -0.06256103515625, -0.006378173828125, 0.0498046875, 0.105987548828125, 0.16217041015625, 0.218353271484375, 0.2745361328125, 0.330718994140625, 0.38690185546875, 0.443084716796875, 0.499267578125, 0.555450439453125, 0.61163330078125, 0.667816162109375, 0.7239990234375, 0.780181884765625, 0.83636474609375, 0.892547607421875, 0.94873046875, 1.004913330078125, 1.06109619140625, 1.117279052734375, 1.1734619140625, 1.229644775390625, 1.28582763671875, 1.342010498046875, 1.398193359375, 1.454376220703125, 1.51055908203125, 1.566741943359375, 1.6229248046875, 1.679107666015625, 1.73529052734375, 1.791473388671875, 1.84765625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 9.0, 10.0, 10.0, 10.0, 15.0, 14.0, 30.0, 28.0, 44.0, 81.0, 206.0, 214.0, 118.0, 68.0, 31.0, 22.0, 15.0, 13.0, 9.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6787109375, -0.65692138671875, -0.6351318359375, -0.61334228515625, -0.591552734375, -0.56976318359375, -0.5479736328125, -0.52618408203125, -0.50439453125, -0.48260498046875, -0.4608154296875, -0.43902587890625, -0.417236328125, -0.39544677734375, -0.3736572265625, -0.35186767578125, -0.330078125, -0.30828857421875, -0.2864990234375, -0.26470947265625, -0.242919921875, -0.22113037109375, -0.1993408203125, -0.17755126953125, -0.15576171875, -0.13397216796875, -0.1121826171875, -0.09039306640625, -0.068603515625, -0.04681396484375, -0.0250244140625, -0.00323486328125, 0.0185546875, 0.04034423828125, 0.0621337890625, 0.08392333984375, 0.105712890625, 0.12750244140625, 0.1492919921875, 0.17108154296875, 0.19287109375, 0.21466064453125, 0.2364501953125, 0.25823974609375, 0.280029296875, 0.30181884765625, 0.3236083984375, 0.34539794921875, 0.3671875, 0.38897705078125, 0.4107666015625, 0.43255615234375, 0.454345703125, 0.47613525390625, 0.4979248046875, 0.51971435546875, 0.54150390625, 0.56329345703125, 0.5850830078125, 0.60687255859375, 0.628662109375, 0.65045166015625, 0.6722412109375, 0.69403076171875, 0.7158203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 3.0, 7.0, 11.0, 14.0, 12.0, 19.0, 31.0, 27.0, 62.0, 103.0, 191.0, 1202.0, 962332.0, 83356.0, 672.0, 162.0, 86.0, 69.0, 34.0, 34.0, 18.0, 16.0, 20.0, 10.0, 11.0, 6.0, 4.0, 4.0, 0.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-13.78125, -13.3623046875, -12.943359375, -12.5244140625, -12.10546875, -11.6865234375, -11.267578125, -10.8486328125, -10.4296875, -10.0107421875, -9.591796875, -9.1728515625, -8.75390625, -8.3349609375, -7.916015625, -7.4970703125, -7.078125, -6.6591796875, -6.240234375, -5.8212890625, -5.40234375, -4.9833984375, -4.564453125, -4.1455078125, -3.7265625, -3.3076171875, -2.888671875, -2.4697265625, -2.05078125, -1.6318359375, -1.212890625, -0.7939453125, -0.375, 0.0439453125, 0.462890625, 0.8818359375, 1.30078125, 1.7197265625, 2.138671875, 2.5576171875, 2.9765625, 3.3955078125, 3.814453125, 4.2333984375, 4.65234375, 5.0712890625, 5.490234375, 5.9091796875, 6.328125, 6.7470703125, 7.166015625, 7.5849609375, 8.00390625, 8.4228515625, 8.841796875, 9.2607421875, 9.6796875, 10.0986328125, 10.517578125, 10.9365234375, 11.35546875, 11.7744140625, 12.193359375, 12.6123046875, 13.03125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 22.0, 221.0, 602.0, 159.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9447059631347656, -0.8324639797210693, -0.7202219367027283, -0.607979953289032, -0.4957379400730133, -0.38349592685699463, -0.27125394344329834, -0.15901190042495728, -0.046769917011260986, 0.0654720887541771, 0.17771409451961517, 0.28995609283447266, 0.40219810605049133, 0.51444011926651, 0.6266821026802063, 0.7389241456985474, 0.8511661291122437, 0.9634081125259399, 1.0756500959396362, 1.187892198562622, 1.3001341819763184, 1.4123761653900146, 1.524618148803711, 1.6368601322174072, 1.7491021156311035, 1.8613440990447998, 1.973586082458496, 2.0858280658721924, 2.1980700492858887, 2.310312271118164, 2.4225540161132812, 2.5347962379455566, 2.647038221359253, 2.759280204772949, 2.8715221881866455, 2.983764171600342, 3.096006155014038, 3.2082481384277344, 3.3204903602600098, 3.432732343673706, 3.5449743270874023, 3.6572163105010986, 3.769458293914795, 3.881700277328491, 3.9939422607421875, 4.106184482574463, 4.21842622756958, 4.3306684494018555, 4.442910194396973, 4.555152416229248, 4.667394161224365, 4.779636383056641, 4.891878128051758, 5.004120349884033, 5.11636209487915, 5.228604316711426, 5.340846538543701, 5.453088760375977, 5.565330505371094, 5.677572727203369, 5.789814472198486, 5.902056694030762, 6.014298439025879, 6.126540660858154, 6.2387824058532715]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 10.0, 10.0, 7.0, 19.0, 20.0, 16.0, 15.0, 27.0, 35.0, 29.0, 27.0, 40.0, 34.0, 36.0, 57.0, 48.0, 43.0, 39.0, 40.0, 44.0, 48.0, 43.0, 30.0, 30.0, 40.0, 25.0, 27.0, 29.0, 28.0, 21.0, 10.0, 12.0, 11.0, 11.0, 9.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5560384392738342, -0.5367377996444702, -0.517437219619751, -0.49813660979270935, -0.4788359999656677, -0.4595353603363037, -0.4402347505092621, -0.42093414068222046, -0.40163353085517883, -0.3823329210281372, -0.3630323112010956, -0.34373170137405396, -0.32443106174468994, -0.3051304817199707, -0.2858298420906067, -0.26652923226356506, -0.24722862243652344, -0.2279280126094818, -0.20862740278244019, -0.18932677805423737, -0.17002616822719574, -0.1507255584001541, -0.1314249336719513, -0.11212432384490967, -0.09282371401786804, -0.07352310419082642, -0.05422248691320419, -0.03492187336087227, -0.015621259808540344, 0.0036793500185012817, 0.022979967296123505, 0.04228058457374573, 0.061581194400787354, 0.08088180422782898, 0.1001824215054512, 0.11948303878307343, 0.13878364861011505, 0.15808425843715668, 0.1773848831653595, 0.19668549299240112, 0.21598610281944275, 0.23528671264648438, 0.254587322473526, 0.2738879323005676, 0.29318857192993164, 0.3124891519546509, 0.3317897915840149, 0.3510904014110565, 0.37039101123809814, 0.38969162106513977, 0.4089922308921814, 0.428292840719223, 0.44759345054626465, 0.46689409017562866, 0.4861947000026703, 0.5054953098297119, 0.5247958898544312, 0.5440965294837952, 0.5633971095085144, 0.5826977491378784, 0.6019983291625977, 0.6212989687919617, 0.6405995488166809, 0.6599001884460449, 0.6792008280754089]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 12.0, 11.0, 18.0, 19.0, 21.0, 27.0, 30.0, 41.0, 40.0, 23.0, 30.0, 39.0, 44.0, 45.0, 31.0, 52.0, 40.0, 38.0, 43.0, 46.0, 36.0, 25.0, 43.0, 35.0, 16.0, 34.0, 21.0, 16.0, 22.0, 22.0, 15.0, 16.0, 6.0, 9.0, 6.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.27734375, -5.12322998046875, -4.9691162109375, -4.81500244140625, -4.660888671875, -4.50677490234375, -4.3526611328125, -4.19854736328125, -4.04443359375, -3.89031982421875, -3.7362060546875, -3.58209228515625, -3.427978515625, -3.27386474609375, -3.1197509765625, -2.96563720703125, -2.8115234375, -2.65740966796875, -2.5032958984375, -2.34918212890625, -2.195068359375, -2.04095458984375, -1.8868408203125, -1.73272705078125, -1.57861328125, -1.42449951171875, -1.2703857421875, -1.11627197265625, -0.962158203125, -0.80804443359375, -0.6539306640625, -0.49981689453125, -0.345703125, -0.19158935546875, -0.0374755859375, 0.11663818359375, 0.270751953125, 0.42486572265625, 0.5789794921875, 0.73309326171875, 0.88720703125, 1.04132080078125, 1.1954345703125, 1.34954833984375, 1.503662109375, 1.65777587890625, 1.8118896484375, 1.96600341796875, 2.1201171875, 2.27423095703125, 2.4283447265625, 2.58245849609375, 2.736572265625, 2.89068603515625, 3.0447998046875, 3.19891357421875, 3.35302734375, 3.50714111328125, 3.6612548828125, 3.81536865234375, 3.969482421875, 4.12359619140625, 4.2777099609375, 4.43182373046875, 4.5859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 9.0, 12.0, 29.0, 31.0, 57.0, 86.0, 112.0, 136.0, 216.0, 323.0, 496.0, 728.0, 1067.0, 1676.0, 2899.0, 4592.0, 7917.0, 14289.0, 26145.0, 51253.0, 113992.0, 277063.0, 298817.0, 125515.0, 56376.0, 28110.0, 14938.0, 8428.0, 4991.0, 2958.0, 1883.0, 1097.0, 743.0, 512.0, 325.0, 226.0, 150.0, 118.0, 79.0, 52.0, 31.0, 17.0, 22.0, 13.0, 5.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.609375, -6.42083740234375, -6.2322998046875, -6.04376220703125, -5.855224609375, -5.66668701171875, -5.4781494140625, -5.28961181640625, -5.10107421875, -4.91253662109375, -4.7239990234375, -4.53546142578125, -4.346923828125, -4.15838623046875, -3.9698486328125, -3.78131103515625, -3.5927734375, -3.40423583984375, -3.2156982421875, -3.02716064453125, -2.838623046875, -2.65008544921875, -2.4615478515625, -2.27301025390625, -2.08447265625, -1.89593505859375, -1.7073974609375, -1.51885986328125, -1.330322265625, -1.14178466796875, -0.9532470703125, -0.76470947265625, -0.576171875, -0.38763427734375, -0.1990966796875, -0.01055908203125, 0.177978515625, 0.36651611328125, 0.5550537109375, 0.74359130859375, 0.93212890625, 1.12066650390625, 1.3092041015625, 1.49774169921875, 1.686279296875, 1.87481689453125, 2.0633544921875, 2.25189208984375, 2.4404296875, 2.62896728515625, 2.8175048828125, 3.00604248046875, 3.194580078125, 3.38311767578125, 3.5716552734375, 3.76019287109375, 3.94873046875, 4.13726806640625, 4.3258056640625, 4.51434326171875, 4.702880859375, 4.89141845703125, 5.0799560546875, 5.26849365234375, 5.45703125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 16.0, 14.0, 16.0, 15.0, 24.0, 18.0, 30.0, 25.0, 39.0, 34.0, 40.0, 36.0, 59.0, 112.0, 236.0, 1404.0, 281.0, 142.0, 66.0, 57.0, 44.0, 38.0, 38.0, 35.0, 25.0, 20.0, 22.0, 23.0, 15.0, 21.0, 11.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8984375, -14.427978515625, -13.95751953125, -13.487060546875, -13.0166015625, -12.546142578125, -12.07568359375, -11.605224609375, -11.134765625, -10.664306640625, -10.19384765625, -9.723388671875, -9.2529296875, -8.782470703125, -8.31201171875, -7.841552734375, -7.37109375, -6.900634765625, -6.43017578125, -5.959716796875, -5.4892578125, -5.018798828125, -4.54833984375, -4.077880859375, -3.607421875, -3.136962890625, -2.66650390625, -2.196044921875, -1.7255859375, -1.255126953125, -0.78466796875, -0.314208984375, 0.15625, 0.626708984375, 1.09716796875, 1.567626953125, 2.0380859375, 2.508544921875, 2.97900390625, 3.449462890625, 3.919921875, 4.390380859375, 4.86083984375, 5.331298828125, 5.8017578125, 6.272216796875, 6.74267578125, 7.213134765625, 7.68359375, 8.154052734375, 8.62451171875, 9.094970703125, 9.5654296875, 10.035888671875, 10.50634765625, 10.976806640625, 11.447265625, 11.917724609375, 12.38818359375, 12.858642578125, 13.3291015625, 13.799560546875, 14.27001953125, 14.740478515625, 15.2109375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 8.0, 16.0, 20.0, 18.0, 21.0, 44.0, 46.0, 47.0, 68.0, 97.0, 127.0, 180.0, 232.0, 437.0, 1071.0, 3965.0, 21376.0, 361700.0, 2661812.0, 81182.0, 9358.0, 2049.0, 650.0, 357.0, 198.0, 132.0, 107.0, 76.0, 67.0, 59.0, 36.0, 21.0, 20.0, 21.0, 9.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.578125, -21.878662109375, -21.17919921875, -20.479736328125, -19.7802734375, -19.080810546875, -18.38134765625, -17.681884765625, -16.982421875, -16.282958984375, -15.58349609375, -14.884033203125, -14.1845703125, -13.485107421875, -12.78564453125, -12.086181640625, -11.38671875, -10.687255859375, -9.98779296875, -9.288330078125, -8.5888671875, -7.889404296875, -7.18994140625, -6.490478515625, -5.791015625, -5.091552734375, -4.39208984375, -3.692626953125, -2.9931640625, -2.293701171875, -1.59423828125, -0.894775390625, -0.1953125, 0.504150390625, 1.20361328125, 1.903076171875, 2.6025390625, 3.302001953125, 4.00146484375, 4.700927734375, 5.400390625, 6.099853515625, 6.79931640625, 7.498779296875, 8.1982421875, 8.897705078125, 9.59716796875, 10.296630859375, 10.99609375, 11.695556640625, 12.39501953125, 13.094482421875, 13.7939453125, 14.493408203125, 15.19287109375, 15.892333984375, 16.591796875, 17.291259765625, 17.99072265625, 18.690185546875, 19.3896484375, 20.089111328125, 20.78857421875, 21.488037109375, 22.1875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 13.0, 134.0, 528.0, 305.0, 32.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.140018463134766, -40.91276550292969, -36.68551254272461, -32.45825958251953, -28.23100471496582, -24.003751754760742, -19.77649688720703, -15.549243927001953, -11.321990966796875, -7.094737529754639, -2.8674840927124023, 1.3597698211669922, 5.58702278137207, 9.814275741577148, 14.04153060913086, 18.268783569335938, 22.496036529541016, 26.723289489746094, 30.950542449951172, 35.17779541015625, 39.405052185058594, 43.632301330566406, 47.85955810546875, 52.08681106567383, 56.314064025878906, 60.541316986083984, 64.76856994628906, 68.9958267211914, 73.22307586669922, 77.45033264160156, 81.67758178710938, 85.90483856201172, 90.132080078125, 94.35933685302734, 98.58658599853516, 102.8138427734375, 107.04109191894531, 111.26834869384766, 115.49560546875, 119.72285461425781, 123.95010375976562, 128.17735290527344, 132.4046173095703, 136.63186645507812, 140.85911560058594, 145.08636474609375, 149.31362915039062, 153.54087829589844, 157.76812744140625, 161.99537658691406, 166.22264099121094, 170.44989013671875, 174.67713928222656, 178.90438842773438, 183.13165283203125, 187.35890197753906, 191.58616638183594, 195.81341552734375, 200.04067993164062, 204.26792907714844, 208.49517822265625, 212.72242736816406, 216.94969177246094, 221.17694091796875, 225.40419006347656]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 7.0, 9.0, 13.0, 18.0, 15.0, 20.0, 13.0, 16.0, 29.0, 25.0, 26.0, 28.0, 27.0, 34.0, 44.0, 37.0, 54.0, 53.0, 53.0, 28.0, 41.0, 36.0, 41.0, 42.0, 27.0, 32.0, 35.0, 25.0, 29.0, 30.0, 23.0, 13.0, 9.0, 12.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.925567626953125, -40.7198371887207, -39.51411056518555, -38.308380126953125, -37.1026496887207, -35.89691925048828, -34.691192626953125, -33.4854621887207, -32.27973175048828, -31.074003219604492, -29.86827278137207, -28.66254425048828, -27.45681381225586, -26.25108528137207, -25.04535675048828, -23.83962631225586, -22.633899688720703, -21.428171157836914, -20.222440719604492, -19.016712188720703, -17.81098175048828, -16.605253219604492, -15.399524688720703, -14.193795204162598, -12.988065719604492, -11.782336235046387, -10.576606750488281, -9.370878219604492, -8.165148735046387, -6.959419250488281, -5.753690242767334, -4.547961235046387, -3.3422279357910156, -2.1364986896514893, -0.9307694435119629, 0.2749598026275635, 1.4806890487670898, 2.6864185333251953, 3.8921475410461426, 5.09787654876709, 6.303606033325195, 7.509335517883301, 8.715065002441406, 9.920793533325195, 11.1265230178833, 12.332252502441406, 13.537981033325195, 14.7437105178833, 15.949440002441406, 17.155168533325195, 18.360898971557617, 19.566627502441406, 20.772357940673828, 21.978086471557617, 23.183815002441406, 24.389545440673828, 25.595273971557617, 26.801002502441406, 28.006732940673828, 29.212461471557617, 30.418190002441406, 31.623920440673828, 32.82965087890625, 34.035377502441406, 35.24110794067383]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 5.0, 9.0, 9.0, 14.0, 23.0, 24.0, 27.0, 21.0, 32.0, 23.0, 28.0, 29.0, 38.0, 30.0, 40.0, 41.0, 37.0, 53.0, 53.0, 34.0, 41.0, 54.0, 43.0, 35.0, 41.0, 23.0, 27.0, 25.0, 19.0, 17.0, 14.0, 16.0, 13.0, 18.0, 9.0, 8.0, 2.0, 5.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.5390625, -5.38116455078125, -5.2232666015625, -5.06536865234375, -4.907470703125, -4.74957275390625, -4.5916748046875, -4.43377685546875, -4.27587890625, -4.11798095703125, -3.9600830078125, -3.80218505859375, -3.644287109375, -3.48638916015625, -3.3284912109375, -3.17059326171875, -3.0126953125, -2.85479736328125, -2.6968994140625, -2.53900146484375, -2.381103515625, -2.22320556640625, -2.0653076171875, -1.90740966796875, -1.74951171875, -1.59161376953125, -1.4337158203125, -1.27581787109375, -1.117919921875, -0.96002197265625, -0.8021240234375, -0.64422607421875, -0.486328125, -0.32843017578125, -0.1705322265625, -0.01263427734375, 0.145263671875, 0.30316162109375, 0.4610595703125, 0.61895751953125, 0.77685546875, 0.93475341796875, 1.0926513671875, 1.25054931640625, 1.408447265625, 1.56634521484375, 1.7242431640625, 1.88214111328125, 2.0400390625, 2.19793701171875, 2.3558349609375, 2.51373291015625, 2.671630859375, 2.82952880859375, 2.9874267578125, 3.14532470703125, 3.30322265625, 3.46112060546875, 3.6190185546875, 3.77691650390625, 3.934814453125, 4.09271240234375, 4.2506103515625, 4.40850830078125, 4.56640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 11.0, 11.0, 21.0, 18.0, 21.0, 33.0, 47.0, 55.0, 104.0, 255.0, 515.0, 1478.0, 4313.0, 16256.0, 93538.0, 1205098.0, 2596807.0, 235284.0, 29724.0, 6989.0, 2157.0, 745.0, 348.0, 146.0, 85.0, 41.0, 34.0, 23.0, 21.0, 25.0, 14.0, 17.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.3515625, -13.955078125, -13.55859375, -13.162109375, -12.765625, -12.369140625, -11.97265625, -11.576171875, -11.1796875, -10.783203125, -10.38671875, -9.990234375, -9.59375, -9.197265625, -8.80078125, -8.404296875, -8.0078125, -7.611328125, -7.21484375, -6.818359375, -6.421875, -6.025390625, -5.62890625, -5.232421875, -4.8359375, -4.439453125, -4.04296875, -3.646484375, -3.25, -2.853515625, -2.45703125, -2.060546875, -1.6640625, -1.267578125, -0.87109375, -0.474609375, -0.078125, 0.318359375, 0.71484375, 1.111328125, 1.5078125, 1.904296875, 2.30078125, 2.697265625, 3.09375, 3.490234375, 3.88671875, 4.283203125, 4.6796875, 5.076171875, 5.47265625, 5.869140625, 6.265625, 6.662109375, 7.05859375, 7.455078125, 7.8515625, 8.248046875, 8.64453125, 9.041015625, 9.4375, 9.833984375, 10.23046875, 10.626953125, 11.0234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 8.0, 18.0, 16.0, 16.0, 26.0, 44.0, 40.0, 48.0, 73.0, 112.0, 158.0, 227.0, 282.0, 398.0, 510.0, 560.0, 408.0, 306.0, 221.0, 140.0, 105.0, 93.0, 68.0, 40.0, 29.0, 20.0, 20.0, 19.0, 16.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.59375, -8.3482666015625, -8.102783203125, -7.8572998046875, -7.61181640625, -7.3663330078125, -7.120849609375, -6.8753662109375, -6.6298828125, -6.3843994140625, -6.138916015625, -5.8934326171875, -5.64794921875, -5.4024658203125, -5.156982421875, -4.9114990234375, -4.666015625, -4.4205322265625, -4.175048828125, -3.9295654296875, -3.68408203125, -3.4385986328125, -3.193115234375, -2.9476318359375, -2.7021484375, -2.4566650390625, -2.211181640625, -1.9656982421875, -1.72021484375, -1.4747314453125, -1.229248046875, -0.9837646484375, -0.73828125, -0.4927978515625, -0.247314453125, -0.0018310546875, 0.24365234375, 0.4891357421875, 0.734619140625, 0.9801025390625, 1.2255859375, 1.4710693359375, 1.716552734375, 1.9620361328125, 2.20751953125, 2.4530029296875, 2.698486328125, 2.9439697265625, 3.189453125, 3.4349365234375, 3.680419921875, 3.9259033203125, 4.17138671875, 4.4168701171875, 4.662353515625, 4.9078369140625, 5.1533203125, 5.3988037109375, 5.644287109375, 5.8897705078125, 6.13525390625, 6.3807373046875, 6.626220703125, 6.8717041015625, 7.1171875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 10.0, 12.0, 12.0, 20.0, 31.0, 48.0, 44.0, 55.0, 99.0, 144.0, 225.0, 357.0, 729.0, 2497.0, 18914.0, 439432.0, 3572902.0, 146560.0, 9063.0, 1581.0, 614.0, 312.0, 194.0, 101.0, 87.0, 57.0, 44.0, 44.0, 22.0, 17.0, 10.0, 16.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.140625, -24.338623046875, -23.53662109375, -22.734619140625, -21.9326171875, -21.130615234375, -20.32861328125, -19.526611328125, -18.724609375, -17.922607421875, -17.12060546875, -16.318603515625, -15.5166015625, -14.714599609375, -13.91259765625, -13.110595703125, -12.30859375, -11.506591796875, -10.70458984375, -9.902587890625, -9.1005859375, -8.298583984375, -7.49658203125, -6.694580078125, -5.892578125, -5.090576171875, -4.28857421875, -3.486572265625, -2.6845703125, -1.882568359375, -1.08056640625, -0.278564453125, 0.5234375, 1.325439453125, 2.12744140625, 2.929443359375, 3.7314453125, 4.533447265625, 5.33544921875, 6.137451171875, 6.939453125, 7.741455078125, 8.54345703125, 9.345458984375, 10.1474609375, 10.949462890625, 11.75146484375, 12.553466796875, 13.35546875, 14.157470703125, 14.95947265625, 15.761474609375, 16.5634765625, 17.365478515625, 18.16748046875, 18.969482421875, 19.771484375, 20.573486328125, 21.37548828125, 22.177490234375, 22.9794921875, 23.781494140625, 24.58349609375, 25.385498046875, 26.1875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 11.0, 41.0, 103.0, 161.0, 229.0, 174.0, 146.0, 78.0, 38.0, 16.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.330360412597656, -38.19539260864258, -36.0604248046875, -33.92545700073242, -31.79048728942871, -29.655519485473633, -27.520549774169922, -25.385581970214844, -23.250614166259766, -21.115646362304688, -18.98067855834961, -16.8457088470459, -14.71074104309082, -12.575773239135742, -10.440804481506348, -8.305835723876953, -6.170867919921875, -4.035899639129639, -1.9009313583374023, 0.23403692245483398, 2.3690052032470703, 4.503973007202148, 6.638941764831543, 8.773910522460938, 10.908878326416016, 13.043846130371094, 15.178814888000488, 17.313783645629883, 19.44875144958496, 21.58371925354004, 23.71868896484375, 25.853656768798828, 27.988624572753906, 30.123592376708984, 32.25856018066406, 34.39352798461914, 36.52849578857422, 38.66346740722656, 40.79843521118164, 42.93340301513672, 45.0683708190918, 47.203338623046875, 49.33830642700195, 51.47327423095703, 53.608245849609375, 55.74320983886719, 57.87818145751953, 60.01314926147461, 62.14811706542969, 64.28308868408203, 66.41805267333984, 68.55302429199219, 70.68798828125, 72.82295989990234, 74.95792388916016, 77.0928955078125, 79.22785949707031, 81.36283111572266, 83.49779510498047, 85.63276672363281, 87.76773071289062, 89.90270233154297, 92.03766632080078, 94.17263793945312, 96.30760955810547]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 10.0, 5.0, 6.0, 10.0, 9.0, 15.0, 15.0, 27.0, 21.0, 19.0, 20.0, 27.0, 41.0, 21.0, 49.0, 34.0, 60.0, 44.0, 45.0, 41.0, 37.0, 56.0, 51.0, 45.0, 53.0, 35.0, 33.0, 30.0, 20.0, 25.0, 16.0, 12.0, 15.0, 9.0, 10.0, 9.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.600439071655273, -25.691951751708984, -24.783462524414062, -23.874975204467773, -22.966487884521484, -22.057998657226562, -21.149511337280273, -20.241024017333984, -19.332534790039062, -18.424047470092773, -17.51555824279785, -16.607070922851562, -15.698582649230957, -14.790094375610352, -13.881607055664062, -12.973118782043457, -12.064630508422852, -11.156142234802246, -10.24765396118164, -9.339166641235352, -8.430678367614746, -7.522190093994141, -6.613702297210693, -5.705214500427246, -4.796726226806641, -3.8882381916046143, -2.979750156402588, -2.0712621212005615, -1.1627740859985352, -0.2542858123779297, 0.6542019844055176, 1.5626897811889648, 2.471179962158203, 3.3796679973602295, 4.288156032562256, 5.196643829345703, 6.105132102966309, 7.013620376586914, 7.922108173370361, 8.830595970153809, 9.739084243774414, 10.64757251739502, 11.556060791015625, 12.464548110961914, 13.37303638458252, 14.281524658203125, 15.190011978149414, 16.098499298095703, 17.006988525390625, 17.915475845336914, 18.823965072631836, 19.732452392578125, 20.640941619873047, 21.549428939819336, 22.457916259765625, 23.366405487060547, 24.274892807006836, 25.183380126953125, 26.091869354248047, 27.000356674194336, 27.908843994140625, 28.817333221435547, 29.725820541381836, 30.634307861328125, 31.542797088623047]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 10.0, 11.0, 6.0, 16.0, 18.0, 20.0, 16.0, 20.0, 23.0, 41.0, 27.0, 26.0, 32.0, 32.0, 31.0, 40.0, 31.0, 25.0, 34.0, 41.0, 33.0, 26.0, 45.0, 32.0, 30.0, 19.0, 35.0, 36.0, 25.0, 19.0, 22.0, 19.0, 16.0, 16.0, 17.0, 13.0, 8.0, 13.0, 7.0, 3.0, 8.0, 8.0, 10.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.916015625, -3.789825439453125, -3.66363525390625, -3.537445068359375, -3.4112548828125, -3.285064697265625, -3.15887451171875, -3.032684326171875, -2.906494140625, -2.780303955078125, -2.65411376953125, -2.527923583984375, -2.4017333984375, -2.275543212890625, -2.14935302734375, -2.023162841796875, -1.89697265625, -1.770782470703125, -1.64459228515625, -1.518402099609375, -1.3922119140625, -1.266021728515625, -1.13983154296875, -1.013641357421875, -0.887451171875, -0.761260986328125, -0.63507080078125, -0.508880615234375, -0.3826904296875, -0.256500244140625, -0.13031005859375, -0.004119873046875, 0.1220703125, 0.248260498046875, 0.37445068359375, 0.500640869140625, 0.6268310546875, 0.753021240234375, 0.87921142578125, 1.005401611328125, 1.131591796875, 1.257781982421875, 1.38397216796875, 1.510162353515625, 1.6363525390625, 1.762542724609375, 1.88873291015625, 2.014923095703125, 2.14111328125, 2.267303466796875, 2.39349365234375, 2.519683837890625, 2.6458740234375, 2.772064208984375, 2.89825439453125, 3.024444580078125, 3.150634765625, 3.276824951171875, 3.40301513671875, 3.529205322265625, 3.6553955078125, 3.781585693359375, 3.90777587890625, 4.033966064453125, 4.16015625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 13.0, 16.0, 27.0, 36.0, 52.0, 80.0, 105.0, 173.0, 280.0, 478.0, 777.0, 1133.0, 1981.0, 3358.0, 5862.0, 11308.0, 24501.0, 63266.0, 194641.0, 399811.0, 216300.0, 70448.0, 26713.0, 11955.0, 6405.0, 3475.0, 2097.0, 1169.0, 753.0, 483.0, 278.0, 194.0, 130.0, 67.0, 69.0, 28.0, 26.0, 11.0, 7.0, 15.0, 6.0, 1.0, 8.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4836578369140625, -1.435089111328125, -1.3865203857421875, -1.33795166015625, -1.2893829345703125, -1.240814208984375, -1.1922454833984375, -1.1436767578125, -1.0951080322265625, -1.046539306640625, -0.9979705810546875, -0.94940185546875, -0.9008331298828125, -0.852264404296875, -0.8036956787109375, -0.755126953125, -0.7065582275390625, -0.657989501953125, -0.6094207763671875, -0.56085205078125, -0.5122833251953125, -0.463714599609375, -0.4151458740234375, -0.3665771484375, -0.3180084228515625, -0.269439697265625, -0.2208709716796875, -0.17230224609375, -0.1237335205078125, -0.075164794921875, -0.0265960693359375, 0.02197265625, 0.0705413818359375, 0.119110107421875, 0.1676788330078125, 0.21624755859375, 0.2648162841796875, 0.313385009765625, 0.3619537353515625, 0.4105224609375, 0.4590911865234375, 0.507659912109375, 0.5562286376953125, 0.60479736328125, 0.6533660888671875, 0.701934814453125, 0.7505035400390625, 0.799072265625, 0.8476409912109375, 0.896209716796875, 0.9447784423828125, 0.99334716796875, 1.0419158935546875, 1.090484619140625, 1.1390533447265625, 1.1876220703125, 1.2361907958984375, 1.284759521484375, 1.3333282470703125, 1.38189697265625, 1.4304656982421875, 1.479034423828125, 1.5276031494140625, 1.576171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 5.0, 3.0, 5.0, 13.0, 9.0, 10.0, 17.0, 18.0, 21.0, 25.0, 31.0, 20.0, 16.0, 33.0, 33.0, 34.0, 33.0, 31.0, 45.0, 36.0, 1070.0, 58.0, 41.0, 34.0, 33.0, 45.0, 28.0, 31.0, 31.0, 27.0, 23.0, 23.0, 20.0, 24.0, 22.0, 16.0, 9.0, 15.0, 7.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.203125, -3.100189208984375, -2.99725341796875, -2.894317626953125, -2.7913818359375, -2.688446044921875, -2.58551025390625, -2.482574462890625, -2.379638671875, -2.276702880859375, -2.17376708984375, -2.070831298828125, -1.9678955078125, -1.864959716796875, -1.76202392578125, -1.659088134765625, -1.55615234375, -1.453216552734375, -1.35028076171875, -1.247344970703125, -1.1444091796875, -1.041473388671875, -0.93853759765625, -0.835601806640625, -0.732666015625, -0.629730224609375, -0.52679443359375, -0.423858642578125, -0.3209228515625, -0.217987060546875, -0.11505126953125, -0.012115478515625, 0.0908203125, 0.193756103515625, 0.29669189453125, 0.399627685546875, 0.5025634765625, 0.605499267578125, 0.70843505859375, 0.811370849609375, 0.914306640625, 1.017242431640625, 1.12017822265625, 1.223114013671875, 1.3260498046875, 1.428985595703125, 1.53192138671875, 1.634857177734375, 1.73779296875, 1.840728759765625, 1.94366455078125, 2.046600341796875, 2.1495361328125, 2.252471923828125, 2.35540771484375, 2.458343505859375, 2.561279296875, 2.664215087890625, 2.76715087890625, 2.870086669921875, 2.9730224609375, 3.075958251953125, 3.17889404296875, 3.281829833984375, 3.384765625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 21.0, 24.0, 24.0, 41.0, 57.0, 91.0, 124.0, 206.0, 302.0, 473.0, 794.0, 1431.0, 2367.0, 4579.0, 9675.0, 26923.0, 106849.0, 1007877.0, 792547.0, 97825.0, 25426.0, 9329.0, 4370.0, 2316.0, 1316.0, 775.0, 433.0, 316.0, 203.0, 141.0, 83.0, 53.0, 41.0, 25.0, 18.0, 15.0, 9.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2666015625, -1.2257080078125, -1.184814453125, -1.1439208984375, -1.10302734375, -1.0621337890625, -1.021240234375, -0.9803466796875, -0.939453125, -0.8985595703125, -0.857666015625, -0.8167724609375, -0.77587890625, -0.7349853515625, -0.694091796875, -0.6531982421875, -0.6123046875, -0.5714111328125, -0.530517578125, -0.4896240234375, -0.44873046875, -0.4078369140625, -0.366943359375, -0.3260498046875, -0.28515625, -0.2442626953125, -0.203369140625, -0.1624755859375, -0.12158203125, -0.0806884765625, -0.039794921875, 0.0010986328125, 0.0419921875, 0.0828857421875, 0.123779296875, 0.1646728515625, 0.20556640625, 0.2464599609375, 0.287353515625, 0.3282470703125, 0.369140625, 0.4100341796875, 0.450927734375, 0.4918212890625, 0.53271484375, 0.5736083984375, 0.614501953125, 0.6553955078125, 0.6962890625, 0.7371826171875, 0.778076171875, 0.8189697265625, 0.85986328125, 0.9007568359375, 0.941650390625, 0.9825439453125, 1.0234375, 1.0643310546875, 1.105224609375, 1.1461181640625, 1.18701171875, 1.2279052734375, 1.268798828125, 1.3096923828125, 1.3505859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 16.0, 16.0, 37.0, 34.0, 70.0, 132.0, 129.0, 163.0, 125.0, 85.0, 44.0, 31.0, 19.0, 13.0, 17.0, 7.0, 10.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.2460041046142578, -0.23834609985351562, -0.23068809509277344, -0.22303009033203125, -0.21537208557128906, -0.20771408081054688, -0.2000560760498047, -0.1923980712890625, -0.1847400665283203, -0.17708206176757812, -0.16942405700683594, -0.16176605224609375, -0.15410804748535156, -0.14645004272460938, -0.1387920379638672, -0.131134033203125, -0.12347602844238281, -0.11581802368164062, -0.10816001892089844, -0.10050201416015625, -0.09284400939941406, -0.08518600463867188, -0.07752799987792969, -0.0698699951171875, -0.06221199035644531, -0.054553985595703125, -0.04689598083496094, -0.03923797607421875, -0.03157997131347656, -0.023921966552734375, -0.016263961791992188, -0.00860595703125, -0.0009479522705078125, 0.006710052490234375, 0.014368057250976562, 0.02202606201171875, 0.029684066772460938, 0.037342071533203125, 0.04500007629394531, 0.0526580810546875, 0.06031608581542969, 0.06797409057617188, 0.07563209533691406, 0.08329010009765625, 0.09094810485839844, 0.09860610961914062, 0.10626411437988281, 0.113922119140625, 0.12158012390136719, 0.12923812866210938, 0.13689613342285156, 0.14455413818359375, 0.15221214294433594, 0.15987014770507812, 0.1675281524658203, 0.1751861572265625, 0.1828441619873047, 0.19050216674804688, 0.19816017150878906, 0.20581817626953125, 0.21347618103027344, 0.22113418579101562, 0.2287921905517578, 0.2364501953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 3.0, 4.0, 5.0, 12.0, 13.0, 22.0, 26.0, 52.0, 88.0, 204.0, 861.0, 920289.0, 125944.0, 621.0, 194.0, 66.0, 43.0, 26.0, 27.0, 8.0, 10.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.255859375, -5.07421875, -4.892578125, -4.7109375, -4.529296875, -4.34765625, -4.166015625, -3.984375, -3.802734375, -3.62109375, -3.439453125, -3.2578125, -3.076171875, -2.89453125, -2.712890625, -2.53125, -2.349609375, -2.16796875, -1.986328125, -1.8046875, -1.623046875, -1.44140625, -1.259765625, -1.078125, -0.896484375, -0.71484375, -0.533203125, -0.3515625, -0.169921875, 0.01171875, 0.193359375, 0.375, 0.556640625, 0.73828125, 0.919921875, 1.1015625, 1.283203125, 1.46484375, 1.646484375, 1.828125, 2.009765625, 2.19140625, 2.373046875, 2.5546875, 2.736328125, 2.91796875, 3.099609375, 3.28125, 3.462890625, 3.64453125, 3.826171875, 4.0078125, 4.189453125, 4.37109375, 4.552734375, 4.734375, 4.916015625, 5.09765625, 5.279296875, 5.4609375, 5.642578125, 5.82421875, 6.005859375, 6.1875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 18.0, 48.0, 194.0, 406.0, 235.0, 92.0, 13.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0157800912857056, -0.993004560470581, -0.9702289700508118, -0.9474534392356873, -0.924677848815918, -0.9019023180007935, -0.879126787185669, -0.8563511967658997, -0.8335756659507751, -0.8108001351356506, -0.7880245447158813, -0.7652490139007568, -0.7424734234809875, -0.719697892665863, -0.6969223022460938, -0.6741467714309692, -0.6513712406158447, -0.6285957098007202, -0.6058201193809509, -0.5830445885658264, -0.5602689981460571, -0.5374934673309326, -0.5147179365158081, -0.4919423460960388, -0.46916675567626953, -0.44639119505882263, -0.42361563444137573, -0.4008401036262512, -0.3780645430088043, -0.3552889823913574, -0.3325134217739105, -0.3097378611564636, -0.2869623005390167, -0.2641867399215698, -0.24141119420528412, -0.21863563358783722, -0.1958600878715515, -0.17308452725410461, -0.15030896663665771, -0.127533420920372, -0.10475786030292511, -0.08198230713605881, -0.059206750243902206, -0.036431193351745605, -0.013655640184879303, 0.009119912981987, 0.0318954735994339, 0.054671019315719604, 0.0774465799331665, 0.1002221331000328, 0.12299768626689911, 0.145773246884346, 0.1685487926006317, 0.1913243532180786, 0.2140999138355255, 0.23687545955181122, 0.2596510052680969, 0.2824265658855438, 0.3052021265029907, 0.32797765731811523, 0.35075321793556213, 0.37352877855300903, 0.39630433917045593, 0.41907989978790283, 0.44185546040534973]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 5.0, 10.0, 8.0, 12.0, 10.0, 12.0, 12.0, 20.0, 19.0, 29.0, 32.0, 24.0, 44.0, 34.0, 37.0, 40.0, 35.0, 50.0, 34.0, 27.0, 36.0, 31.0, 44.0, 31.0, 44.0, 30.0, 30.0, 42.0, 28.0, 33.0, 25.0, 16.0, 18.0, 11.0, 10.0, 9.0, 16.0, 7.0, 6.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15076392889022827, -0.1457889974117279, -0.14081406593322754, -0.13583914935588837, -0.130864217877388, -0.12588928639888763, -0.12091436237096786, -0.1159394383430481, -0.11096450686454773, -0.10598957538604736, -0.1010146513581276, -0.09603972733020782, -0.09106479585170746, -0.08608986437320709, -0.08111494034528732, -0.07614001631736755, -0.07116508483886719, -0.06619015336036682, -0.06121522933244705, -0.056240301579236984, -0.051265373826026917, -0.04629044607281685, -0.04131551831960678, -0.03634059056639671, -0.031365662813186646, -0.026390735059976578, -0.02141580730676651, -0.016440879553556442, -0.011465951800346375, -0.006491024047136307, -0.001516096293926239, 0.0034588314592838287, 0.008433759212493896, 0.013408686965703964, 0.018383614718914032, 0.0233585424721241, 0.028333470225334167, 0.033308397978544235, 0.0382833257317543, 0.04325825348496437, 0.04823318123817444, 0.053208108991384506, 0.058183036744594574, 0.06315796077251434, 0.06813289225101471, 0.07310782372951508, 0.07808274775743484, 0.08305767178535461, 0.08803260326385498, 0.09300753474235535, 0.09798245877027512, 0.10295738279819489, 0.10793231427669525, 0.11290724575519562, 0.11788216978311539, 0.12285709381103516, 0.12783202528953552, 0.1328069567680359, 0.13778188824653625, 0.14275680482387543, 0.1477317363023758, 0.15270666778087616, 0.15768158435821533, 0.1626565158367157, 0.16763144731521606]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 15.0, 7.0, 6.0, 12.0, 18.0, 15.0, 20.0, 18.0, 23.0, 20.0, 23.0, 38.0, 25.0, 28.0, 46.0, 33.0, 32.0, 37.0, 41.0, 39.0, 32.0, 43.0, 38.0, 30.0, 39.0, 27.0, 29.0, 38.0, 25.0, 24.0, 26.0, 11.0, 20.0, 14.0, 19.0, 8.0, 14.0, 14.0, 8.0, 5.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.39453125, -4.26141357421875, -4.1282958984375, -3.99517822265625, -3.862060546875, -3.72894287109375, -3.5958251953125, -3.46270751953125, -3.32958984375, -3.19647216796875, -3.0633544921875, -2.93023681640625, -2.797119140625, -2.66400146484375, -2.5308837890625, -2.39776611328125, -2.2646484375, -2.13153076171875, -1.9984130859375, -1.86529541015625, -1.732177734375, -1.59906005859375, -1.4659423828125, -1.33282470703125, -1.19970703125, -1.06658935546875, -0.9334716796875, -0.80035400390625, -0.667236328125, -0.53411865234375, -0.4010009765625, -0.26788330078125, -0.134765625, -0.00164794921875, 0.1314697265625, 0.26458740234375, 0.397705078125, 0.53082275390625, 0.6639404296875, 0.79705810546875, 0.93017578125, 1.06329345703125, 1.1964111328125, 1.32952880859375, 1.462646484375, 1.59576416015625, 1.7288818359375, 1.86199951171875, 1.9951171875, 2.12823486328125, 2.2613525390625, 2.39447021484375, 2.527587890625, 2.66070556640625, 2.7938232421875, 2.92694091796875, 3.06005859375, 3.19317626953125, 3.3262939453125, 3.45941162109375, 3.592529296875, 3.72564697265625, 3.8587646484375, 3.99188232421875, 4.125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 14.0, 12.0, 23.0, 27.0, 45.0, 53.0, 72.0, 117.0, 167.0, 260.0, 357.0, 564.0, 844.0, 1325.0, 2120.0, 3445.0, 5801.0, 9996.0, 18580.0, 37643.0, 98570.0, 334095.0, 347311.0, 103508.0, 38594.0, 19298.0, 10296.0, 5747.0, 3451.0, 2156.0, 1423.0, 900.0, 577.0, 373.0, 225.0, 161.0, 117.0, 89.0, 55.0, 41.0, 33.0, 18.0, 19.0, 12.0, 14.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.724609375, -5.52734375, -5.330078125, -5.1328125, -4.935546875, -4.73828125, -4.541015625, -4.34375, -4.146484375, -3.94921875, -3.751953125, -3.5546875, -3.357421875, -3.16015625, -2.962890625, -2.765625, -2.568359375, -2.37109375, -2.173828125, -1.9765625, -1.779296875, -1.58203125, -1.384765625, -1.1875, -0.990234375, -0.79296875, -0.595703125, -0.3984375, -0.201171875, -0.00390625, 0.193359375, 0.390625, 0.587890625, 0.78515625, 0.982421875, 1.1796875, 1.376953125, 1.57421875, 1.771484375, 1.96875, 2.166015625, 2.36328125, 2.560546875, 2.7578125, 2.955078125, 3.15234375, 3.349609375, 3.546875, 3.744140625, 3.94140625, 4.138671875, 4.3359375, 4.533203125, 4.73046875, 4.927734375, 5.125, 5.322265625, 5.51953125, 5.716796875, 5.9140625, 6.111328125, 6.30859375, 6.505859375, 6.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 10.0, 14.0, 17.0, 18.0, 22.0, 22.0, 23.0, 31.0, 41.0, 30.0, 46.0, 57.0, 64.0, 105.0, 247.0, 1578.0, 222.0, 81.0, 80.0, 51.0, 29.0, 42.0, 38.0, 25.0, 30.0, 23.0, 24.0, 11.0, 7.0, 14.0, 7.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-21.46875, -20.9383544921875, -20.407958984375, -19.8775634765625, -19.34716796875, -18.8167724609375, -18.286376953125, -17.7559814453125, -17.2255859375, -16.6951904296875, -16.164794921875, -15.6343994140625, -15.10400390625, -14.5736083984375, -14.043212890625, -13.5128173828125, -12.982421875, -12.4520263671875, -11.921630859375, -11.3912353515625, -10.86083984375, -10.3304443359375, -9.800048828125, -9.2696533203125, -8.7392578125, -8.2088623046875, -7.678466796875, -7.1480712890625, -6.61767578125, -6.0872802734375, -5.556884765625, -5.0264892578125, -4.49609375, -3.9656982421875, -3.435302734375, -2.9049072265625, -2.37451171875, -1.8441162109375, -1.313720703125, -0.7833251953125, -0.2529296875, 0.2774658203125, 0.807861328125, 1.3382568359375, 1.86865234375, 2.3990478515625, 2.929443359375, 3.4598388671875, 3.990234375, 4.5206298828125, 5.051025390625, 5.5814208984375, 6.11181640625, 6.6422119140625, 7.172607421875, 7.7030029296875, 8.2333984375, 8.7637939453125, 9.294189453125, 9.8245849609375, 10.35498046875, 10.8853759765625, 11.415771484375, 11.9461669921875, 12.4765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 10.0, 7.0, 8.0, 14.0, 17.0, 21.0, 23.0, 39.0, 48.0, 73.0, 84.0, 123.0, 173.0, 273.0, 550.0, 1975.0, 11909.0, 239623.0, 2843056.0, 40715.0, 4712.0, 1093.0, 420.0, 207.0, 153.0, 86.0, 74.0, 57.0, 44.0, 34.0, 27.0, 23.0, 9.0, 9.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.568115234375, -23.69873046875, -22.829345703125, -21.9599609375, -21.090576171875, -20.22119140625, -19.351806640625, -18.482421875, -17.613037109375, -16.74365234375, -15.874267578125, -15.0048828125, -14.135498046875, -13.26611328125, -12.396728515625, -11.52734375, -10.657958984375, -9.78857421875, -8.919189453125, -8.0498046875, -7.180419921875, -6.31103515625, -5.441650390625, -4.572265625, -3.702880859375, -2.83349609375, -1.964111328125, -1.0947265625, -0.225341796875, 0.64404296875, 1.513427734375, 2.3828125, 3.252197265625, 4.12158203125, 4.990966796875, 5.8603515625, 6.729736328125, 7.59912109375, 8.468505859375, 9.337890625, 10.207275390625, 11.07666015625, 11.946044921875, 12.8154296875, 13.684814453125, 14.55419921875, 15.423583984375, 16.29296875, 17.162353515625, 18.03173828125, 18.901123046875, 19.7705078125, 20.639892578125, 21.50927734375, 22.378662109375, 23.248046875, 24.117431640625, 24.98681640625, 25.856201171875, 26.7255859375, 27.594970703125, 28.46435546875, 29.333740234375, 30.203125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 80.0, 342.0, 443.0, 127.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-144.48536682128906, -141.76321411132812, -139.04104614257812, -136.3188934326172, -133.59674072265625, -130.87457275390625, -128.1524200439453, -125.43025970458984, -122.70809936523438, -119.9859390258789, -117.26378631591797, -114.5416259765625, -111.81946563720703, -109.09730529785156, -106.37515258789062, -103.65299224853516, -100.93083190917969, -98.20867156982422, -95.48651885986328, -92.76435852050781, -90.04219818115234, -87.32003784179688, -84.59788513183594, -81.87572479248047, -79.15357208251953, -76.43141174316406, -73.70925903320312, -70.98709869384766, -68.26493835449219, -65.54277801513672, -62.82062530517578, -60.09846496582031, -57.37630081176758, -54.654144287109375, -51.931983947753906, -49.2098274230957, -46.487667083740234, -43.76551055908203, -41.04335021972656, -38.32119369506836, -35.599037170410156, -32.87688064575195, -30.154720306396484, -27.43256378173828, -24.710403442382812, -21.98824691772461, -19.266088485717773, -16.543930053710938, -13.821769714355469, -11.099611282348633, -8.377452850341797, -5.655295372009277, -2.9331369400024414, -0.21097850799560547, 2.511178970336914, 5.23333740234375, 7.955495834350586, 10.677654266357422, 13.399812698364258, 16.121971130371094, 18.844127655029297, 21.566287994384766, 24.28844451904297, 27.010602951049805, 29.73276138305664]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 11.0, 9.0, 11.0, 12.0, 16.0, 9.0, 15.0, 14.0, 19.0, 23.0, 27.0, 27.0, 32.0, 37.0, 30.0, 27.0, 33.0, 35.0, 26.0, 39.0, 37.0, 33.0, 43.0, 31.0, 51.0, 45.0, 35.0, 31.0, 21.0, 23.0, 24.0, 33.0, 20.0, 15.0, 24.0, 16.0, 11.0, 6.0, 9.0, 6.0, 8.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.05522918701172, -30.963394165039062, -29.87156105041504, -28.779726028442383, -27.68789291381836, -26.596057891845703, -25.504222869873047, -24.412389755249023, -23.320556640625, -22.228721618652344, -21.13688850402832, -20.045053482055664, -18.95322036743164, -17.861385345458984, -16.769550323486328, -15.677717208862305, -14.585882186889648, -13.494048118591309, -12.402214050292969, -11.310379028320312, -10.218545913696289, -9.126710891723633, -8.034876823425293, -6.943042755126953, -5.851208686828613, -4.759374618530273, -3.6675403118133545, -2.5757060050964355, -1.4838719367980957, -0.39203786849975586, 0.6997966766357422, 1.791630744934082, 2.883464813232422, 3.9752988815307617, 5.067132949829102, 6.1589674949646, 7.2508015632629395, 8.342636108398438, 9.434470176696777, 10.526304244995117, 11.618138313293457, 12.709972381591797, 13.801806449890137, 14.893640518188477, 15.985475540161133, 17.077308654785156, 18.169143676757812, 19.26097869873047, 20.352811813354492, 21.44464683532715, 22.536479949951172, 23.628314971923828, 24.72014808654785, 25.811983108520508, 26.90381622314453, 27.995651245117188, 29.087486267089844, 30.1793212890625, 31.271154403686523, 32.36298751831055, 33.4548225402832, 34.54665756225586, 35.638492584228516, 36.730323791503906, 37.82215881347656]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 10.0, 13.0, 6.0, 15.0, 15.0, 15.0, 19.0, 17.0, 20.0, 26.0, 31.0, 18.0, 32.0, 40.0, 28.0, 34.0, 32.0, 43.0, 34.0, 47.0, 44.0, 44.0, 35.0, 37.0, 22.0, 25.0, 25.0, 29.0, 21.0, 28.0, 18.0, 25.0, 15.0, 23.0, 14.0, 7.0, 18.0, 15.0, 11.0, 5.0, 10.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.19140625, -4.05609130859375, -3.9207763671875, -3.78546142578125, -3.650146484375, -3.51483154296875, -3.3795166015625, -3.24420166015625, -3.10888671875, -2.97357177734375, -2.8382568359375, -2.70294189453125, -2.567626953125, -2.43231201171875, -2.2969970703125, -2.16168212890625, -2.0263671875, -1.89105224609375, -1.7557373046875, -1.62042236328125, -1.485107421875, -1.34979248046875, -1.2144775390625, -1.07916259765625, -0.94384765625, -0.80853271484375, -0.6732177734375, -0.53790283203125, -0.402587890625, -0.26727294921875, -0.1319580078125, 0.00335693359375, 0.138671875, 0.27398681640625, 0.4093017578125, 0.54461669921875, 0.679931640625, 0.81524658203125, 0.9505615234375, 1.08587646484375, 1.22119140625, 1.35650634765625, 1.4918212890625, 1.62713623046875, 1.762451171875, 1.89776611328125, 2.0330810546875, 2.16839599609375, 2.3037109375, 2.43902587890625, 2.5743408203125, 2.70965576171875, 2.844970703125, 2.98028564453125, 3.1156005859375, 3.25091552734375, 3.38623046875, 3.52154541015625, 3.6568603515625, 3.79217529296875, 3.927490234375, 4.06280517578125, 4.1981201171875, 4.33343505859375, 4.46875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 5.0, 1.0, 13.0, 14.0, 15.0, 39.0, 40.0, 69.0, 111.0, 166.0, 278.0, 462.0, 895.0, 1545.0, 2955.0, 6149.0, 14220.0, 38239.0, 150432.0, 840805.0, 2214209.0, 731753.0, 131984.0, 35066.0, 13056.0, 5774.0, 2679.0, 1372.0, 786.0, 418.0, 280.0, 163.0, 95.0, 58.0, 49.0, 32.0, 15.0, 10.0, 6.0, 14.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.25, -7.995849609375, -7.74169921875, -7.487548828125, -7.2333984375, -6.979248046875, -6.72509765625, -6.470947265625, -6.216796875, -5.962646484375, -5.70849609375, -5.454345703125, -5.2001953125, -4.946044921875, -4.69189453125, -4.437744140625, -4.18359375, -3.929443359375, -3.67529296875, -3.421142578125, -3.1669921875, -2.912841796875, -2.65869140625, -2.404541015625, -2.150390625, -1.896240234375, -1.64208984375, -1.387939453125, -1.1337890625, -0.879638671875, -0.62548828125, -0.371337890625, -0.1171875, 0.136962890625, 0.39111328125, 0.645263671875, 0.8994140625, 1.153564453125, 1.40771484375, 1.661865234375, 1.916015625, 2.170166015625, 2.42431640625, 2.678466796875, 2.9326171875, 3.186767578125, 3.44091796875, 3.695068359375, 3.94921875, 4.203369140625, 4.45751953125, 4.711669921875, 4.9658203125, 5.219970703125, 5.47412109375, 5.728271484375, 5.982421875, 6.236572265625, 6.49072265625, 6.744873046875, 6.9990234375, 7.253173828125, 7.50732421875, 7.761474609375, 8.015625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 13.0, 17.0, 23.0, 17.0, 34.0, 31.0, 38.0, 55.0, 93.0, 126.0, 181.0, 261.0, 378.0, 488.0, 562.0, 530.0, 387.0, 228.0, 192.0, 115.0, 79.0, 55.0, 47.0, 35.0, 15.0, 8.0, 18.0, 5.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.296875, -10.0361328125, -9.775390625, -9.5146484375, -9.25390625, -8.9931640625, -8.732421875, -8.4716796875, -8.2109375, -7.9501953125, -7.689453125, -7.4287109375, -7.16796875, -6.9072265625, -6.646484375, -6.3857421875, -6.125, -5.8642578125, -5.603515625, -5.3427734375, -5.08203125, -4.8212890625, -4.560546875, -4.2998046875, -4.0390625, -3.7783203125, -3.517578125, -3.2568359375, -2.99609375, -2.7353515625, -2.474609375, -2.2138671875, -1.953125, -1.6923828125, -1.431640625, -1.1708984375, -0.91015625, -0.6494140625, -0.388671875, -0.1279296875, 0.1328125, 0.3935546875, 0.654296875, 0.9150390625, 1.17578125, 1.4365234375, 1.697265625, 1.9580078125, 2.21875, 2.4794921875, 2.740234375, 3.0009765625, 3.26171875, 3.5224609375, 3.783203125, 4.0439453125, 4.3046875, 4.5654296875, 4.826171875, 5.0869140625, 5.34765625, 5.6083984375, 5.869140625, 6.1298828125, 6.390625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 16.0, 21.0, 20.0, 25.0, 40.0, 73.0, 112.0, 167.0, 358.0, 714.0, 1991.0, 8135.0, 69044.0, 2528539.0, 1526940.0, 48284.0, 6660.0, 1640.0, 641.0, 299.0, 183.0, 126.0, 76.0, 52.0, 41.0, 22.0, 18.0, 9.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.150634765625, -26.39501953125, -25.639404296875, -24.8837890625, -24.128173828125, -23.37255859375, -22.616943359375, -21.861328125, -21.105712890625, -20.35009765625, -19.594482421875, -18.8388671875, -18.083251953125, -17.32763671875, -16.572021484375, -15.81640625, -15.060791015625, -14.30517578125, -13.549560546875, -12.7939453125, -12.038330078125, -11.28271484375, -10.527099609375, -9.771484375, -9.015869140625, -8.26025390625, -7.504638671875, -6.7490234375, -5.993408203125, -5.23779296875, -4.482177734375, -3.7265625, -2.970947265625, -2.21533203125, -1.459716796875, -0.7041015625, 0.051513671875, 0.80712890625, 1.562744140625, 2.318359375, 3.073974609375, 3.82958984375, 4.585205078125, 5.3408203125, 6.096435546875, 6.85205078125, 7.607666015625, 8.36328125, 9.118896484375, 9.87451171875, 10.630126953125, 11.3857421875, 12.141357421875, 12.89697265625, 13.652587890625, 14.408203125, 15.163818359375, 15.91943359375, 16.675048828125, 17.4306640625, 18.186279296875, 18.94189453125, 19.697509765625, 20.453125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [3.0, 4.0, 11.0, 47.0, 87.0, 203.0, 249.0, 236.0, 121.0, 36.0, 15.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.981788635253906, -14.481010437011719, -11.980232238769531, -9.479454040527344, -6.978675842285156, -4.477897644042969, -1.9771194458007812, 0.5236587524414062, 3.0244369506835938, 5.525215148925781, 8.025993347167969, 10.526771545410156, 13.027549743652344, 15.528327941894531, 18.02910614013672, 20.529884338378906, 23.030662536621094, 25.53144073486328, 28.03221893310547, 30.532997131347656, 33.033775329589844, 35.53455352783203, 38.03533172607422, 40.536109924316406, 43.036888122558594, 45.53766632080078, 48.03844451904297, 50.539222717285156, 53.040000915527344, 55.54077911376953, 58.04155731201172, 60.542335510253906, 63.043121337890625, 65.54389953613281, 68.044677734375, 70.54545593261719, 73.04623413085938, 75.54701232910156, 78.04779052734375, 80.54856872558594, 83.04934692382812, 85.55012512207031, 88.0509033203125, 90.55168151855469, 93.05245971679688, 95.55323791503906, 98.05401611328125, 100.55479431152344, 103.05557250976562, 105.55635070800781, 108.05712890625, 110.55790710449219, 113.05868530273438, 115.55946350097656, 118.06024169921875, 120.56101989746094, 123.06179809570312, 125.56257629394531, 128.0633544921875, 130.5641326904297, 133.06491088867188, 135.56568908691406, 138.06646728515625, 140.56724548339844, 143.06802368164062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 5.0, 10.0, 7.0, 16.0, 18.0, 12.0, 21.0, 23.0, 24.0, 24.0, 31.0, 26.0, 37.0, 36.0, 30.0, 43.0, 33.0, 39.0, 42.0, 44.0, 50.0, 33.0, 47.0, 44.0, 29.0, 39.0, 43.0, 19.0, 30.0, 25.0, 13.0, 20.0, 11.0, 14.0, 13.0, 10.0, 4.0, 8.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.143146514892578, -25.287883758544922, -24.4326229095459, -23.577360153198242, -22.72209930419922, -21.866836547851562, -21.011573791503906, -20.15631103515625, -19.301050186157227, -18.44578742980957, -17.590526580810547, -16.73526382446289, -15.88000202178955, -15.024740219116211, -14.169477462768555, -13.314215660095215, -12.458953857421875, -11.603692054748535, -10.748430252075195, -9.893167495727539, -9.0379056930542, -8.18264389038086, -7.327381610870361, -6.472119331359863, -5.616857528686523, -4.761595726013184, -3.9063334465026855, -3.0510714054107666, -2.1958093643188477, -1.3405475616455078, -0.48528528213500977, 0.3699769973754883, 1.2252388000488281, 2.080500841140747, 2.935762882232666, 3.791024923324585, 4.646286964416504, 5.501548767089844, 6.356811046600342, 7.21207332611084, 8.06733512878418, 8.92259693145752, 9.77785873413086, 10.633121490478516, 11.488383293151855, 12.343645095825195, 13.198907852172852, 14.054169654846191, 14.909431457519531, 15.764693260192871, 16.61995506286621, 17.475217819213867, 18.33047866821289, 19.185741424560547, 20.041004180908203, 20.89626693725586, 21.751527786254883, 22.60679054260254, 23.462051391601562, 24.31731414794922, 25.172576904296875, 26.0278377532959, 26.883100509643555, 27.738361358642578, 28.593624114990234]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 2.0, 7.0, 10.0, 10.0, 10.0, 12.0, 16.0, 17.0, 26.0, 25.0, 28.0, 31.0, 37.0, 38.0, 37.0, 35.0, 33.0, 41.0, 42.0, 50.0, 44.0, 32.0, 49.0, 44.0, 32.0, 35.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 12.0, 14.0, 11.0, 8.0, 16.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.71417236328125, -4.5611572265625, -4.40814208984375, -4.255126953125, -4.10211181640625, -3.9490966796875, -3.79608154296875, -3.64306640625, -3.49005126953125, -3.3370361328125, -3.18402099609375, -3.031005859375, -2.87799072265625, -2.7249755859375, -2.57196044921875, -2.4189453125, -2.26593017578125, -2.1129150390625, -1.95989990234375, -1.806884765625, -1.65386962890625, -1.5008544921875, -1.34783935546875, -1.19482421875, -1.04180908203125, -0.8887939453125, -0.73577880859375, -0.582763671875, -0.42974853515625, -0.2767333984375, -0.12371826171875, 0.029296875, 0.18231201171875, 0.3353271484375, 0.48834228515625, 0.641357421875, 0.79437255859375, 0.9473876953125, 1.10040283203125, 1.25341796875, 1.40643310546875, 1.5594482421875, 1.71246337890625, 1.865478515625, 2.01849365234375, 2.1715087890625, 2.32452392578125, 2.4775390625, 2.63055419921875, 2.7835693359375, 2.93658447265625, 3.089599609375, 3.24261474609375, 3.3956298828125, 3.54864501953125, 3.70166015625, 3.85467529296875, 4.0076904296875, 4.16070556640625, 4.313720703125, 4.46673583984375, 4.6197509765625, 4.77276611328125, 4.92578125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 11.0, 13.0, 14.0, 32.0, 39.0, 43.0, 53.0, 98.0, 142.0, 230.0, 273.0, 396.0, 613.0, 1063.0, 1939.0, 4362.0, 13254.0, 62889.0, 353374.0, 480754.0, 98415.0, 19180.0, 5549.0, 2326.0, 1234.0, 713.0, 477.0, 316.0, 230.0, 157.0, 106.0, 71.0, 48.0, 32.0, 25.0, 20.0, 14.0, 11.0, 9.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7644195556640625, -1.701690673828125, -1.6389617919921875, -1.57623291015625, -1.5135040283203125, -1.450775146484375, -1.3880462646484375, -1.3253173828125, -1.2625885009765625, -1.199859619140625, -1.1371307373046875, -1.07440185546875, -1.0116729736328125, -0.948944091796875, -0.8862152099609375, -0.823486328125, -0.7607574462890625, -0.698028564453125, -0.6352996826171875, -0.57257080078125, -0.5098419189453125, -0.447113037109375, -0.3843841552734375, -0.3216552734375, -0.2589263916015625, -0.196197509765625, -0.1334686279296875, -0.07073974609375, -0.0080108642578125, 0.054718017578125, 0.1174468994140625, 0.18017578125, 0.2429046630859375, 0.305633544921875, 0.3683624267578125, 0.43109130859375, 0.4938201904296875, 0.556549072265625, 0.6192779541015625, 0.6820068359375, 0.7447357177734375, 0.807464599609375, 0.8701934814453125, 0.93292236328125, 0.9956512451171875, 1.058380126953125, 1.1211090087890625, 1.183837890625, 1.2465667724609375, 1.309295654296875, 1.3720245361328125, 1.43475341796875, 1.4974822998046875, 1.560211181640625, 1.6229400634765625, 1.6856689453125, 1.7483978271484375, 1.811126708984375, 1.8738555908203125, 1.93658447265625, 1.9993133544921875, 2.062042236328125, 2.1247711181640625, 2.1875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 14.0, 12.0, 13.0, 25.0, 22.0, 35.0, 28.0, 35.0, 33.0, 40.0, 45.0, 51.0, 70.0, 1083.0, 48.0, 50.0, 54.0, 50.0, 53.0, 33.0, 39.0, 35.0, 35.0, 27.0, 21.0, 18.0, 10.0, 9.0, 5.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3272705078125, -4.181884765625, -4.0364990234375, -3.89111328125, -3.7457275390625, -3.600341796875, -3.4549560546875, -3.3095703125, -3.1641845703125, -3.018798828125, -2.8734130859375, -2.72802734375, -2.5826416015625, -2.437255859375, -2.2918701171875, -2.146484375, -2.0010986328125, -1.855712890625, -1.7103271484375, -1.56494140625, -1.4195556640625, -1.274169921875, -1.1287841796875, -0.9833984375, -0.8380126953125, -0.692626953125, -0.5472412109375, -0.40185546875, -0.2564697265625, -0.111083984375, 0.0343017578125, 0.1796875, 0.3250732421875, 0.470458984375, 0.6158447265625, 0.76123046875, 0.9066162109375, 1.052001953125, 1.1973876953125, 1.3427734375, 1.4881591796875, 1.633544921875, 1.7789306640625, 1.92431640625, 2.0697021484375, 2.215087890625, 2.3604736328125, 2.505859375, 2.6512451171875, 2.796630859375, 2.9420166015625, 3.08740234375, 3.2327880859375, 3.378173828125, 3.5235595703125, 3.6689453125, 3.8143310546875, 3.959716796875, 4.1051025390625, 4.25048828125, 4.3958740234375, 4.541259765625, 4.6866455078125, 4.83203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 12.0, 20.0, 21.0, 37.0, 40.0, 54.0, 126.0, 155.0, 248.0, 417.0, 625.0, 1260.0, 2541.0, 6411.0, 21306.0, 100807.0, 1107769.0, 736292.0, 89291.0, 18951.0, 5684.0, 2306.0, 1158.0, 607.0, 345.0, 208.0, 137.0, 88.0, 51.0, 43.0, 20.0, 23.0, 23.0, 12.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2333984375, -1.1981201171875, -1.162841796875, -1.1275634765625, -1.09228515625, -1.0570068359375, -1.021728515625, -0.9864501953125, -0.951171875, -0.9158935546875, -0.880615234375, -0.8453369140625, -0.81005859375, -0.7747802734375, -0.739501953125, -0.7042236328125, -0.6689453125, -0.6336669921875, -0.598388671875, -0.5631103515625, -0.52783203125, -0.4925537109375, -0.457275390625, -0.4219970703125, -0.38671875, -0.3514404296875, -0.316162109375, -0.2808837890625, -0.24560546875, -0.2103271484375, -0.175048828125, -0.1397705078125, -0.1044921875, -0.0692138671875, -0.033935546875, 0.0013427734375, 0.03662109375, 0.0718994140625, 0.107177734375, 0.1424560546875, 0.177734375, 0.2130126953125, 0.248291015625, 0.2835693359375, 0.31884765625, 0.3541259765625, 0.389404296875, 0.4246826171875, 0.4599609375, 0.4952392578125, 0.530517578125, 0.5657958984375, 0.60107421875, 0.6363525390625, 0.671630859375, 0.7069091796875, 0.7421875, 0.7774658203125, 0.812744140625, 0.8480224609375, 0.88330078125, 0.9185791015625, 0.953857421875, 0.9891357421875, 1.0244140625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 2.0, 16.0, 18.0, 22.0, 32.0, 81.0, 109.0, 179.0, 191.0, 129.0, 78.0, 50.0, 26.0, 13.0, 11.0, 11.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.1526813507080078, -0.14776992797851562, -0.14285850524902344, -0.13794708251953125, -0.13303565979003906, -0.12812423706054688, -0.12321281433105469, -0.1183013916015625, -0.11338996887207031, -0.10847854614257812, -0.10356712341308594, -0.09865570068359375, -0.09374427795410156, -0.08883285522460938, -0.08392143249511719, -0.079010009765625, -0.07409858703613281, -0.06918716430664062, -0.06427574157714844, -0.05936431884765625, -0.05445289611816406, -0.049541473388671875, -0.04463005065917969, -0.0397186279296875, -0.03480720520019531, -0.029895782470703125, -0.024984359741210938, -0.02007293701171875, -0.015161514282226562, -0.010250091552734375, -0.0053386688232421875, -0.00042724609375, 0.0044841766357421875, 0.009395599365234375, 0.014307022094726562, 0.01921844482421875, 0.024129867553710938, 0.029041290283203125, 0.03395271301269531, 0.0388641357421875, 0.04377555847167969, 0.048686981201171875, 0.05359840393066406, 0.05850982666015625, 0.06342124938964844, 0.06833267211914062, 0.07324409484863281, 0.078155517578125, 0.08306694030761719, 0.08797836303710938, 0.09288978576660156, 0.09780120849609375, 0.10271263122558594, 0.10762405395507812, 0.11253547668457031, 0.1174468994140625, 0.12235832214355469, 0.12726974487304688, 0.13218116760253906, 0.13709259033203125, 0.14200401306152344, 0.14691543579101562, 0.1518268585205078, 0.15673828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 10.0, 6.0, 12.0, 35.0, 55.0, 104.0, 406.0, 22091.0, 1024665.0, 859.0, 143.0, 66.0, 34.0, 15.0, 14.0, 4.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0152587890625, -3.882080078125, -3.7489013671875, -3.61572265625, -3.4825439453125, -3.349365234375, -3.2161865234375, -3.0830078125, -2.9498291015625, -2.816650390625, -2.6834716796875, -2.55029296875, -2.4171142578125, -2.283935546875, -2.1507568359375, -2.017578125, -1.8843994140625, -1.751220703125, -1.6180419921875, -1.48486328125, -1.3516845703125, -1.218505859375, -1.0853271484375, -0.9521484375, -0.8189697265625, -0.685791015625, -0.5526123046875, -0.41943359375, -0.2862548828125, -0.153076171875, -0.0198974609375, 0.11328125, 0.2464599609375, 0.379638671875, 0.5128173828125, 0.64599609375, 0.7791748046875, 0.912353515625, 1.0455322265625, 1.1787109375, 1.3118896484375, 1.445068359375, 1.5782470703125, 1.71142578125, 1.8446044921875, 1.977783203125, 2.1109619140625, 2.244140625, 2.3773193359375, 2.510498046875, 2.6436767578125, 2.77685546875, 2.9100341796875, 3.043212890625, 3.1763916015625, 3.3095703125, 3.4427490234375, 3.575927734375, 3.7091064453125, 3.84228515625, 3.9754638671875, 4.108642578125, 4.2418212890625, 4.375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 38.0, 729.0, 248.0, 6.0], "bins": [-2.036968946456909, -2.0040080547332764, -1.9710474014282227, -1.9380865097045898, -1.9051257371902466, -1.8721649646759033, -1.83920419216156, -1.8062434196472168, -1.773282527923584, -1.7403217554092407, -1.7073609828948975, -1.6744000911712646, -1.6414393186569214, -1.6084785461425781, -1.5755177736282349, -1.5425570011138916, -1.5095962285995483, -1.476635456085205, -1.4436746835708618, -1.410713791847229, -1.3777530193328857, -1.3447922468185425, -1.3118314743041992, -1.278870701789856, -1.2459099292755127, -1.2129491567611694, -1.1799883842468262, -1.1470274925231934, -1.11406672000885, -1.0811059474945068, -1.0481451749801636, -1.0151844024658203, -0.9822235107421875, -0.9492627382278442, -0.9163019061088562, -0.8833411335945129, -0.8503803014755249, -0.8174195289611816, -0.7844587564468384, -0.7514979839324951, -0.7185371518135071, -0.6855763792991638, -0.6526155471801758, -0.6196547746658325, -0.5866940021514893, -0.5537331700325012, -0.520772397518158, -0.4878115952014923, -0.45485079288482666, -0.421889990568161, -0.38892918825149536, -0.3559684157371521, -0.32300761342048645, -0.2900468111038208, -0.25708603858947754, -0.2241252362728119, -0.19116444885730743, -0.15820366144180298, -0.12524285912513733, -0.09228206425905228, -0.059321269392967224, -0.026360467076301575, 0.006600320339202881, 0.039561107754707336, 0.07252191007137299]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 6.0, 13.0, 8.0, 9.0, 10.0, 11.0, 13.0, 21.0, 27.0, 18.0, 28.0, 26.0, 25.0, 34.0, 37.0, 35.0, 42.0, 24.0, 41.0, 30.0, 48.0, 43.0, 36.0, 41.0, 31.0, 40.0, 33.0, 42.0, 21.0, 28.0, 30.0, 17.0, 16.0, 21.0, 16.0, 15.0, 12.0, 7.0, 6.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.0807221531867981, -0.07827619463205338, -0.07583022862672806, -0.07338427007198334, -0.07093830406665802, -0.0684923455119133, -0.06604638695716858, -0.06360042095184326, -0.06115446239709854, -0.05870850011706352, -0.0562625378370285, -0.05381657928228378, -0.051370617002248764, -0.048924654722213745, -0.046478696167469025, -0.044032733887434006, -0.04158677160739899, -0.03914080932736397, -0.03669484704732895, -0.03424888849258423, -0.03180292621254921, -0.02935696393251419, -0.02691100351512432, -0.02446504309773445, -0.022019080817699432, -0.019573118537664413, -0.017127158120274544, -0.0146811967715621, -0.012235235422849655, -0.00978927407413721, -0.0073433127254247665, -0.004897352308034897, -0.002451390027999878, -5.428679287433624e-06, 0.0024405326694250107, 0.004886494018137455, 0.007332455366849899, 0.009778416715562344, 0.012224378064274788, 0.014670338481664658, 0.017116300761699677, 0.019562263041734695, 0.022008223459124565, 0.024454183876514435, 0.026900146156549454, 0.029346108436584473, 0.03179206699132919, 0.03423802927136421, 0.03668399155139923, 0.03912995383143425, 0.04157591611146927, 0.04402187466621399, 0.04646783694624901, 0.04891379922628403, 0.05135975778102875, 0.053805720061063766, 0.056251682341098785, 0.058697644621133804, 0.06114360690116882, 0.06358956545591354, 0.06603552401065826, 0.06848149001598358, 0.0709274485707283, 0.07337340712547302, 0.07581937313079834]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 3.0, 9.0, 6.0, 10.0, 18.0, 16.0, 22.0, 31.0, 25.0, 29.0, 33.0, 37.0, 36.0, 42.0, 33.0, 39.0, 43.0, 43.0, 41.0, 44.0, 39.0, 34.0, 36.0, 32.0, 45.0, 39.0, 24.0, 23.0, 21.0, 18.0, 16.0, 14.0, 13.0, 13.0, 12.0, 10.0, 11.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.640625, -4.48828125, -4.3359375, -4.18359375, -4.03125, -3.87890625, -3.7265625, -3.57421875, -3.421875, -3.26953125, -3.1171875, -2.96484375, -2.8125, -2.66015625, -2.5078125, -2.35546875, -2.203125, -2.05078125, -1.8984375, -1.74609375, -1.59375, -1.44140625, -1.2890625, -1.13671875, -0.984375, -0.83203125, -0.6796875, -0.52734375, -0.375, -0.22265625, -0.0703125, 0.08203125, 0.234375, 0.38671875, 0.5390625, 0.69140625, 0.84375, 0.99609375, 1.1484375, 1.30078125, 1.453125, 1.60546875, 1.7578125, 1.91015625, 2.0625, 2.21484375, 2.3671875, 2.51953125, 2.671875, 2.82421875, 2.9765625, 3.12890625, 3.28125, 3.43359375, 3.5859375, 3.73828125, 3.890625, 4.04296875, 4.1953125, 4.34765625, 4.5, 4.65234375, 4.8046875, 4.95703125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 16.0, 13.0, 33.0, 41.0, 56.0, 80.0, 114.0, 197.0, 293.0, 509.0, 951.0, 1700.0, 3252.0, 6400.0, 13595.0, 32761.0, 106088.0, 498080.0, 279328.0, 62209.0, 22305.0, 9886.0, 4868.0, 2593.0, 1313.0, 726.0, 415.0, 257.0, 145.0, 107.0, 53.0, 35.0, 33.0, 24.0, 14.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5546875, -8.28564453125, -8.0166015625, -7.74755859375, -7.478515625, -7.20947265625, -6.9404296875, -6.67138671875, -6.40234375, -6.13330078125, -5.8642578125, -5.59521484375, -5.326171875, -5.05712890625, -4.7880859375, -4.51904296875, -4.25, -3.98095703125, -3.7119140625, -3.44287109375, -3.173828125, -2.90478515625, -2.6357421875, -2.36669921875, -2.09765625, -1.82861328125, -1.5595703125, -1.29052734375, -1.021484375, -0.75244140625, -0.4833984375, -0.21435546875, 0.0546875, 0.32373046875, 0.5927734375, 0.86181640625, 1.130859375, 1.39990234375, 1.6689453125, 1.93798828125, 2.20703125, 2.47607421875, 2.7451171875, 3.01416015625, 3.283203125, 3.55224609375, 3.8212890625, 4.09033203125, 4.359375, 4.62841796875, 4.8974609375, 5.16650390625, 5.435546875, 5.70458984375, 5.9736328125, 6.24267578125, 6.51171875, 6.78076171875, 7.0498046875, 7.31884765625, 7.587890625, 7.85693359375, 8.1259765625, 8.39501953125, 8.6640625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 1.0, 7.0, 7.0, 10.0, 14.0, 14.0, 20.0, 27.0, 21.0, 23.0, 17.0, 25.0, 41.0, 40.0, 37.0, 52.0, 85.0, 141.0, 351.0, 1474.0, 183.0, 88.0, 56.0, 50.0, 30.0, 35.0, 28.0, 35.0, 23.0, 27.0, 13.0, 14.0, 13.0, 7.0, 11.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.9609375, -14.4952392578125, -14.029541015625, -13.5638427734375, -13.09814453125, -12.6324462890625, -12.166748046875, -11.7010498046875, -11.2353515625, -10.7696533203125, -10.303955078125, -9.8382568359375, -9.37255859375, -8.9068603515625, -8.441162109375, -7.9754638671875, -7.509765625, -7.0440673828125, -6.578369140625, -6.1126708984375, -5.64697265625, -5.1812744140625, -4.715576171875, -4.2498779296875, -3.7841796875, -3.3184814453125, -2.852783203125, -2.3870849609375, -1.92138671875, -1.4556884765625, -0.989990234375, -0.5242919921875, -0.05859375, 0.4071044921875, 0.872802734375, 1.3385009765625, 1.80419921875, 2.2698974609375, 2.735595703125, 3.2012939453125, 3.6669921875, 4.1326904296875, 4.598388671875, 5.0640869140625, 5.52978515625, 5.9954833984375, 6.461181640625, 6.9268798828125, 7.392578125, 7.8582763671875, 8.323974609375, 8.7896728515625, 9.25537109375, 9.7210693359375, 10.186767578125, 10.6524658203125, 11.1181640625, 11.5838623046875, 12.049560546875, 12.5152587890625, 12.98095703125, 13.4466552734375, 13.912353515625, 14.3780517578125, 14.84375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 4.0, 2.0, 3.0, 11.0, 8.0, 16.0, 18.0, 14.0, 27.0, 42.0, 48.0, 90.0, 163.0, 238.0, 489.0, 1517.0, 9757.0, 245145.0, 2845603.0, 36866.0, 3831.0, 871.0, 365.0, 194.0, 105.0, 94.0, 48.0, 39.0, 26.0, 12.0, 12.0, 11.0, 12.0, 7.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.453125, -28.567626953125, -27.68212890625, -26.796630859375, -25.9111328125, -25.025634765625, -24.14013671875, -23.254638671875, -22.369140625, -21.483642578125, -20.59814453125, -19.712646484375, -18.8271484375, -17.941650390625, -17.05615234375, -16.170654296875, -15.28515625, -14.399658203125, -13.51416015625, -12.628662109375, -11.7431640625, -10.857666015625, -9.97216796875, -9.086669921875, -8.201171875, -7.315673828125, -6.43017578125, -5.544677734375, -4.6591796875, -3.773681640625, -2.88818359375, -2.002685546875, -1.1171875, -0.231689453125, 0.65380859375, 1.539306640625, 2.4248046875, 3.310302734375, 4.19580078125, 5.081298828125, 5.966796875, 6.852294921875, 7.73779296875, 8.623291015625, 9.5087890625, 10.394287109375, 11.27978515625, 12.165283203125, 13.05078125, 13.936279296875, 14.82177734375, 15.707275390625, 16.5927734375, 17.478271484375, 18.36376953125, 19.249267578125, 20.134765625, 21.020263671875, 21.90576171875, 22.791259765625, 23.6767578125, 24.562255859375, 25.44775390625, 26.333251953125, 27.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 50.0, 236.0, 435.0, 237.0, 44.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.090768814086914, -8.679426193237305, -6.268082618713379, -3.8567395210266113, -1.4453964233398438, 0.9659461975097656, 3.3772897720336914, 5.788633346557617, 8.199975967407227, 10.611318588256836, 13.022662162780762, 15.434005737304688, 17.845348358154297, 20.256690979003906, 22.668033599853516, 25.079378128051758, 27.490720748901367, 29.902063369750977, 32.31340789794922, 34.72475051879883, 37.13609313964844, 39.54743576049805, 41.958778381347656, 44.37012481689453, 46.781463623046875, 49.192806243896484, 51.604148864746094, 54.0154914855957, 56.42683410644531, 58.83818054199219, 61.2495231628418, 63.660865783691406, 66.07220458984375, 68.48355102539062, 70.89488983154297, 73.30623626708984, 75.71757507324219, 78.12892150878906, 80.5402603149414, 82.95160675048828, 85.36294555664062, 87.7742919921875, 90.18563079833984, 92.59697723388672, 95.00831604003906, 97.41966247558594, 99.83100128173828, 102.24234771728516, 104.65369415283203, 107.0650405883789, 109.47637939453125, 111.88772583007812, 114.29906463623047, 116.71041107177734, 119.12174987792969, 121.53309631347656, 123.94444274902344, 126.35578918457031, 128.7671356201172, 131.178466796875, 133.58981323242188, 136.00115966796875, 138.41250610351562, 140.8238525390625, 143.2351837158203]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 12.0, 3.0, 7.0, 10.0, 14.0, 12.0, 10.0, 15.0, 12.0, 14.0, 23.0, 23.0, 34.0, 39.0, 30.0, 33.0, 22.0, 42.0, 32.0, 37.0, 45.0, 51.0, 41.0, 36.0, 45.0, 44.0, 39.0, 36.0, 38.0, 24.0, 23.0, 27.0, 19.0, 18.0, 13.0, 14.0, 7.0, 9.0, 4.0, 6.0, 3.0, 5.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-33.95932388305664, -32.9387092590332, -31.918092727661133, -30.897478103637695, -29.876863479614258, -28.856246948242188, -27.83563232421875, -26.815017700195312, -25.794403076171875, -24.773788452148438, -23.753171920776367, -22.73255729675293, -21.711942672729492, -20.691326141357422, -19.670711517333984, -18.650096893310547, -17.629480361938477, -16.60886573791504, -15.588250160217285, -14.567634582519531, -13.547019958496094, -12.52640438079834, -11.505788803100586, -10.485174179077148, -9.464558601379395, -8.44394302368164, -7.423328399658203, -6.402712821960449, -5.3820977210998535, -4.361482620239258, -3.340867042541504, -2.320251941680908, -1.2996349334716797, -0.27901971340179443, 0.7415955066680908, 1.7622108459472656, 2.7828259468078613, 3.803441047668457, 4.824056625366211, 5.844671726226807, 6.865286827087402, 7.885901927947998, 8.906517028808594, 9.927132606506348, 10.947748184204102, 11.968362808227539, 12.988978385925293, 14.009593963623047, 15.030208587646484, 16.050823211669922, 17.071439743041992, 18.09205436706543, 19.112668991088867, 20.133285522460938, 21.153900146484375, 22.174514770507812, 23.19512939453125, 24.215744018554688, 25.236360549926758, 26.256975173950195, 27.277589797973633, 28.298206329345703, 29.31882095336914, 30.339435577392578, 31.36005210876465]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 7.0, 16.0, 10.0, 14.0, 12.0, 19.0, 15.0, 18.0, 30.0, 32.0, 24.0, 27.0, 35.0, 47.0, 30.0, 39.0, 36.0, 39.0, 29.0, 48.0, 53.0, 48.0, 32.0, 33.0, 34.0, 29.0, 34.0, 25.0, 22.0, 25.0, 20.0, 13.0, 11.0, 13.0, 14.0, 12.0, 9.0, 4.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.65625, -4.50836181640625, -4.3604736328125, -4.21258544921875, -4.064697265625, -3.91680908203125, -3.7689208984375, -3.62103271484375, -3.47314453125, -3.32525634765625, -3.1773681640625, -3.02947998046875, -2.881591796875, -2.73370361328125, -2.5858154296875, -2.43792724609375, -2.2900390625, -2.14215087890625, -1.9942626953125, -1.84637451171875, -1.698486328125, -1.55059814453125, -1.4027099609375, -1.25482177734375, -1.10693359375, -0.95904541015625, -0.8111572265625, -0.66326904296875, -0.515380859375, -0.36749267578125, -0.2196044921875, -0.07171630859375, 0.076171875, 0.22406005859375, 0.3719482421875, 0.51983642578125, 0.667724609375, 0.81561279296875, 0.9635009765625, 1.11138916015625, 1.25927734375, 1.40716552734375, 1.5550537109375, 1.70294189453125, 1.850830078125, 1.99871826171875, 2.1466064453125, 2.29449462890625, 2.4423828125, 2.59027099609375, 2.7381591796875, 2.88604736328125, 3.033935546875, 3.18182373046875, 3.3297119140625, 3.47760009765625, 3.62548828125, 3.77337646484375, 3.9212646484375, 4.06915283203125, 4.217041015625, 4.36492919921875, 4.5128173828125, 4.66070556640625, 4.80859375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 8.0, 9.0, 11.0, 18.0, 28.0, 38.0, 52.0, 65.0, 105.0, 130.0, 226.0, 294.0, 456.0, 722.0, 1107.0, 1784.0, 2908.0, 4961.0, 9879.0, 21755.0, 64314.0, 280313.0, 1399609.0, 1836483.0, 425880.0, 89254.0, 27862.0, 11863.0, 5919.0, 3093.0, 1820.0, 1145.0, 692.0, 461.0, 315.0, 210.0, 155.0, 89.0, 75.0, 53.0, 34.0, 26.0, 17.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0], "bins": [-8.3125, -8.06890869140625, -7.8253173828125, -7.58172607421875, -7.338134765625, -7.09454345703125, -6.8509521484375, -6.60736083984375, -6.36376953125, -6.12017822265625, -5.8765869140625, -5.63299560546875, -5.389404296875, -5.14581298828125, -4.9022216796875, -4.65863037109375, -4.4150390625, -4.17144775390625, -3.9278564453125, -3.68426513671875, -3.440673828125, -3.19708251953125, -2.9534912109375, -2.70989990234375, -2.46630859375, -2.22271728515625, -1.9791259765625, -1.73553466796875, -1.491943359375, -1.24835205078125, -1.0047607421875, -0.76116943359375, -0.517578125, -0.27398681640625, -0.0303955078125, 0.21319580078125, 0.456787109375, 0.70037841796875, 0.9439697265625, 1.18756103515625, 1.43115234375, 1.67474365234375, 1.9183349609375, 2.16192626953125, 2.405517578125, 2.64910888671875, 2.8927001953125, 3.13629150390625, 3.3798828125, 3.62347412109375, 3.8670654296875, 4.11065673828125, 4.354248046875, 4.59783935546875, 4.8414306640625, 5.08502197265625, 5.32861328125, 5.57220458984375, 5.8157958984375, 6.05938720703125, 6.302978515625, 6.54656982421875, 6.7901611328125, 7.03375244140625, 7.27734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 8.0, 9.0, 17.0, 11.0, 17.0, 29.0, 36.0, 55.0, 61.0, 72.0, 98.0, 149.0, 207.0, 306.0, 346.0, 432.0, 503.0, 447.0, 303.0, 237.0, 180.0, 125.0, 102.0, 60.0, 61.0, 41.0, 31.0, 28.0, 13.0, 16.0, 17.0, 10.0, 15.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.63671875, -7.41375732421875, -7.1907958984375, -6.96783447265625, -6.744873046875, -6.52191162109375, -6.2989501953125, -6.07598876953125, -5.85302734375, -5.63006591796875, -5.4071044921875, -5.18414306640625, -4.961181640625, -4.73822021484375, -4.5152587890625, -4.29229736328125, -4.0693359375, -3.84637451171875, -3.6234130859375, -3.40045166015625, -3.177490234375, -2.95452880859375, -2.7315673828125, -2.50860595703125, -2.28564453125, -2.06268310546875, -1.8397216796875, -1.61676025390625, -1.393798828125, -1.17083740234375, -0.9478759765625, -0.72491455078125, -0.501953125, -0.27899169921875, -0.0560302734375, 0.16693115234375, 0.389892578125, 0.61285400390625, 0.8358154296875, 1.05877685546875, 1.28173828125, 1.50469970703125, 1.7276611328125, 1.95062255859375, 2.173583984375, 2.39654541015625, 2.6195068359375, 2.84246826171875, 3.0654296875, 3.28839111328125, 3.5113525390625, 3.73431396484375, 3.957275390625, 4.18023681640625, 4.4031982421875, 4.62615966796875, 4.84912109375, 5.07208251953125, 5.2950439453125, 5.51800537109375, 5.740966796875, 5.96392822265625, 6.1868896484375, 6.40985107421875, 6.6328125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 2.0, 4.0, 9.0, 14.0, 12.0, 20.0, 22.0, 28.0, 35.0, 68.0, 68.0, 83.0, 171.0, 287.0, 550.0, 1556.0, 4547.0, 17616.0, 140100.0, 3070701.0, 892734.0, 51267.0, 9513.0, 2765.0, 962.0, 429.0, 239.0, 125.0, 84.0, 65.0, 47.0, 30.0, 28.0, 14.0, 16.0, 18.0, 16.0, 8.0, 6.0, 6.0, 1.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.515625, -21.868408203125, -21.22119140625, -20.573974609375, -19.9267578125, -19.279541015625, -18.63232421875, -17.985107421875, -17.337890625, -16.690673828125, -16.04345703125, -15.396240234375, -14.7490234375, -14.101806640625, -13.45458984375, -12.807373046875, -12.16015625, -11.512939453125, -10.86572265625, -10.218505859375, -9.5712890625, -8.924072265625, -8.27685546875, -7.629638671875, -6.982421875, -6.335205078125, -5.68798828125, -5.040771484375, -4.3935546875, -3.746337890625, -3.09912109375, -2.451904296875, -1.8046875, -1.157470703125, -0.51025390625, 0.136962890625, 0.7841796875, 1.431396484375, 2.07861328125, 2.725830078125, 3.373046875, 4.020263671875, 4.66748046875, 5.314697265625, 5.9619140625, 6.609130859375, 7.25634765625, 7.903564453125, 8.55078125, 9.197998046875, 9.84521484375, 10.492431640625, 11.1396484375, 11.786865234375, 12.43408203125, 13.081298828125, 13.728515625, 14.375732421875, 15.02294921875, 15.670166015625, 16.3173828125, 16.964599609375, 17.61181640625, 18.259033203125, 18.90625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 14.0, 40.0, 105.0, 203.0, 277.0, 198.0, 113.0, 38.0, 16.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.33648681640625, -108.83415222167969, -106.33182525634766, -103.8294906616211, -101.32715606689453, -98.8248291015625, -96.32249450683594, -93.82015991210938, -91.31783294677734, -88.81549835205078, -86.31317138671875, -83.81083679199219, -81.30850219726562, -78.8061752319336, -76.30384063720703, -73.801513671875, -71.29917907714844, -68.79684448242188, -66.29451751708984, -63.79218292236328, -61.289852142333984, -58.78752136230469, -56.285186767578125, -53.78285598754883, -51.280517578125, -48.7781867980957, -46.27585220336914, -43.773521423339844, -41.27119064331055, -38.76885986328125, -36.26652526855469, -33.76419448852539, -31.26186752319336, -28.75953483581543, -26.257204055786133, -23.754871368408203, -21.252540588378906, -18.750207901000977, -16.247875213623047, -13.74554443359375, -11.24321174621582, -8.740880012512207, -6.2385478019714355, -3.736215591430664, -1.2338838577270508, 1.2684478759765625, 3.770780563354492, 6.273111343383789, 8.775444030761719, 11.277775764465332, 13.780107498168945, 16.282440185546875, 18.784770965576172, 21.2871036529541, 23.78943634033203, 26.291767120361328, 28.794099807739258, 31.296432495117188, 33.798763275146484, 36.30109405517578, 38.803428649902344, 41.30575942993164, 43.80809020996094, 46.3104248046875, 48.8127555847168]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 3.0, 7.0, 12.0, 10.0, 12.0, 9.0, 13.0, 17.0, 21.0, 16.0, 22.0, 28.0, 32.0, 25.0, 29.0, 27.0, 46.0, 31.0, 56.0, 49.0, 37.0, 36.0, 43.0, 34.0, 34.0, 34.0, 39.0, 44.0, 26.0, 34.0, 26.0, 23.0, 16.0, 29.0, 12.0, 14.0, 11.0, 11.0, 6.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-25.700098037719727, -24.933231353759766, -24.166364669799805, -23.399497985839844, -22.632631301879883, -21.865764617919922, -21.098896026611328, -20.33203125, -19.565162658691406, -18.798295974731445, -18.031429290771484, -17.264562606811523, -16.497695922851562, -15.730829238891602, -14.963961601257324, -14.197094917297363, -13.430229187011719, -12.663362503051758, -11.896495819091797, -11.129629135131836, -10.362762451171875, -9.595895767211914, -8.829028129577637, -8.062161445617676, -7.295294761657715, -6.528428077697754, -5.761561393737793, -4.994694232940674, -4.227827548980713, -3.460960865020752, -2.694093704223633, -1.9272270202636719, -1.160360336303711, -0.39349353313446045, 0.37337327003479004, 1.14024019241333, 1.907106876373291, 2.673973560333252, 3.440840721130371, 4.207707405090332, 4.974574089050293, 5.741440773010254, 6.508307456970215, 7.275174617767334, 8.042041778564453, 8.808908462524414, 9.575775146484375, 10.342641830444336, 11.109508514404297, 11.876375198364258, 12.643241882324219, 13.41010856628418, 14.17697525024414, 14.943841934204102, 15.710709571838379, 16.477577209472656, 17.244441986083984, 18.011308670043945, 18.778175354003906, 19.545042037963867, 20.311908721923828, 21.07877540588379, 21.84564208984375, 22.612510681152344, 23.379377365112305]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 9.0, 11.0, 6.0, 6.0, 12.0, 11.0, 16.0, 24.0, 22.0, 29.0, 30.0, 31.0, 39.0, 38.0, 38.0, 40.0, 28.0, 48.0, 48.0, 52.0, 41.0, 40.0, 39.0, 37.0, 35.0, 29.0, 37.0, 32.0, 16.0, 29.0, 20.0, 20.0, 18.0, 20.0, 8.0, 7.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.2869873046875, -4.128662109375, -3.9703369140625, -3.81201171875, -3.6536865234375, -3.495361328125, -3.3370361328125, -3.1787109375, -3.0203857421875, -2.862060546875, -2.7037353515625, -2.54541015625, -2.3870849609375, -2.228759765625, -2.0704345703125, -1.912109375, -1.7537841796875, -1.595458984375, -1.4371337890625, -1.27880859375, -1.1204833984375, -0.962158203125, -0.8038330078125, -0.6455078125, -0.4871826171875, -0.328857421875, -0.1705322265625, -0.01220703125, 0.1461181640625, 0.304443359375, 0.4627685546875, 0.62109375, 0.7794189453125, 0.937744140625, 1.0960693359375, 1.25439453125, 1.4127197265625, 1.571044921875, 1.7293701171875, 1.8876953125, 2.0460205078125, 2.204345703125, 2.3626708984375, 2.52099609375, 2.6793212890625, 2.837646484375, 2.9959716796875, 3.154296875, 3.3126220703125, 3.470947265625, 3.6292724609375, 3.78759765625, 3.9459228515625, 4.104248046875, 4.2625732421875, 4.4208984375, 4.5792236328125, 4.737548828125, 4.8958740234375, 5.05419921875, 5.2125244140625, 5.370849609375, 5.5291748046875, 5.6875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 12.0, 22.0, 33.0, 50.0, 73.0, 100.0, 177.0, 267.0, 403.0, 616.0, 1000.0, 1590.0, 2512.0, 4209.0, 6800.0, 11541.0, 19808.0, 33965.0, 58555.0, 99282.0, 155931.0, 201673.0, 171908.0, 113141.0, 68043.0, 39675.0, 22958.0, 13333.0, 8156.0, 4783.0, 3000.0, 1728.0, 1170.0, 752.0, 468.0, 292.0, 181.0, 119.0, 75.0, 46.0, 35.0, 22.0, 16.0, 9.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60107421875, -0.5832061767578125, -0.565338134765625, -0.5474700927734375, -0.52960205078125, -0.5117340087890625, -0.493865966796875, -0.4759979248046875, -0.4581298828125, -0.4402618408203125, -0.422393798828125, -0.4045257568359375, -0.38665771484375, -0.3687896728515625, -0.350921630859375, -0.3330535888671875, -0.315185546875, -0.2973175048828125, -0.279449462890625, -0.2615814208984375, -0.24371337890625, -0.2258453369140625, -0.207977294921875, -0.1901092529296875, -0.1722412109375, -0.1543731689453125, -0.136505126953125, -0.1186370849609375, -0.10076904296875, -0.0829010009765625, -0.065032958984375, -0.0471649169921875, -0.029296875, -0.0114288330078125, 0.006439208984375, 0.0243072509765625, 0.04217529296875, 0.0600433349609375, 0.077911376953125, 0.0957794189453125, 0.1136474609375, 0.1315155029296875, 0.149383544921875, 0.1672515869140625, 0.18511962890625, 0.2029876708984375, 0.220855712890625, 0.2387237548828125, 0.256591796875, 0.2744598388671875, 0.292327880859375, 0.3101959228515625, 0.32806396484375, 0.3459320068359375, 0.363800048828125, 0.3816680908203125, 0.3995361328125, 0.4174041748046875, 0.435272216796875, 0.4531402587890625, 0.47100830078125, 0.4888763427734375, 0.506744384765625, 0.5246124267578125, 0.54248046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 3.0, 11.0, 10.0, 12.0, 21.0, 12.0, 19.0, 35.0, 30.0, 28.0, 34.0, 50.0, 39.0, 45.0, 38.0, 49.0, 40.0, 1077.0, 59.0, 40.0, 46.0, 42.0, 38.0, 28.0, 41.0, 27.0, 21.0, 14.0, 18.0, 20.0, 14.0, 11.0, 12.0, 11.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.85150146484375, -3.7322998046875, -3.61309814453125, -3.493896484375, -3.37469482421875, -3.2554931640625, -3.13629150390625, -3.01708984375, -2.89788818359375, -2.7786865234375, -2.65948486328125, -2.540283203125, -2.42108154296875, -2.3018798828125, -2.18267822265625, -2.0634765625, -1.94427490234375, -1.8250732421875, -1.70587158203125, -1.586669921875, -1.46746826171875, -1.3482666015625, -1.22906494140625, -1.10986328125, -0.99066162109375, -0.8714599609375, -0.75225830078125, -0.633056640625, -0.51385498046875, -0.3946533203125, -0.27545166015625, -0.15625, -0.03704833984375, 0.0821533203125, 0.20135498046875, 0.320556640625, 0.43975830078125, 0.5589599609375, 0.67816162109375, 0.79736328125, 0.91656494140625, 1.0357666015625, 1.15496826171875, 1.274169921875, 1.39337158203125, 1.5125732421875, 1.63177490234375, 1.7509765625, 1.87017822265625, 1.9893798828125, 2.10858154296875, 2.227783203125, 2.34698486328125, 2.4661865234375, 2.58538818359375, 2.70458984375, 2.82379150390625, 2.9429931640625, 3.06219482421875, 3.181396484375, 3.30059814453125, 3.4197998046875, 3.53900146484375, 3.658203125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 8.0, 12.0, 14.0, 14.0, 26.0, 32.0, 38.0, 50.0, 83.0, 129.0, 175.0, 246.0, 369.0, 530.0, 877.0, 1379.0, 2343.0, 4012.0, 7374.0, 14037.0, 26889.0, 53959.0, 110295.0, 247624.0, 1097168.0, 286525.0, 120026.0, 58917.0, 29504.0, 15061.0, 8102.0, 4480.0, 2511.0, 1520.0, 943.0, 562.0, 411.0, 257.0, 206.0, 138.0, 69.0, 66.0, 44.0, 31.0, 21.0, 14.0, 15.0, 11.0, 2.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4150390625, -0.401458740234375, -0.38787841796875, -0.374298095703125, -0.3607177734375, -0.347137451171875, -0.33355712890625, -0.319976806640625, -0.306396484375, -0.292816162109375, -0.27923583984375, -0.265655517578125, -0.2520751953125, -0.238494873046875, -0.22491455078125, -0.211334228515625, -0.19775390625, -0.184173583984375, -0.17059326171875, -0.157012939453125, -0.1434326171875, -0.129852294921875, -0.11627197265625, -0.102691650390625, -0.089111328125, -0.075531005859375, -0.06195068359375, -0.048370361328125, -0.0347900390625, -0.021209716796875, -0.00762939453125, 0.005950927734375, 0.01953125, 0.033111572265625, 0.04669189453125, 0.060272216796875, 0.0738525390625, 0.087432861328125, 0.10101318359375, 0.114593505859375, 0.128173828125, 0.141754150390625, 0.15533447265625, 0.168914794921875, 0.1824951171875, 0.196075439453125, 0.20965576171875, 0.223236083984375, 0.23681640625, 0.250396728515625, 0.26397705078125, 0.277557373046875, 0.2911376953125, 0.304718017578125, 0.31829833984375, 0.331878662109375, 0.345458984375, 0.359039306640625, 0.37261962890625, 0.386199951171875, 0.3997802734375, 0.413360595703125, 0.42694091796875, 0.440521240234375, 0.4541015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 4.0, 7.0, 7.0, 9.0, 18.0, 26.0, 36.0, 61.0, 141.0, 256.0, 181.0, 102.0, 46.0, 19.0, 15.0, 8.0, 6.0, 6.0, 3.0, 4.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.14691162109375, -0.1416015625, -0.13629150390625, -0.1309814453125, -0.12567138671875, -0.120361328125, -0.11505126953125, -0.1097412109375, -0.10443115234375, -0.09912109375, -0.09381103515625, -0.0885009765625, -0.08319091796875, -0.077880859375, -0.07257080078125, -0.0672607421875, -0.06195068359375, -0.056640625, -0.05133056640625, -0.0460205078125, -0.04071044921875, -0.035400390625, -0.03009033203125, -0.0247802734375, -0.01947021484375, -0.01416015625, -0.00885009765625, -0.0035400390625, 0.00177001953125, 0.007080078125, 0.01239013671875, 0.0177001953125, 0.02301025390625, 0.0283203125, 0.03363037109375, 0.0389404296875, 0.04425048828125, 0.049560546875, 0.05487060546875, 0.0601806640625, 0.06549072265625, 0.07080078125, 0.07611083984375, 0.0814208984375, 0.08673095703125, 0.092041015625, 0.09735107421875, 0.1026611328125, 0.10797119140625, 0.11328125, 0.11859130859375, 0.1239013671875, 0.12921142578125, 0.134521484375, 0.13983154296875, 0.1451416015625, 0.15045166015625, 0.15576171875, 0.16107177734375, 0.1663818359375, 0.17169189453125, 0.177001953125, 0.18231201171875, 0.1876220703125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 15.0, 11.0, 49.0, 65.0, 162.0, 891.0, 1017508.0, 29013.0, 488.0, 135.0, 56.0, 29.0, 23.0, 11.0, 10.0, 7.0, 2.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.52734375, -4.3936767578125, -4.260009765625, -4.1263427734375, -3.99267578125, -3.8590087890625, -3.725341796875, -3.5916748046875, -3.4580078125, -3.3243408203125, -3.190673828125, -3.0570068359375, -2.92333984375, -2.7896728515625, -2.656005859375, -2.5223388671875, -2.388671875, -2.2550048828125, -2.121337890625, -1.9876708984375, -1.85400390625, -1.7203369140625, -1.586669921875, -1.4530029296875, -1.3193359375, -1.1856689453125, -1.052001953125, -0.9183349609375, -0.78466796875, -0.6510009765625, -0.517333984375, -0.3836669921875, -0.25, -0.1163330078125, 0.017333984375, 0.1510009765625, 0.28466796875, 0.4183349609375, 0.552001953125, 0.6856689453125, 0.8193359375, 0.9530029296875, 1.086669921875, 1.2203369140625, 1.35400390625, 1.4876708984375, 1.621337890625, 1.7550048828125, 1.888671875, 2.0223388671875, 2.156005859375, 2.2896728515625, 2.42333984375, 2.5570068359375, 2.690673828125, 2.8243408203125, 2.9580078125, 3.0916748046875, 3.225341796875, 3.3590087890625, 3.49267578125, 3.6263427734375, 3.760009765625, 3.8936767578125, 4.02734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 8.0, 21.0, 65.0, 324.0, 471.0, 102.0, 18.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1493738293647766, -0.12853878736495972, -0.10770375281572342, -0.08686871826648712, -0.06603367626667023, -0.04519863426685333, -0.024363607168197632, -0.0035285651683807373, 0.017306476831436157, 0.03814151510596275, 0.05897655338048935, 0.07981158792972565, 0.10064662992954254, 0.12148167192935944, 0.14231669902801514, 0.16315174102783203, 0.18398678302764893, 0.20482182502746582, 0.22565686702728271, 0.24649189412593842, 0.2673269510269165, 0.2881619930267334, 0.3089970052242279, 0.3298320472240448, 0.3506670892238617, 0.3715021312236786, 0.3923371732234955, 0.41317218542099, 0.4340072274208069, 0.4548422694206238, 0.4756773114204407, 0.49651235342025757, 0.5173473358154297, 0.5381823778152466, 0.5590174198150635, 0.5798524618148804, 0.6006875038146973, 0.6215225458145142, 0.642357587814331, 0.663192629814148, 0.6840276718139648, 0.7048627138137817, 0.7256977558135986, 0.7465327978134155, 0.7673678398132324, 0.7882028818130493, 0.8090379238128662, 0.8298729658126831, 0.8507079482078552, 0.8715429902076721, 0.892378032207489, 0.9132130742073059, 0.9340481162071228, 0.9548831582069397, 0.9757181406021118, 0.9965531826019287, 1.0173882246017456, 1.0382232666015625, 1.0590583086013794, 1.0798933506011963, 1.1007283926010132, 1.12156343460083, 1.142398476600647, 1.1632335186004639, 1.1840685606002808]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 8.0, 7.0, 12.0, 13.0, 23.0, 11.0, 26.0, 27.0, 24.0, 26.0, 24.0, 48.0, 29.0, 38.0, 37.0, 39.0, 41.0, 43.0, 37.0, 46.0, 47.0, 34.0, 34.0, 37.0, 22.0, 27.0, 32.0, 34.0, 15.0, 29.0, 23.0, 17.0, 18.0, 13.0, 10.0, 5.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.13939166069030762, -0.13498206436634064, -0.13057246804237366, -0.12616287171840668, -0.1217532753944397, -0.11734367907047272, -0.11293409019708633, -0.10852449387311935, -0.10411489754915237, -0.0997053012251854, -0.09529570490121841, -0.09088610857725143, -0.08647651970386505, -0.08206692337989807, -0.07765732705593109, -0.07324773073196411, -0.06883813440799713, -0.06442853808403015, -0.06001894176006317, -0.05560934916138649, -0.05119975283741951, -0.04679015651345253, -0.04238056391477585, -0.03797096759080887, -0.03356137126684189, -0.02915177494287491, -0.024742180481553078, -0.020332586020231247, -0.015922989696264267, -0.011513393372297287, -0.007103798910975456, -0.0026942044496536255, 0.0017153918743133545, 0.00612498726695776, 0.010534582659602165, 0.01494417805224657, 0.019353773444890976, 0.023763369768857956, 0.028172964230179787, 0.03258255869150162, 0.0369921550154686, 0.04140175133943558, 0.04581134766340256, 0.05022094026207924, 0.05463053658604622, 0.0590401329100132, 0.06344972550868988, 0.06785932183265686, 0.07226891815662384, 0.07667851448059082, 0.0810881108045578, 0.08549770712852478, 0.08990730345249176, 0.09431689977645874, 0.09872648864984512, 0.1031360849738121, 0.10754568129777908, 0.11195527762174606, 0.11636487394571304, 0.12077447026968002, 0.1251840591430664, 0.1295936554670334, 0.13400325179100037, 0.13841284811496735, 0.14282244443893433]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 1.0, 7.0, 8.0, 7.0, 9.0, 16.0, 11.0, 16.0, 18.0, 21.0, 28.0, 31.0, 27.0, 28.0, 44.0, 41.0, 41.0, 38.0, 33.0, 42.0, 31.0, 50.0, 45.0, 35.0, 30.0, 37.0, 36.0, 33.0, 31.0, 28.0, 17.0, 23.0, 22.0, 18.0, 14.0, 15.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.28350830078125, -4.1334228515625, -3.98333740234375, -3.833251953125, -3.68316650390625, -3.5330810546875, -3.38299560546875, -3.23291015625, -3.08282470703125, -2.9327392578125, -2.78265380859375, -2.632568359375, -2.48248291015625, -2.3323974609375, -2.18231201171875, -2.0322265625, -1.88214111328125, -1.7320556640625, -1.58197021484375, -1.431884765625, -1.28179931640625, -1.1317138671875, -0.98162841796875, -0.83154296875, -0.68145751953125, -0.5313720703125, -0.38128662109375, -0.231201171875, -0.08111572265625, 0.0689697265625, 0.21905517578125, 0.369140625, 0.51922607421875, 0.6693115234375, 0.81939697265625, 0.969482421875, 1.11956787109375, 1.2696533203125, 1.41973876953125, 1.56982421875, 1.71990966796875, 1.8699951171875, 2.02008056640625, 2.170166015625, 2.32025146484375, 2.4703369140625, 2.62042236328125, 2.7705078125, 2.92059326171875, 3.0706787109375, 3.22076416015625, 3.370849609375, 3.52093505859375, 3.6710205078125, 3.82110595703125, 3.97119140625, 4.12127685546875, 4.2713623046875, 4.42144775390625, 4.571533203125, 4.72161865234375, 4.8717041015625, 5.02178955078125, 5.171875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 3.0, 7.0, 14.0, 18.0, 24.0, 37.0, 56.0, 93.0, 117.0, 198.0, 257.0, 463.0, 759.0, 1079.0, 1675.0, 2579.0, 4115.0, 6497.0, 10488.0, 16789.0, 28301.0, 47709.0, 86201.0, 168187.0, 263240.0, 184794.0, 94144.0, 51490.0, 30265.0, 18402.0, 11247.0, 7018.0, 4400.0, 2794.0, 1750.0, 1158.0, 760.0, 493.0, 282.0, 193.0, 143.0, 100.0, 64.0, 57.0, 33.0, 19.0, 13.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.64453125, -5.48126220703125, -5.3179931640625, -5.15472412109375, -4.991455078125, -4.82818603515625, -4.6649169921875, -4.50164794921875, -4.33837890625, -4.17510986328125, -4.0118408203125, -3.84857177734375, -3.685302734375, -3.52203369140625, -3.3587646484375, -3.19549560546875, -3.0322265625, -2.86895751953125, -2.7056884765625, -2.54241943359375, -2.379150390625, -2.21588134765625, -2.0526123046875, -1.88934326171875, -1.72607421875, -1.56280517578125, -1.3995361328125, -1.23626708984375, -1.072998046875, -0.90972900390625, -0.7464599609375, -0.58319091796875, -0.419921875, -0.25665283203125, -0.0933837890625, 0.06988525390625, 0.233154296875, 0.39642333984375, 0.5596923828125, 0.72296142578125, 0.88623046875, 1.04949951171875, 1.2127685546875, 1.37603759765625, 1.539306640625, 1.70257568359375, 1.8658447265625, 2.02911376953125, 2.1923828125, 2.35565185546875, 2.5189208984375, 2.68218994140625, 2.845458984375, 3.00872802734375, 3.1719970703125, 3.33526611328125, 3.49853515625, 3.66180419921875, 3.8250732421875, 3.98834228515625, 4.151611328125, 4.31488037109375, 4.4781494140625, 4.64141845703125, 4.8046875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 8.0, 7.0, 16.0, 7.0, 17.0, 27.0, 23.0, 30.0, 34.0, 42.0, 47.0, 49.0, 56.0, 69.0, 113.0, 170.0, 1383.0, 276.0, 156.0, 88.0, 50.0, 58.0, 38.0, 29.0, 31.0, 36.0, 28.0, 21.0, 24.0, 20.0, 15.0, 14.0, 13.0, 14.0, 6.0, 4.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.125, -13.7078857421875, -13.290771484375, -12.8736572265625, -12.45654296875, -12.0394287109375, -11.622314453125, -11.2052001953125, -10.7880859375, -10.3709716796875, -9.953857421875, -9.5367431640625, -9.11962890625, -8.7025146484375, -8.285400390625, -7.8682861328125, -7.451171875, -7.0340576171875, -6.616943359375, -6.1998291015625, -5.78271484375, -5.3656005859375, -4.948486328125, -4.5313720703125, -4.1142578125, -3.6971435546875, -3.280029296875, -2.8629150390625, -2.44580078125, -2.0286865234375, -1.611572265625, -1.1944580078125, -0.77734375, -0.3602294921875, 0.056884765625, 0.4739990234375, 0.89111328125, 1.3082275390625, 1.725341796875, 2.1424560546875, 2.5595703125, 2.9766845703125, 3.393798828125, 3.8109130859375, 4.22802734375, 4.6451416015625, 5.062255859375, 5.4793701171875, 5.896484375, 6.3135986328125, 6.730712890625, 7.1478271484375, 7.56494140625, 7.9820556640625, 8.399169921875, 8.8162841796875, 9.2333984375, 9.6505126953125, 10.067626953125, 10.4847412109375, 10.90185546875, 11.3189697265625, 11.736083984375, 12.1531982421875, 12.5703125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 9.0, 9.0, 22.0, 19.0, 29.0, 34.0, 50.0, 82.0, 103.0, 118.0, 186.0, 276.0, 487.0, 1084.0, 4403.0, 32736.0, 722225.0, 2305729.0, 67616.0, 7319.0, 1587.0, 567.0, 281.0, 196.0, 127.0, 96.0, 77.0, 49.0, 48.0, 35.0, 23.0, 18.0, 11.0, 18.0, 9.0, 11.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.296875, -21.603271484375, -20.90966796875, -20.216064453125, -19.5224609375, -18.828857421875, -18.13525390625, -17.441650390625, -16.748046875, -16.054443359375, -15.36083984375, -14.667236328125, -13.9736328125, -13.280029296875, -12.58642578125, -11.892822265625, -11.19921875, -10.505615234375, -9.81201171875, -9.118408203125, -8.4248046875, -7.731201171875, -7.03759765625, -6.343994140625, -5.650390625, -4.956787109375, -4.26318359375, -3.569580078125, -2.8759765625, -2.182373046875, -1.48876953125, -0.795166015625, -0.1015625, 0.592041015625, 1.28564453125, 1.979248046875, 2.6728515625, 3.366455078125, 4.06005859375, 4.753662109375, 5.447265625, 6.140869140625, 6.83447265625, 7.528076171875, 8.2216796875, 8.915283203125, 9.60888671875, 10.302490234375, 10.99609375, 11.689697265625, 12.38330078125, 13.076904296875, 13.7705078125, 14.464111328125, 15.15771484375, 15.851318359375, 16.544921875, 17.238525390625, 17.93212890625, 18.625732421875, 19.3193359375, 20.012939453125, 20.70654296875, 21.400146484375, 22.09375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 33.0, 148.0, 363.0, 314.0, 124.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-101.5394287109375, -98.79120635986328, -96.04297637939453, -93.29475402832031, -90.54652404785156, -87.79830169677734, -85.05007934570312, -82.30184936523438, -79.55362701416016, -76.80540466308594, -74.05717468261719, -71.30895233154297, -68.56072998046875, -65.8125, -63.06427764892578, -60.3160514831543, -57.56782531738281, -54.81959915161133, -52.071372985839844, -49.323150634765625, -46.57492446899414, -43.826698303222656, -41.07847595214844, -38.33024978637695, -35.58202362060547, -32.833797454833984, -30.085573196411133, -27.33734893798828, -24.589122772216797, -21.840896606445312, -19.09267234802246, -16.34444808959961, -13.596229553222656, -10.848004341125488, -8.09977912902832, -5.351553916931152, -2.6033287048339844, 0.1448965072631836, 2.8931217193603516, 5.641345977783203, 8.389572143554688, 11.137797355651855, 13.886022567749023, 16.634246826171875, 19.38247299194336, 22.130699157714844, 24.878923416137695, 27.627147674560547, 30.37537384033203, 33.123600006103516, 35.871826171875, 38.62004852294922, 41.3682746887207, 44.11650085449219, 46.864723205566406, 49.61294937133789, 52.361175537109375, 55.10940170288086, 57.857627868652344, 60.60585021972656, 63.35407638549805, 66.10230255126953, 68.85052490234375, 71.5987548828125, 74.34697723388672]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 4.0, 11.0, 5.0, 12.0, 2.0, 4.0, 12.0, 19.0, 28.0, 20.0, 23.0, 17.0, 21.0, 31.0, 25.0, 31.0, 34.0, 45.0, 31.0, 42.0, 45.0, 36.0, 41.0, 42.0, 38.0, 34.0, 43.0, 44.0, 32.0, 40.0, 28.0, 26.0, 25.0, 14.0, 19.0, 16.0, 17.0, 9.0, 8.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.792816162109375, -28.82180404663086, -27.850791931152344, -26.879779815673828, -25.908767700195312, -24.937755584716797, -23.96674346923828, -22.995731353759766, -22.02471923828125, -21.053707122802734, -20.08269500732422, -19.111682891845703, -18.140670776367188, -17.169658660888672, -16.198646545410156, -15.22763442993164, -14.256621360778809, -13.285609245300293, -12.314597129821777, -11.343585014343262, -10.372572898864746, -9.401559829711914, -8.430547714233398, -7.459536075592041, -6.488523960113525, -5.51751184463501, -4.546499729156494, -3.5754873752593994, -2.604475259780884, -1.633462905883789, -0.6624507904052734, 0.3085613250732422, 1.2795734405517578, 2.2505855560302734, 3.221597671508789, 4.192609786987305, 5.16362190246582, 6.134634494781494, 7.10564661026001, 8.076658248901367, 9.047670364379883, 10.018682479858398, 10.989694595336914, 11.96070671081543, 12.931718826293945, 13.902730941772461, 14.873743057250977, 15.844755172729492, 16.81576919555664, 17.786781311035156, 18.757793426513672, 19.728805541992188, 20.699817657470703, 21.67082977294922, 22.641841888427734, 23.61285400390625, 24.583866119384766, 25.55487823486328, 26.525890350341797, 27.496902465820312, 28.467914581298828, 29.438926696777344, 30.40993881225586, 31.380950927734375, 32.35196304321289]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 4.0, 13.0, 20.0, 15.0, 20.0, 21.0, 31.0, 32.0, 31.0, 20.0, 33.0, 44.0, 56.0, 41.0, 50.0, 52.0, 38.0, 43.0, 41.0, 47.0, 33.0, 23.0, 44.0, 40.0, 35.0, 21.0, 21.0, 23.0, 12.0, 17.0, 9.0, 15.0, 11.0, 6.0, 4.0, 6.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.03125, -4.865966796875, -4.70068359375, -4.535400390625, -4.3701171875, -4.204833984375, -4.03955078125, -3.874267578125, -3.708984375, -3.543701171875, -3.37841796875, -3.213134765625, -3.0478515625, -2.882568359375, -2.71728515625, -2.552001953125, -2.38671875, -2.221435546875, -2.05615234375, -1.890869140625, -1.7255859375, -1.560302734375, -1.39501953125, -1.229736328125, -1.064453125, -0.899169921875, -0.73388671875, -0.568603515625, -0.4033203125, -0.238037109375, -0.07275390625, 0.092529296875, 0.2578125, 0.423095703125, 0.58837890625, 0.753662109375, 0.9189453125, 1.084228515625, 1.24951171875, 1.414794921875, 1.580078125, 1.745361328125, 1.91064453125, 2.075927734375, 2.2412109375, 2.406494140625, 2.57177734375, 2.737060546875, 2.90234375, 3.067626953125, 3.23291015625, 3.398193359375, 3.5634765625, 3.728759765625, 3.89404296875, 4.059326171875, 4.224609375, 4.389892578125, 4.55517578125, 4.720458984375, 4.8857421875, 5.051025390625, 5.21630859375, 5.381591796875, 5.546875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 15.0, 12.0, 18.0, 16.0, 27.0, 21.0, 28.0, 40.0, 65.0, 110.0, 181.0, 444.0, 909.0, 2529.0, 8119.0, 53362.0, 2634385.0, 1448138.0, 35344.0, 6705.0, 2119.0, 863.0, 339.0, 152.0, 84.0, 53.0, 37.0, 28.0, 28.0, 14.0, 20.0, 15.0, 9.0, 12.0, 1.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.866455078125, -19.15478515625, -18.443115234375, -17.7314453125, -17.019775390625, -16.30810546875, -15.596435546875, -14.884765625, -14.173095703125, -13.46142578125, -12.749755859375, -12.0380859375, -11.326416015625, -10.61474609375, -9.903076171875, -9.19140625, -8.479736328125, -7.76806640625, -7.056396484375, -6.3447265625, -5.633056640625, -4.92138671875, -4.209716796875, -3.498046875, -2.786376953125, -2.07470703125, -1.363037109375, -0.6513671875, 0.060302734375, 0.77197265625, 1.483642578125, 2.1953125, 2.906982421875, 3.61865234375, 4.330322265625, 5.0419921875, 5.753662109375, 6.46533203125, 7.177001953125, 7.888671875, 8.600341796875, 9.31201171875, 10.023681640625, 10.7353515625, 11.447021484375, 12.15869140625, 12.870361328125, 13.58203125, 14.293701171875, 15.00537109375, 15.717041015625, 16.4287109375, 17.140380859375, 17.85205078125, 18.563720703125, 19.275390625, 19.987060546875, 20.69873046875, 21.410400390625, 22.1220703125, 22.833740234375, 23.54541015625, 24.257080078125, 24.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 2.0, 12.0, 8.0, 12.0, 8.0, 10.0, 11.0, 20.0, 16.0, 25.0, 32.0, 49.0, 67.0, 95.0, 117.0, 185.0, 228.0, 321.0, 390.0, 470.0, 478.0, 385.0, 319.0, 196.0, 163.0, 115.0, 81.0, 57.0, 35.0, 31.0, 28.0, 21.0, 12.0, 17.0, 12.0, 10.0, 8.0, 4.0, 1.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.18359375, -6.97076416015625, -6.7579345703125, -6.54510498046875, -6.332275390625, -6.11944580078125, -5.9066162109375, -5.69378662109375, -5.48095703125, -5.26812744140625, -5.0552978515625, -4.84246826171875, -4.629638671875, -4.41680908203125, -4.2039794921875, -3.99114990234375, -3.7783203125, -3.56549072265625, -3.3526611328125, -3.13983154296875, -2.927001953125, -2.71417236328125, -2.5013427734375, -2.28851318359375, -2.07568359375, -1.86285400390625, -1.6500244140625, -1.43719482421875, -1.224365234375, -1.01153564453125, -0.7987060546875, -0.58587646484375, -0.373046875, -0.16021728515625, 0.0526123046875, 0.26544189453125, 0.478271484375, 0.69110107421875, 0.9039306640625, 1.11676025390625, 1.32958984375, 1.54241943359375, 1.7552490234375, 1.96807861328125, 2.180908203125, 2.39373779296875, 2.6065673828125, 2.81939697265625, 3.0322265625, 3.24505615234375, 3.4578857421875, 3.67071533203125, 3.883544921875, 4.09637451171875, 4.3092041015625, 4.52203369140625, 4.73486328125, 4.94769287109375, 5.1605224609375, 5.37335205078125, 5.586181640625, 5.79901123046875, 6.0118408203125, 6.22467041015625, 6.4375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 13.0, 8.0, 14.0, 20.0, 23.0, 26.0, 27.0, 23.0, 52.0, 82.0, 124.0, 272.0, 841.0, 3125.0, 15797.0, 178554.0, 3696109.0, 273952.0, 19540.0, 3895.0, 1036.0, 313.0, 140.0, 77.0, 41.0, 39.0, 35.0, 24.0, 15.0, 27.0, 8.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.734619140625, -25.93798828125, -25.141357421875, -24.3447265625, -23.548095703125, -22.75146484375, -21.954833984375, -21.158203125, -20.361572265625, -19.56494140625, -18.768310546875, -17.9716796875, -17.175048828125, -16.37841796875, -15.581787109375, -14.78515625, -13.988525390625, -13.19189453125, -12.395263671875, -11.5986328125, -10.802001953125, -10.00537109375, -9.208740234375, -8.412109375, -7.615478515625, -6.81884765625, -6.022216796875, -5.2255859375, -4.428955078125, -3.63232421875, -2.835693359375, -2.0390625, -1.242431640625, -0.44580078125, 0.350830078125, 1.1474609375, 1.944091796875, 2.74072265625, 3.537353515625, 4.333984375, 5.130615234375, 5.92724609375, 6.723876953125, 7.5205078125, 8.317138671875, 9.11376953125, 9.910400390625, 10.70703125, 11.503662109375, 12.30029296875, 13.096923828125, 13.8935546875, 14.690185546875, 15.48681640625, 16.283447265625, 17.080078125, 17.876708984375, 18.67333984375, 19.469970703125, 20.2666015625, 21.063232421875, 21.85986328125, 22.656494140625, 23.453125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 15.0, 178.0, 578.0, 224.0, 17.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-326.8696594238281, -321.08831787109375, -315.3070068359375, -309.5256652832031, -303.7443542480469, -297.9630126953125, -292.18170166015625, -286.4003601074219, -280.6190490722656, -274.83770751953125, -269.056396484375, -263.2750549316406, -257.4937438964844, -251.71241760253906, -245.93109130859375, -240.14976501464844, -234.36843872070312, -228.5871124267578, -222.8057861328125, -217.0244598388672, -211.24313354492188, -205.46180725097656, -199.68048095703125, -193.89915466308594, -188.11781311035156, -182.33648681640625, -176.55516052246094, -170.77383422851562, -164.9925079345703, -159.211181640625, -153.4298553466797, -147.64852905273438, -141.8671875, -136.0858612060547, -130.30453491210938, -124.52320861816406, -118.74188232421875, -112.96055603027344, -107.17922973632812, -101.39790344238281, -95.6165771484375, -89.83525085449219, -84.05392456054688, -78.27259826660156, -72.49127197265625, -66.70994567871094, -60.92861557006836, -55.14728927612305, -49.365962982177734, -43.58463668823242, -37.80331039428711, -32.02198028564453, -26.24065589904785, -20.45932960510254, -14.678001403808594, -8.896675109863281, -3.1153488159179688, 2.665977954864502, 8.447304725646973, 14.228631973266602, 20.009958267211914, 25.791284561157227, 31.572612762451172, 37.353939056396484, 43.1352653503418]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 4.0, 10.0, 10.0, 14.0, 10.0, 18.0, 17.0, 20.0, 14.0, 27.0, 26.0, 20.0, 35.0, 30.0, 30.0, 34.0, 33.0, 40.0, 46.0, 32.0, 46.0, 41.0, 38.0, 33.0, 36.0, 36.0, 39.0, 28.0, 33.0, 23.0, 25.0, 27.0, 12.0, 13.0, 15.0, 13.0, 12.0, 11.0, 11.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-26.38810157775879, -25.64605140686035, -24.904001235961914, -24.161951065063477, -23.419902801513672, -22.677852630615234, -21.935802459716797, -21.19375228881836, -20.451702117919922, -19.709651947021484, -18.967601776123047, -18.22555160522461, -17.483501434326172, -16.741453170776367, -15.99940299987793, -15.257352828979492, -14.515302658081055, -13.773252487182617, -13.03120231628418, -12.289153099060059, -11.547102928161621, -10.805052757263184, -10.063003540039062, -9.320953369140625, -8.578903198242188, -7.83685302734375, -7.094803333282471, -6.352753639221191, -5.610703468322754, -4.868653297424316, -4.126603603363037, -3.384553909301758, -2.642505645751953, -1.9004557132720947, -1.1584057807922363, -0.41635584831237793, 0.32569408416748047, 1.0677440166473389, 1.8097939491271973, 2.5518436431884766, 3.293893814086914, 4.035943984985352, 4.777993679046631, 5.52004337310791, 6.262093544006348, 7.004143714904785, 7.7461934089660645, 8.488243103027344, 9.230293273925781, 9.972343444824219, 10.714393615722656, 11.456442832946777, 12.198493003845215, 12.940543174743652, 13.682592391967773, 14.424642562866211, 15.166692733764648, 15.908742904663086, 16.650793075561523, 17.39284324645996, 18.134891510009766, 18.876941680908203, 19.61899185180664, 20.361042022705078, 21.103092193603516]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 5.0, 11.0, 8.0, 10.0, 21.0, 25.0, 23.0, 20.0, 16.0, 30.0, 29.0, 38.0, 39.0, 44.0, 44.0, 46.0, 37.0, 54.0, 48.0, 56.0, 40.0, 33.0, 31.0, 37.0, 33.0, 33.0, 25.0, 24.0, 29.0, 11.0, 5.0, 18.0, 10.0, 11.0, 17.0, 12.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.89410400390625, -4.7257080078125, -4.55731201171875, -4.388916015625, -4.22052001953125, -4.0521240234375, -3.88372802734375, -3.71533203125, -3.54693603515625, -3.3785400390625, -3.21014404296875, -3.041748046875, -2.87335205078125, -2.7049560546875, -2.53656005859375, -2.3681640625, -2.19976806640625, -2.0313720703125, -1.86297607421875, -1.694580078125, -1.52618408203125, -1.3577880859375, -1.18939208984375, -1.02099609375, -0.85260009765625, -0.6842041015625, -0.51580810546875, -0.347412109375, -0.17901611328125, -0.0106201171875, 0.15777587890625, 0.326171875, 0.49456787109375, 0.6629638671875, 0.83135986328125, 0.999755859375, 1.16815185546875, 1.3365478515625, 1.50494384765625, 1.67333984375, 1.84173583984375, 2.0101318359375, 2.17852783203125, 2.346923828125, 2.51531982421875, 2.6837158203125, 2.85211181640625, 3.0205078125, 3.18890380859375, 3.3572998046875, 3.52569580078125, 3.694091796875, 3.86248779296875, 4.0308837890625, 4.19927978515625, 4.36767578125, 4.53607177734375, 4.7044677734375, 4.87286376953125, 5.041259765625, 5.20965576171875, 5.3780517578125, 5.54644775390625, 5.71484375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 8.0, 15.0, 14.0, 17.0, 32.0, 61.0, 87.0, 162.0, 204.0, 361.0, 619.0, 1106.0, 2134.0, 4037.0, 7778.0, 16249.0, 34627.0, 79972.0, 181366.0, 297938.0, 227758.0, 106486.0, 45937.0, 20723.0, 9833.0, 5001.0, 2646.0, 1438.0, 733.0, 468.0, 285.0, 174.0, 87.0, 76.0, 44.0, 28.0, 23.0, 12.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.9476165771484375, -0.917694091796875, -0.8877716064453125, -0.85784912109375, -0.8279266357421875, -0.798004150390625, -0.7680816650390625, -0.7381591796875, -0.7082366943359375, -0.678314208984375, -0.6483917236328125, -0.61846923828125, -0.5885467529296875, -0.558624267578125, -0.5287017822265625, -0.498779296875, -0.4688568115234375, -0.438934326171875, -0.4090118408203125, -0.37908935546875, -0.3491668701171875, -0.319244384765625, -0.2893218994140625, -0.2593994140625, -0.2294769287109375, -0.199554443359375, -0.1696319580078125, -0.13970947265625, -0.1097869873046875, -0.079864501953125, -0.0499420166015625, -0.02001953125, 0.0099029541015625, 0.039825439453125, 0.0697479248046875, 0.09967041015625, 0.1295928955078125, 0.159515380859375, 0.1894378662109375, 0.2193603515625, 0.2492828369140625, 0.279205322265625, 0.3091278076171875, 0.33905029296875, 0.3689727783203125, 0.398895263671875, 0.4288177490234375, 0.458740234375, 0.4886627197265625, 0.518585205078125, 0.5485076904296875, 0.57843017578125, 0.6083526611328125, 0.638275146484375, 0.6681976318359375, 0.6981201171875, 0.7280426025390625, 0.757965087890625, 0.7878875732421875, 0.81781005859375, 0.8477325439453125, 0.877655029296875, 0.9075775146484375, 0.9375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 11.0, 6.0, 7.0, 16.0, 18.0, 21.0, 27.0, 20.0, 42.0, 24.0, 40.0, 34.0, 46.0, 36.0, 43.0, 40.0, 38.0, 1072.0, 35.0, 47.0, 44.0, 41.0, 40.0, 33.0, 36.0, 18.0, 19.0, 20.0, 25.0, 12.0, 14.0, 15.0, 9.0, 18.0, 10.0, 4.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.677734375, -3.566497802734375, -3.45526123046875, -3.344024658203125, -3.2327880859375, -3.121551513671875, -3.01031494140625, -2.899078369140625, -2.787841796875, -2.676605224609375, -2.56536865234375, -2.454132080078125, -2.3428955078125, -2.231658935546875, -2.12042236328125, -2.009185791015625, -1.89794921875, -1.786712646484375, -1.67547607421875, -1.564239501953125, -1.4530029296875, -1.341766357421875, -1.23052978515625, -1.119293212890625, -1.008056640625, -0.896820068359375, -0.78558349609375, -0.674346923828125, -0.5631103515625, -0.451873779296875, -0.34063720703125, -0.229400634765625, -0.1181640625, -0.006927490234375, 0.10430908203125, 0.215545654296875, 0.3267822265625, 0.438018798828125, 0.54925537109375, 0.660491943359375, 0.771728515625, 0.882965087890625, 0.99420166015625, 1.105438232421875, 1.2166748046875, 1.327911376953125, 1.43914794921875, 1.550384521484375, 1.66162109375, 1.772857666015625, 1.88409423828125, 1.995330810546875, 2.1065673828125, 2.217803955078125, 2.32904052734375, 2.440277099609375, 2.551513671875, 2.662750244140625, 2.77398681640625, 2.885223388671875, 2.9964599609375, 3.107696533203125, 3.21893310546875, 3.330169677734375, 3.44140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 10.0, 17.0, 32.0, 38.0, 78.0, 105.0, 152.0, 241.0, 411.0, 691.0, 1171.0, 2099.0, 4037.0, 8292.0, 18200.0, 43575.0, 110210.0, 320262.0, 1191999.0, 240743.0, 88882.0, 35562.0, 15232.0, 7066.0, 3480.0, 1902.0, 1023.0, 599.0, 382.0, 208.0, 121.0, 109.0, 47.0, 41.0, 22.0, 26.0, 15.0, 11.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.62890625, -0.6100692749023438, -0.5912322998046875, -0.5723953247070312, -0.553558349609375, -0.5347213745117188, -0.5158843994140625, -0.49704742431640625, -0.47821044921875, -0.45937347412109375, -0.4405364990234375, -0.42169952392578125, -0.402862548828125, -0.38402557373046875, -0.3651885986328125, -0.34635162353515625, -0.3275146484375, -0.30867767333984375, -0.2898406982421875, -0.27100372314453125, -0.252166748046875, -0.23332977294921875, -0.2144927978515625, -0.19565582275390625, -0.17681884765625, -0.15798187255859375, -0.1391448974609375, -0.12030792236328125, -0.101470947265625, -0.08263397216796875, -0.0637969970703125, -0.04496002197265625, -0.026123046875, -0.00728607177734375, 0.0115509033203125, 0.03038787841796875, 0.049224853515625, 0.06806182861328125, 0.0868988037109375, 0.10573577880859375, 0.12457275390625, 0.14340972900390625, 0.1622467041015625, 0.18108367919921875, 0.199920654296875, 0.21875762939453125, 0.2375946044921875, 0.25643157958984375, 0.2752685546875, 0.29410552978515625, 0.3129425048828125, 0.33177947998046875, 0.350616455078125, 0.36945343017578125, 0.3882904052734375, 0.40712738037109375, 0.42596435546875, 0.44480133056640625, 0.4636383056640625, 0.48247528076171875, 0.501312255859375, 0.5201492309570312, 0.5389862060546875, 0.5578231811523438, 0.57666015625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 5.0, 6.0, 3.0, 6.0, 8.0, 9.0, 13.0, 10.0, 16.0, 36.0, 26.0, 38.0, 59.0, 98.0, 145.0, 153.0, 94.0, 51.0, 45.0, 39.0, 28.0, 22.0, 13.0, 6.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10364437103271484, -0.10029411315917969, -0.09694385528564453, -0.09359359741210938, -0.09024333953857422, -0.08689308166503906, -0.0835428237915039, -0.08019256591796875, -0.0768423080444336, -0.07349205017089844, -0.07014179229736328, -0.06679153442382812, -0.06344127655029297, -0.06009101867675781, -0.056740760803222656, -0.0533905029296875, -0.050040245056152344, -0.04668998718261719, -0.04333972930908203, -0.039989471435546875, -0.03663921356201172, -0.03328895568847656, -0.029938697814941406, -0.02658843994140625, -0.023238182067871094, -0.019887924194335938, -0.01653766632080078, -0.013187408447265625, -0.009837150573730469, -0.0064868927001953125, -0.0031366348266601562, 0.000213623046875, 0.0035638809204101562, 0.0069141387939453125, 0.010264396667480469, 0.013614654541015625, 0.01696491241455078, 0.020315170288085938, 0.023665428161621094, 0.02701568603515625, 0.030365943908691406, 0.03371620178222656, 0.03706645965576172, 0.040416717529296875, 0.04376697540283203, 0.04711723327636719, 0.050467491149902344, 0.0538177490234375, 0.057168006896972656, 0.06051826477050781, 0.06386852264404297, 0.06721878051757812, 0.07056903839111328, 0.07391929626464844, 0.0772695541381836, 0.08061981201171875, 0.0839700698852539, 0.08732032775878906, 0.09067058563232422, 0.09402084350585938, 0.09737110137939453, 0.10072135925292969, 0.10407161712646484, 0.107421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 7.0, 17.0, 26.0, 35.0, 39.0, 70.0, 117.0, 235.0, 638.0, 47750.0, 997871.0, 1039.0, 308.0, 119.0, 79.0, 48.0, 28.0, 24.0, 14.0, 13.0, 9.0, 7.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.951202392578125, -2.86724853515625, -2.783294677734375, -2.6993408203125, -2.615386962890625, -2.53143310546875, -2.447479248046875, -2.363525390625, -2.279571533203125, -2.19561767578125, -2.111663818359375, -2.0277099609375, -1.943756103515625, -1.85980224609375, -1.775848388671875, -1.69189453125, -1.607940673828125, -1.52398681640625, -1.440032958984375, -1.3560791015625, -1.272125244140625, -1.18817138671875, -1.104217529296875, -1.020263671875, -0.936309814453125, -0.85235595703125, -0.768402099609375, -0.6844482421875, -0.600494384765625, -0.51654052734375, -0.432586669921875, -0.3486328125, -0.264678955078125, -0.18072509765625, -0.096771240234375, -0.0128173828125, 0.071136474609375, 0.15509033203125, 0.239044189453125, 0.322998046875, 0.406951904296875, 0.49090576171875, 0.574859619140625, 0.6588134765625, 0.742767333984375, 0.82672119140625, 0.910675048828125, 0.99462890625, 1.078582763671875, 1.16253662109375, 1.246490478515625, 1.3304443359375, 1.414398193359375, 1.49835205078125, 1.582305908203125, 1.666259765625, 1.750213623046875, 1.83416748046875, 1.918121337890625, 2.0020751953125, 2.086029052734375, 2.16998291015625, 2.253936767578125, 2.337890625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 26.0, 110.0, 223.0, 364.0, 191.0, 65.0, 14.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4099210202693939, -0.4008985757827759, -0.3918761610984802, -0.3828537166118622, -0.37383127212524414, -0.3648088276386261, -0.35578638315200806, -0.3467639684677124, -0.33774152398109436, -0.3287190794944763, -0.31969666481018066, -0.3106742203235626, -0.3016517758369446, -0.29262933135032654, -0.2836068868637085, -0.27458447217941284, -0.2655620276927948, -0.25653958320617676, -0.2475171536207199, -0.23849472403526306, -0.22947227954864502, -0.22044983506202698, -0.21142740547657013, -0.20240497589111328, -0.19338253140449524, -0.1843600869178772, -0.17533765733242035, -0.1663152277469635, -0.15729278326034546, -0.14827033877372742, -0.13924790918827057, -0.13022547960281372, -0.12120306491851807, -0.11218062788248062, -0.10315819084644318, -0.09413575381040573, -0.08511331677436829, -0.07609087973833084, -0.0670684427022934, -0.05804600566625595, -0.049023568630218506, -0.04000113159418106, -0.030978694558143616, -0.02195625752210617, -0.012933820486068726, -0.0039113834500312805, 0.0051110535860061646, 0.01413349062204361, 0.023155927658081055, 0.0321783646941185, 0.041200801730155945, 0.05022323876619339, 0.059245675802230835, 0.06826811283826828, 0.07729054987430573, 0.08631298691034317, 0.09533542394638062, 0.10435786098241806, 0.1133802980184555, 0.12240273505449295, 0.1314251720905304, 0.14044761657714844, 0.14947004616260529, 0.15849247574806213, 0.16751492023468018]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 8.0, 8.0, 13.0, 9.0, 10.0, 17.0, 22.0, 19.0, 27.0, 27.0, 34.0, 42.0, 37.0, 40.0, 46.0, 48.0, 53.0, 41.0, 42.0, 46.0, 48.0, 42.0, 30.0, 35.0, 31.0, 25.0, 33.0, 22.0, 18.0, 22.0, 15.0, 14.0, 14.0, 13.0, 13.0, 9.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0960661768913269, -0.09268291294574738, -0.08929964900016785, -0.08591638505458832, -0.08253312110900879, -0.07914985716342926, -0.07576659321784973, -0.0723833292722702, -0.06900006532669067, -0.06561680138111115, -0.062233537435531616, -0.05885027348995209, -0.05546700954437256, -0.05208374559879303, -0.0487004816532135, -0.04531721770763397, -0.04193395376205444, -0.038550689816474915, -0.035167425870895386, -0.03178416192531586, -0.028400897979736328, -0.0250176340341568, -0.02163437008857727, -0.01825110614299774, -0.014867842197418213, -0.011484578251838684, -0.008101314306259155, -0.0047180503606796265, -0.0013347864151000977, 0.002048477530479431, 0.00543174147605896, 0.008815005421638489, 0.012198269367218018, 0.015581533312797546, 0.018964797258377075, 0.022348061203956604, 0.025731325149536133, 0.02911458909511566, 0.03249785304069519, 0.03588111698627472, 0.03926438093185425, 0.04264764487743378, 0.046030908823013306, 0.049414172768592834, 0.05279743671417236, 0.05618070065975189, 0.05956396460533142, 0.06294722855091095, 0.06633049249649048, 0.06971375644207001, 0.07309702038764954, 0.07648028433322906, 0.0798635482788086, 0.08324681222438812, 0.08663007616996765, 0.09001334011554718, 0.09339660406112671, 0.09677986800670624, 0.10016313195228577, 0.1035463958978653, 0.10692965984344482, 0.11031292378902435, 0.11369618773460388, 0.11707945168018341, 0.12046271562576294]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 10.0, 11.0, 5.0, 12.0, 10.0, 18.0, 21.0, 29.0, 25.0, 25.0, 25.0, 30.0, 47.0, 58.0, 46.0, 46.0, 50.0, 38.0, 48.0, 43.0, 42.0, 32.0, 36.0, 29.0, 38.0, 35.0, 34.0, 23.0, 15.0, 18.0, 15.0, 10.0, 8.0, 11.0, 13.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.55859375, -5.3896484375, -5.220703125, -5.0517578125, -4.8828125, -4.7138671875, -4.544921875, -4.3759765625, -4.20703125, -4.0380859375, -3.869140625, -3.7001953125, -3.53125, -3.3623046875, -3.193359375, -3.0244140625, -2.85546875, -2.6865234375, -2.517578125, -2.3486328125, -2.1796875, -2.0107421875, -1.841796875, -1.6728515625, -1.50390625, -1.3349609375, -1.166015625, -0.9970703125, -0.828125, -0.6591796875, -0.490234375, -0.3212890625, -0.15234375, 0.0166015625, 0.185546875, 0.3544921875, 0.5234375, 0.6923828125, 0.861328125, 1.0302734375, 1.19921875, 1.3681640625, 1.537109375, 1.7060546875, 1.875, 2.0439453125, 2.212890625, 2.3818359375, 2.55078125, 2.7197265625, 2.888671875, 3.0576171875, 3.2265625, 3.3955078125, 3.564453125, 3.7333984375, 3.90234375, 4.0712890625, 4.240234375, 4.4091796875, 4.578125, 4.7470703125, 4.916015625, 5.0849609375, 5.25390625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 4.0, 13.0, 18.0, 39.0, 44.0, 54.0, 75.0, 111.0, 173.0, 245.0, 297.0, 525.0, 736.0, 1053.0, 1673.0, 2449.0, 3916.0, 6405.0, 11455.0, 20372.0, 38617.0, 79709.0, 178293.0, 301537.0, 207647.0, 93243.0, 44579.0, 23116.0, 12505.0, 7171.0, 4323.0, 2686.0, 1786.0, 1136.0, 774.0, 569.0, 384.0, 235.0, 184.0, 105.0, 89.0, 50.0, 57.0, 38.0, 18.0, 13.0, 5.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.83984375, -5.655029296875, -5.47021484375, -5.285400390625, -5.1005859375, -4.915771484375, -4.73095703125, -4.546142578125, -4.361328125, -4.176513671875, -3.99169921875, -3.806884765625, -3.6220703125, -3.437255859375, -3.25244140625, -3.067626953125, -2.8828125, -2.697998046875, -2.51318359375, -2.328369140625, -2.1435546875, -1.958740234375, -1.77392578125, -1.589111328125, -1.404296875, -1.219482421875, -1.03466796875, -0.849853515625, -0.6650390625, -0.480224609375, -0.29541015625, -0.110595703125, 0.07421875, 0.259033203125, 0.44384765625, 0.628662109375, 0.8134765625, 0.998291015625, 1.18310546875, 1.367919921875, 1.552734375, 1.737548828125, 1.92236328125, 2.107177734375, 2.2919921875, 2.476806640625, 2.66162109375, 2.846435546875, 3.03125, 3.216064453125, 3.40087890625, 3.585693359375, 3.7705078125, 3.955322265625, 4.14013671875, 4.324951171875, 4.509765625, 4.694580078125, 4.87939453125, 5.064208984375, 5.2490234375, 5.433837890625, 5.61865234375, 5.803466796875, 5.98828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 4.0, 14.0, 11.0, 15.0, 16.0, 19.0, 25.0, 14.0, 28.0, 32.0, 34.0, 29.0, 41.0, 53.0, 79.0, 89.0, 203.0, 1321.0, 305.0, 203.0, 116.0, 50.0, 48.0, 43.0, 35.0, 42.0, 36.0, 23.0, 18.0, 25.0, 18.0, 13.0, 13.0, 8.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.4869384765625, -11.059814453125, -10.6326904296875, -10.20556640625, -9.7784423828125, -9.351318359375, -8.9241943359375, -8.4970703125, -8.0699462890625, -7.642822265625, -7.2156982421875, -6.78857421875, -6.3614501953125, -5.934326171875, -5.5072021484375, -5.080078125, -4.6529541015625, -4.225830078125, -3.7987060546875, -3.37158203125, -2.9444580078125, -2.517333984375, -2.0902099609375, -1.6630859375, -1.2359619140625, -0.808837890625, -0.3817138671875, 0.04541015625, 0.4725341796875, 0.899658203125, 1.3267822265625, 1.75390625, 2.1810302734375, 2.608154296875, 3.0352783203125, 3.46240234375, 3.8895263671875, 4.316650390625, 4.7437744140625, 5.1708984375, 5.5980224609375, 6.025146484375, 6.4522705078125, 6.87939453125, 7.3065185546875, 7.733642578125, 8.1607666015625, 8.587890625, 9.0150146484375, 9.442138671875, 9.8692626953125, 10.29638671875, 10.7235107421875, 11.150634765625, 11.5777587890625, 12.0048828125, 12.4320068359375, 12.859130859375, 13.2862548828125, 13.71337890625, 14.1405029296875, 14.567626953125, 14.9947509765625, 15.421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 5.0, 5.0, 15.0, 10.0, 14.0, 16.0, 20.0, 39.0, 31.0, 38.0, 61.0, 63.0, 97.0, 126.0, 196.0, 294.0, 555.0, 1525.0, 6545.0, 57163.0, 2499861.0, 550520.0, 22408.0, 3644.0, 988.0, 497.0, 282.0, 196.0, 113.0, 88.0, 76.0, 44.0, 34.0, 28.0, 19.0, 14.0, 16.0, 12.0, 11.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-22.453125, -21.768798828125, -21.08447265625, -20.400146484375, -19.7158203125, -19.031494140625, -18.34716796875, -17.662841796875, -16.978515625, -16.294189453125, -15.60986328125, -14.925537109375, -14.2412109375, -13.556884765625, -12.87255859375, -12.188232421875, -11.50390625, -10.819580078125, -10.13525390625, -9.450927734375, -8.7666015625, -8.082275390625, -7.39794921875, -6.713623046875, -6.029296875, -5.344970703125, -4.66064453125, -3.976318359375, -3.2919921875, -2.607666015625, -1.92333984375, -1.239013671875, -0.5546875, 0.129638671875, 0.81396484375, 1.498291015625, 2.1826171875, 2.866943359375, 3.55126953125, 4.235595703125, 4.919921875, 5.604248046875, 6.28857421875, 6.972900390625, 7.6572265625, 8.341552734375, 9.02587890625, 9.710205078125, 10.39453125, 11.078857421875, 11.76318359375, 12.447509765625, 13.1318359375, 13.816162109375, 14.50048828125, 15.184814453125, 15.869140625, 16.553466796875, 17.23779296875, 17.922119140625, 18.6064453125, 19.290771484375, 19.97509765625, 20.659423828125, 21.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 18.0, 31.0, 73.0, 133.0, 167.0, 208.0, 180.0, 98.0, 51.0, 23.0, 15.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.9676513671875, -55.588401794433594, -54.20914840698242, -52.829898834228516, -51.450645446777344, -50.07139587402344, -48.692142486572266, -47.31289291381836, -45.93363952636719, -44.55438995361328, -43.17513656616211, -41.7958869934082, -40.41663360595703, -39.037384033203125, -37.65813064575195, -36.27888107299805, -34.899627685546875, -33.52037811279297, -32.1411247253418, -30.761873245239258, -29.38262176513672, -28.00337028503418, -26.62411880493164, -25.244869232177734, -23.865619659423828, -22.48636817932129, -21.10711669921875, -19.72786521911621, -18.348613739013672, -16.969362258911133, -15.59011173248291, -14.210860252380371, -12.831607818603516, -11.452356338500977, -10.073104858398438, -8.693853378295898, -7.314602375030518, -5.9353508949279785, -4.556099891662598, -3.1768484115600586, -1.7975969314575195, -0.41834557056427, 0.9609057903289795, 2.3401570320129395, 3.7194085121154785, 5.098659992218018, 6.477910995483398, 7.8571624755859375, 9.236413955688477, 10.615665435791016, 11.994916915893555, 13.374168395996094, 14.753419876098633, 16.132671356201172, 17.511920928955078, 18.89117431640625, 20.270423889160156, 21.649675369262695, 23.028926849365234, 24.408178329467773, 25.787429809570312, 27.16668128967285, 28.54593276977539, 29.925182342529297, 31.30443572998047]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 6.0, 6.0, 12.0, 9.0, 10.0, 19.0, 18.0, 18.0, 26.0, 24.0, 21.0, 38.0, 32.0, 39.0, 31.0, 38.0, 41.0, 41.0, 49.0, 39.0, 35.0, 54.0, 43.0, 40.0, 43.0, 36.0, 29.0, 19.0, 18.0, 24.0, 17.0, 23.0, 17.0, 13.0, 11.0, 15.0, 12.0, 7.0, 5.0, 1.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.83474349975586, -26.905654907226562, -25.976564407348633, -25.047475814819336, -24.11838722229004, -23.18929672241211, -22.260208129882812, -21.331119537353516, -20.40203094482422, -19.472942352294922, -18.543851852416992, -17.614763259887695, -16.6856746673584, -15.756585121154785, -14.827495574951172, -13.898406982421875, -12.969316482543945, -12.040226936340332, -11.111138343811035, -10.182048797607422, -9.252960205078125, -8.323870658874512, -7.394781112670898, -6.465692043304443, -5.536602973937988, -4.607513904571533, -3.678424596786499, -2.749335289001465, -1.8202462196350098, -0.8911571502685547, 0.037932395935058594, 0.9670214653015137, 1.896108627319336, 2.825197696685791, 3.754287004470825, 4.683376312255859, 5.6124653816223145, 6.5415544509887695, 7.470643997192383, 8.39973258972168, 9.328822135925293, 10.257911682128906, 11.187000274658203, 12.116089820861816, 13.04517936706543, 13.974267959594727, 14.90335750579834, 15.832447052001953, 16.76153564453125, 17.690624237060547, 18.619714736938477, 19.548803329467773, 20.47789192199707, 21.406982421875, 22.336071014404297, 23.265159606933594, 24.19424819946289, 25.123336791992188, 26.052427291870117, 26.981515884399414, 27.91060447692871, 28.83969497680664, 29.768783569335938, 30.697872161865234, 31.626962661743164]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 11.0, 7.0, 6.0, 13.0, 12.0, 14.0, 17.0, 26.0, 21.0, 37.0, 35.0, 31.0, 37.0, 39.0, 55.0, 49.0, 41.0, 31.0, 51.0, 39.0, 59.0, 35.0, 41.0, 42.0, 31.0, 29.0, 29.0, 26.0, 22.0, 21.0, 15.0, 9.0, 7.0, 10.0, 7.0, 5.0, 5.0, 7.0, 10.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.70111083984375, -4.5272216796875, -4.35333251953125, -4.179443359375, -4.00555419921875, -3.8316650390625, -3.65777587890625, -3.48388671875, -3.30999755859375, -3.1361083984375, -2.96221923828125, -2.788330078125, -2.61444091796875, -2.4405517578125, -2.26666259765625, -2.0927734375, -1.91888427734375, -1.7449951171875, -1.57110595703125, -1.397216796875, -1.22332763671875, -1.0494384765625, -0.87554931640625, -0.70166015625, -0.52777099609375, -0.3538818359375, -0.17999267578125, -0.006103515625, 0.16778564453125, 0.3416748046875, 0.51556396484375, 0.689453125, 0.86334228515625, 1.0372314453125, 1.21112060546875, 1.385009765625, 1.55889892578125, 1.7327880859375, 1.90667724609375, 2.08056640625, 2.25445556640625, 2.4283447265625, 2.60223388671875, 2.776123046875, 2.95001220703125, 3.1239013671875, 3.29779052734375, 3.4716796875, 3.64556884765625, 3.8194580078125, 3.99334716796875, 4.167236328125, 4.34112548828125, 4.5150146484375, 4.68890380859375, 4.86279296875, 5.03668212890625, 5.2105712890625, 5.38446044921875, 5.558349609375, 5.73223876953125, 5.9061279296875, 6.08001708984375, 6.25390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 2.0, 7.0, 6.0, 11.0, 10.0, 10.0, 17.0, 30.0, 33.0, 33.0, 45.0, 54.0, 71.0, 85.0, 127.0, 188.0, 299.0, 489.0, 1183.0, 8085.0, 2394482.0, 1779035.0, 7322.0, 1223.0, 456.0, 271.0, 169.0, 128.0, 92.0, 76.0, 44.0, 42.0, 30.0, 20.0, 25.0, 15.0, 12.0, 13.0, 8.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-45.34375, -44.00927734375, -42.6748046875, -41.34033203125, -40.005859375, -38.67138671875, -37.3369140625, -36.00244140625, -34.66796875, -33.33349609375, -31.9990234375, -30.66455078125, -29.330078125, -27.99560546875, -26.6611328125, -25.32666015625, -23.9921875, -22.65771484375, -21.3232421875, -19.98876953125, -18.654296875, -17.31982421875, -15.9853515625, -14.65087890625, -13.31640625, -11.98193359375, -10.6474609375, -9.31298828125, -7.978515625, -6.64404296875, -5.3095703125, -3.97509765625, -2.640625, -1.30615234375, 0.0283203125, 1.36279296875, 2.697265625, 4.03173828125, 5.3662109375, 6.70068359375, 8.03515625, 9.36962890625, 10.7041015625, 12.03857421875, 13.373046875, 14.70751953125, 16.0419921875, 17.37646484375, 18.7109375, 20.04541015625, 21.3798828125, 22.71435546875, 24.048828125, 25.38330078125, 26.7177734375, 28.05224609375, 29.38671875, 30.72119140625, 32.0556640625, 33.39013671875, 34.724609375, 36.05908203125, 37.3935546875, 38.72802734375, 40.0625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 15.0, 10.0, 16.0, 20.0, 36.0, 50.0, 75.0, 117.0, 122.0, 176.0, 341.0, 506.0, 674.0, 577.0, 430.0, 293.0, 191.0, 128.0, 66.0, 43.0, 36.0, 32.0, 20.0, 17.0, 15.0, 6.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.5855712890625, -7.311767578125, -7.0379638671875, -6.76416015625, -6.4903564453125, -6.216552734375, -5.9427490234375, -5.6689453125, -5.3951416015625, -5.121337890625, -4.8475341796875, -4.57373046875, -4.2999267578125, -4.026123046875, -3.7523193359375, -3.478515625, -3.2047119140625, -2.930908203125, -2.6571044921875, -2.38330078125, -2.1094970703125, -1.835693359375, -1.5618896484375, -1.2880859375, -1.0142822265625, -0.740478515625, -0.4666748046875, -0.19287109375, 0.0809326171875, 0.354736328125, 0.6285400390625, 0.90234375, 1.1761474609375, 1.449951171875, 1.7237548828125, 1.99755859375, 2.2713623046875, 2.545166015625, 2.8189697265625, 3.0927734375, 3.3665771484375, 3.640380859375, 3.9141845703125, 4.18798828125, 4.4617919921875, 4.735595703125, 5.0093994140625, 5.283203125, 5.5570068359375, 5.830810546875, 6.1046142578125, 6.37841796875, 6.6522216796875, 6.926025390625, 7.1998291015625, 7.4736328125, 7.7474365234375, 8.021240234375, 8.2950439453125, 8.56884765625, 8.8426513671875, 9.116455078125, 9.3902587890625, 9.6640625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 8.0, 5.0, 15.0, 13.0, 21.0, 23.0, 25.0, 27.0, 33.0, 59.0, 82.0, 135.0, 280.0, 643.0, 1831.0, 8318.0, 63175.0, 2441202.0, 1618444.0, 49689.0, 7182.0, 1777.0, 540.0, 240.0, 124.0, 86.0, 67.0, 45.0, 36.0, 35.0, 18.0, 22.0, 19.0, 11.0, 12.0, 7.0, 8.0, 5.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.96875, -21.259033203125, -20.54931640625, -19.839599609375, -19.1298828125, -18.420166015625, -17.71044921875, -17.000732421875, -16.291015625, -15.581298828125, -14.87158203125, -14.161865234375, -13.4521484375, -12.742431640625, -12.03271484375, -11.322998046875, -10.61328125, -9.903564453125, -9.19384765625, -8.484130859375, -7.7744140625, -7.064697265625, -6.35498046875, -5.645263671875, -4.935546875, -4.225830078125, -3.51611328125, -2.806396484375, -2.0966796875, -1.386962890625, -0.67724609375, 0.032470703125, 0.7421875, 1.451904296875, 2.16162109375, 2.871337890625, 3.5810546875, 4.290771484375, 5.00048828125, 5.710205078125, 6.419921875, 7.129638671875, 7.83935546875, 8.549072265625, 9.2587890625, 9.968505859375, 10.67822265625, 11.387939453125, 12.09765625, 12.807373046875, 13.51708984375, 14.226806640625, 14.9365234375, 15.646240234375, 16.35595703125, 17.065673828125, 17.775390625, 18.485107421875, 19.19482421875, 19.904541015625, 20.6142578125, 21.323974609375, 22.03369140625, 22.743408203125, 23.453125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 63.0, 326.0, 504.0, 116.0, 5.0, 1.0, 1.0], "bins": [-290.0438537597656, -285.1431884765625, -280.2425231933594, -275.3418273925781, -270.441162109375, -265.5404968261719, -260.63983154296875, -255.73915100097656, -250.83848571777344, -245.9378204345703, -241.03713989257812, -236.136474609375, -231.2357940673828, -226.3351287841797, -221.4344482421875, -216.53378295898438, -211.63311767578125, -206.73245239257812, -201.83177185058594, -196.9311065673828, -192.03042602539062, -187.1297607421875, -182.22909545898438, -177.3284149169922, -172.427734375, -167.52706909179688, -162.6263885498047, -157.72572326660156, -152.82504272460938, -147.92437744140625, -143.02371215820312, -138.12303161621094, -133.2223663330078, -128.3217010498047, -123.4210205078125, -118.52035522460938, -113.61968231201172, -108.71900939941406, -103.8183364868164, -98.91766357421875, -94.01699829101562, -89.11632537841797, -84.21565246582031, -79.31498718261719, -74.41431427001953, -69.51364135742188, -64.61296844482422, -59.71229934692383, -54.81163024902344, -49.91095733642578, -45.01028823852539, -40.109615325927734, -35.208946228027344, -30.308273315429688, -25.40760040283203, -20.50693130493164, -15.606256484985352, -10.705585479736328, -5.804913520812988, -0.9042415618896484, 3.996429443359375, 8.897100448608398, 13.797773361206055, 18.698442459106445, 23.5991153717041]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 13.0, 14.0, 15.0, 25.0, 22.0, 26.0, 27.0, 32.0, 34.0, 26.0, 32.0, 48.0, 46.0, 43.0, 39.0, 42.0, 47.0, 51.0, 47.0, 48.0, 41.0, 32.0, 33.0, 32.0, 24.0, 27.0, 21.0, 20.0, 11.0, 9.0, 12.0, 14.0, 10.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.616117477416992, -25.726348876953125, -24.83658218383789, -23.946813583374023, -23.057044982910156, -22.167278289794922, -21.277509689331055, -20.387741088867188, -19.497974395751953, -18.608205795288086, -17.71843910217285, -16.828670501708984, -15.938902854919434, -15.049135208129883, -14.159366607666016, -13.269598960876465, -12.379831314086914, -11.490063667297363, -10.600296020507812, -9.710527420043945, -8.820759773254395, -7.930992126464844, -7.041224002838135, -6.151455879211426, -5.261688232421875, -4.371920585632324, -3.4821524620056152, -2.5923845767974854, -1.7026166915893555, -0.8128490447998047, 0.0769190788269043, 0.9666872024536133, 1.8564567565917969, 2.7462246417999268, 3.6359925270080566, 4.525760650634766, 5.415528297424316, 6.305295944213867, 7.195064067840576, 8.084832191467285, 8.974599838256836, 9.864367485046387, 10.754135131835938, 11.643903732299805, 12.533671379089355, 13.423439025878906, 14.313207626342773, 15.202975273132324, 16.092742919921875, 16.982511520385742, 17.872278213500977, 18.762046813964844, 19.651813507080078, 20.541582107543945, 21.431350708007812, 22.321117401123047, 23.210886001586914, 24.10065460205078, 24.990421295166016, 25.880189895629883, 26.76995849609375, 27.659725189208984, 28.54949378967285, 29.43926239013672, 30.329029083251953]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 10.0, 7.0, 5.0, 14.0, 15.0, 12.0, 29.0, 17.0, 21.0, 29.0, 27.0, 33.0, 39.0, 46.0, 42.0, 45.0, 35.0, 42.0, 44.0, 36.0, 44.0, 44.0, 34.0, 28.0, 39.0, 29.0, 30.0, 22.0, 28.0, 25.0, 23.0, 13.0, 18.0, 15.0, 12.0, 9.0, 5.0, 3.0, 1.0, 8.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.517822265625, -4.35986328125, -4.201904296875, -4.0439453125, -3.885986328125, -3.72802734375, -3.570068359375, -3.412109375, -3.254150390625, -3.09619140625, -2.938232421875, -2.7802734375, -2.622314453125, -2.46435546875, -2.306396484375, -2.1484375, -1.990478515625, -1.83251953125, -1.674560546875, -1.5166015625, -1.358642578125, -1.20068359375, -1.042724609375, -0.884765625, -0.726806640625, -0.56884765625, -0.410888671875, -0.2529296875, -0.094970703125, 0.06298828125, 0.220947265625, 0.37890625, 0.536865234375, 0.69482421875, 0.852783203125, 1.0107421875, 1.168701171875, 1.32666015625, 1.484619140625, 1.642578125, 1.800537109375, 1.95849609375, 2.116455078125, 2.2744140625, 2.432373046875, 2.59033203125, 2.748291015625, 2.90625, 3.064208984375, 3.22216796875, 3.380126953125, 3.5380859375, 3.696044921875, 3.85400390625, 4.011962890625, 4.169921875, 4.327880859375, 4.48583984375, 4.643798828125, 4.8017578125, 4.959716796875, 5.11767578125, 5.275634765625, 5.43359375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 7.0, 5.0, 22.0, 28.0, 25.0, 44.0, 70.0, 83.0, 132.0, 207.0, 279.0, 389.0, 525.0, 803.0, 1190.0, 1701.0, 2622.0, 4199.0, 6961.0, 12057.0, 23533.0, 51547.0, 131189.0, 308851.0, 286899.0, 117034.0, 46871.0, 21639.0, 11271.0, 6556.0, 4066.0, 2467.0, 1680.0, 1092.0, 790.0, 501.0, 354.0, 258.0, 178.0, 124.0, 88.0, 60.0, 46.0, 28.0, 21.0, 16.0, 8.0, 10.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6171875, -1.566558837890625, -1.51593017578125, -1.465301513671875, -1.4146728515625, -1.364044189453125, -1.31341552734375, -1.262786865234375, -1.212158203125, -1.161529541015625, -1.11090087890625, -1.060272216796875, -1.0096435546875, -0.959014892578125, -0.90838623046875, -0.857757568359375, -0.80712890625, -0.756500244140625, -0.70587158203125, -0.655242919921875, -0.6046142578125, -0.553985595703125, -0.50335693359375, -0.452728271484375, -0.402099609375, -0.351470947265625, -0.30084228515625, -0.250213623046875, -0.1995849609375, -0.148956298828125, -0.09832763671875, -0.047698974609375, 0.0029296875, 0.053558349609375, 0.10418701171875, 0.154815673828125, 0.2054443359375, 0.256072998046875, 0.30670166015625, 0.357330322265625, 0.407958984375, 0.458587646484375, 0.50921630859375, 0.559844970703125, 0.6104736328125, 0.661102294921875, 0.71173095703125, 0.762359619140625, 0.81298828125, 0.863616943359375, 0.91424560546875, 0.964874267578125, 1.0155029296875, 1.066131591796875, 1.11676025390625, 1.167388916015625, 1.218017578125, 1.268646240234375, 1.31927490234375, 1.369903564453125, 1.4205322265625, 1.471160888671875, 1.52178955078125, 1.572418212890625, 1.623046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 13.0, 10.0, 6.0, 10.0, 11.0, 12.0, 22.0, 23.0, 25.0, 39.0, 29.0, 34.0, 25.0, 43.0, 37.0, 48.0, 36.0, 42.0, 1077.0, 44.0, 46.0, 42.0, 32.0, 37.0, 36.0, 34.0, 25.0, 37.0, 24.0, 18.0, 26.0, 14.0, 14.0, 13.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.91015625, -3.79290771484375, -3.6756591796875, -3.55841064453125, -3.441162109375, -3.32391357421875, -3.2066650390625, -3.08941650390625, -2.97216796875, -2.85491943359375, -2.7376708984375, -2.62042236328125, -2.503173828125, -2.38592529296875, -2.2686767578125, -2.15142822265625, -2.0341796875, -1.91693115234375, -1.7996826171875, -1.68243408203125, -1.565185546875, -1.44793701171875, -1.3306884765625, -1.21343994140625, -1.09619140625, -0.97894287109375, -0.8616943359375, -0.74444580078125, -0.627197265625, -0.50994873046875, -0.3927001953125, -0.27545166015625, -0.158203125, -0.04095458984375, 0.0762939453125, 0.19354248046875, 0.310791015625, 0.42803955078125, 0.5452880859375, 0.66253662109375, 0.77978515625, 0.89703369140625, 1.0142822265625, 1.13153076171875, 1.248779296875, 1.36602783203125, 1.4832763671875, 1.60052490234375, 1.7177734375, 1.83502197265625, 1.9522705078125, 2.06951904296875, 2.186767578125, 2.30401611328125, 2.4212646484375, 2.53851318359375, 2.65576171875, 2.77301025390625, 2.8902587890625, 3.00750732421875, 3.124755859375, 3.24200439453125, 3.3592529296875, 3.47650146484375, 3.59375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 19.0, 33.0, 27.0, 46.0, 61.0, 78.0, 129.0, 175.0, 232.0, 348.0, 581.0, 829.0, 1367.0, 2152.0, 3856.0, 7001.0, 14496.0, 37812.0, 150275.0, 1307542.0, 441987.0, 80037.0, 24362.0, 10379.0, 5186.0, 3017.0, 1788.0, 1074.0, 706.0, 451.0, 313.0, 216.0, 168.0, 101.0, 84.0, 62.0, 33.0, 28.0, 18.0, 14.0, 13.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6171875, -1.56787109375, -1.5185546875, -1.46923828125, -1.419921875, -1.37060546875, -1.3212890625, -1.27197265625, -1.22265625, -1.17333984375, -1.1240234375, -1.07470703125, -1.025390625, -0.97607421875, -0.9267578125, -0.87744140625, -0.828125, -0.77880859375, -0.7294921875, -0.68017578125, -0.630859375, -0.58154296875, -0.5322265625, -0.48291015625, -0.43359375, -0.38427734375, -0.3349609375, -0.28564453125, -0.236328125, -0.18701171875, -0.1376953125, -0.08837890625, -0.0390625, 0.01025390625, 0.0595703125, 0.10888671875, 0.158203125, 0.20751953125, 0.2568359375, 0.30615234375, 0.35546875, 0.40478515625, 0.4541015625, 0.50341796875, 0.552734375, 0.60205078125, 0.6513671875, 0.70068359375, 0.75, 0.79931640625, 0.8486328125, 0.89794921875, 0.947265625, 0.99658203125, 1.0458984375, 1.09521484375, 1.14453125, 1.19384765625, 1.2431640625, 1.29248046875, 1.341796875, 1.39111328125, 1.4404296875, 1.48974609375, 1.5390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 14.0, 14.0, 27.0, 36.0, 38.0, 88.0, 106.0, 148.0, 154.0, 110.0, 69.0, 42.0, 30.0, 22.0, 18.0, 13.0, 8.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.34326171875, -0.3339996337890625, -0.324737548828125, -0.3154754638671875, -0.30621337890625, -0.2969512939453125, -0.287689208984375, -0.2784271240234375, -0.2691650390625, -0.2599029541015625, -0.250640869140625, -0.2413787841796875, -0.23211669921875, -0.2228546142578125, -0.213592529296875, -0.2043304443359375, -0.195068359375, -0.1858062744140625, -0.176544189453125, -0.1672821044921875, -0.15802001953125, -0.1487579345703125, -0.139495849609375, -0.1302337646484375, -0.1209716796875, -0.1117095947265625, -0.102447509765625, -0.0931854248046875, -0.08392333984375, -0.0746612548828125, -0.065399169921875, -0.0561370849609375, -0.046875, -0.0376129150390625, -0.028350830078125, -0.0190887451171875, -0.00982666015625, -0.0005645751953125, 0.008697509765625, 0.0179595947265625, 0.0272216796875, 0.0364837646484375, 0.045745849609375, 0.0550079345703125, 0.06427001953125, 0.0735321044921875, 0.082794189453125, 0.0920562744140625, 0.101318359375, 0.1105804443359375, 0.119842529296875, 0.1291046142578125, 0.13836669921875, 0.1476287841796875, 0.156890869140625, 0.1661529541015625, 0.1754150390625, 0.1846771240234375, 0.193939208984375, 0.2032012939453125, 0.21246337890625, 0.2217254638671875, 0.230987548828125, 0.2402496337890625, 0.24951171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 5.0, 8.0, 7.0, 15.0, 21.0, 28.0, 40.0, 70.0, 107.0, 181.0, 384.0, 5378.0, 1032181.0, 9069.0, 475.0, 215.0, 123.0, 81.0, 56.0, 21.0, 18.0, 12.0, 7.0, 7.0, 10.0, 2.0, 6.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.2740478515625, -5.067626953125, -4.8612060546875, -4.65478515625, -4.4483642578125, -4.241943359375, -4.0355224609375, -3.8291015625, -3.6226806640625, -3.416259765625, -3.2098388671875, -3.00341796875, -2.7969970703125, -2.590576171875, -2.3841552734375, -2.177734375, -1.9713134765625, -1.764892578125, -1.5584716796875, -1.35205078125, -1.1456298828125, -0.939208984375, -0.7327880859375, -0.5263671875, -0.3199462890625, -0.113525390625, 0.0928955078125, 0.29931640625, 0.5057373046875, 0.712158203125, 0.9185791015625, 1.125, 1.3314208984375, 1.537841796875, 1.7442626953125, 1.95068359375, 2.1571044921875, 2.363525390625, 2.5699462890625, 2.7763671875, 2.9827880859375, 3.189208984375, 3.3956298828125, 3.60205078125, 3.8084716796875, 4.014892578125, 4.2213134765625, 4.427734375, 4.6341552734375, 4.840576171875, 5.0469970703125, 5.25341796875, 5.4598388671875, 5.666259765625, 5.8726806640625, 6.0791015625, 6.2855224609375, 6.491943359375, 6.6983642578125, 6.90478515625, 7.1112060546875, 7.317626953125, 7.5240478515625, 7.73046875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 23.0, 80.0, 221.0, 367.0, 202.0, 85.0, 16.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1669464111328125, -1.1438159942626953, -1.1206856966018677, -1.0975552797317505, -1.0744249820709229, -1.0512945652008057, -1.028164267539978, -1.0050338506698608, -0.9819034934043884, -0.958773136138916, -0.9356427788734436, -0.9125124216079712, -0.889382004737854, -0.8662516474723816, -0.8431212902069092, -0.8199909329414368, -0.7968605756759644, -0.7737302184104919, -0.7505998611450195, -0.7274695038795471, -0.7043391466140747, -0.6812087297439575, -0.6580783724784851, -0.6349480152130127, -0.6118176579475403, -0.5886873006820679, -0.5655569434165955, -0.542426586151123, -0.5192961692810059, -0.49616584181785583, -0.47303545475006104, -0.4499050974845886, -0.4267747700214386, -0.4036444127559662, -0.3805140256881714, -0.357383668422699, -0.33425331115722656, -0.31112295389175415, -0.28799259662628174, -0.26486220955848694, -0.24173185229301453, -0.21860149502754211, -0.1954711228609085, -0.1723407506942749, -0.1492103934288025, -0.12608003616333008, -0.10294966399669647, -0.07981929183006287, -0.056688934564590454, -0.033558569848537445, -0.010428205132484436, 0.012702159583568573, 0.03583252429962158, 0.05896288901567459, 0.0820932537317276, 0.1052236258983612, 0.12835398316383362, 0.15148434042930603, 0.17461471259593964, 0.19774508476257324, 0.22087544202804565, 0.24400579929351807, 0.2671361565589905, 0.2902665436267853, 0.3133969008922577]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 3.0, 12.0, 14.0, 14.0, 12.0, 13.0, 12.0, 25.0, 20.0, 20.0, 28.0, 24.0, 35.0, 38.0, 22.0, 48.0, 35.0, 39.0, 39.0, 33.0, 41.0, 43.0, 34.0, 41.0, 41.0, 28.0, 28.0, 30.0, 33.0, 23.0, 20.0, 24.0, 26.0, 15.0, 12.0, 13.0, 11.0, 15.0, 4.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.19779318571090698, -0.1917155385017395, -0.18563790619373322, -0.17956025898456573, -0.17348262667655945, -0.16740497946739197, -0.1613273322582245, -0.155249685049057, -0.14917205274105072, -0.14309440553188324, -0.13701677322387695, -0.13093912601470947, -0.12486148625612259, -0.1187838464975357, -0.11270619928836823, -0.10662855952978134, -0.10055091977119446, -0.09447328001260757, -0.08839564025402069, -0.08231799304485321, -0.07624035328626633, -0.07016271352767944, -0.06408506631851196, -0.05800742655992508, -0.051929786801338196, -0.04585214704275131, -0.03977450355887413, -0.03369686007499695, -0.027619220316410065, -0.021541578695178032, -0.015463937073946, -0.009386293590068817, -0.0033086538314819336, 0.002768987789750099, 0.008846629410982132, 0.014924271032214165, 0.021001912653446198, 0.02707955427467823, 0.03315719589591026, 0.039234839379787445, 0.04531247913837433, 0.05139011889696121, 0.057467762380838394, 0.06354540586471558, 0.06962304562330246, 0.07570068538188934, 0.08177833259105682, 0.08785597234964371, 0.09393361210823059, 0.10001125186681747, 0.10608889162540436, 0.11216653883457184, 0.11824417859315872, 0.1243218183517456, 0.13039946556091309, 0.13647711277008057, 0.14255474507808685, 0.14863239228725433, 0.15471002459526062, 0.1607876718044281, 0.16686531901359558, 0.17294295132160187, 0.17902059853076935, 0.18509823083877563, 0.19117587804794312]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 6.0, 3.0, 10.0, 10.0, 5.0, 9.0, 16.0, 11.0, 18.0, 19.0, 28.0, 20.0, 24.0, 33.0, 26.0, 29.0, 36.0, 37.0, 35.0, 46.0, 43.0, 39.0, 37.0, 44.0, 36.0, 34.0, 44.0, 37.0, 23.0, 27.0, 38.0, 23.0, 20.0, 20.0, 9.0, 14.0, 17.0, 9.0, 18.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.5, -4.35015869140625, -4.2003173828125, -4.05047607421875, -3.900634765625, -3.75079345703125, -3.6009521484375, -3.45111083984375, -3.30126953125, -3.15142822265625, -3.0015869140625, -2.85174560546875, -2.701904296875, -2.55206298828125, -2.4022216796875, -2.25238037109375, -2.1025390625, -1.95269775390625, -1.8028564453125, -1.65301513671875, -1.503173828125, -1.35333251953125, -1.2034912109375, -1.05364990234375, -0.90380859375, -0.75396728515625, -0.6041259765625, -0.45428466796875, -0.304443359375, -0.15460205078125, -0.0047607421875, 0.14508056640625, 0.294921875, 0.44476318359375, 0.5946044921875, 0.74444580078125, 0.894287109375, 1.04412841796875, 1.1939697265625, 1.34381103515625, 1.49365234375, 1.64349365234375, 1.7933349609375, 1.94317626953125, 2.093017578125, 2.24285888671875, 2.3927001953125, 2.54254150390625, 2.6923828125, 2.84222412109375, 2.9920654296875, 3.14190673828125, 3.291748046875, 3.44158935546875, 3.5914306640625, 3.74127197265625, 3.89111328125, 4.04095458984375, 4.1907958984375, 4.34063720703125, 4.490478515625, 4.64031982421875, 4.7901611328125, 4.94000244140625, 5.08984375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 18.0, 16.0, 30.0, 34.0, 49.0, 72.0, 100.0, 161.0, 260.0, 385.0, 604.0, 935.0, 1522.0, 2626.0, 4546.0, 8095.0, 14452.0, 26300.0, 48773.0, 93519.0, 178970.0, 264026.0, 188215.0, 99286.0, 52481.0, 27765.0, 15093.0, 8384.0, 4716.0, 2722.0, 1534.0, 1004.0, 625.0, 414.0, 233.0, 172.0, 112.0, 88.0, 62.0, 34.0, 30.0, 23.0, 14.0, 11.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.9609375, -4.81304931640625, -4.6651611328125, -4.51727294921875, -4.369384765625, -4.22149658203125, -4.0736083984375, -3.92572021484375, -3.77783203125, -3.62994384765625, -3.4820556640625, -3.33416748046875, -3.186279296875, -3.03839111328125, -2.8905029296875, -2.74261474609375, -2.5947265625, -2.44683837890625, -2.2989501953125, -2.15106201171875, -2.003173828125, -1.85528564453125, -1.7073974609375, -1.55950927734375, -1.41162109375, -1.26373291015625, -1.1158447265625, -0.96795654296875, -0.820068359375, -0.67218017578125, -0.5242919921875, -0.37640380859375, -0.228515625, -0.08062744140625, 0.0672607421875, 0.21514892578125, 0.363037109375, 0.51092529296875, 0.6588134765625, 0.80670166015625, 0.95458984375, 1.10247802734375, 1.2503662109375, 1.39825439453125, 1.546142578125, 1.69403076171875, 1.8419189453125, 1.98980712890625, 2.1376953125, 2.28558349609375, 2.4334716796875, 2.58135986328125, 2.729248046875, 2.87713623046875, 3.0250244140625, 3.17291259765625, 3.32080078125, 3.46868896484375, 3.6165771484375, 3.76446533203125, 3.912353515625, 4.06024169921875, 4.2081298828125, 4.35601806640625, 4.50390625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 10.0, 11.0, 5.0, 14.0, 10.0, 10.0, 16.0, 16.0, 24.0, 25.0, 30.0, 32.0, 43.0, 41.0, 44.0, 75.0, 110.0, 140.0, 278.0, 1262.0, 200.0, 135.0, 88.0, 64.0, 57.0, 35.0, 36.0, 30.0, 29.0, 25.0, 24.0, 25.0, 16.0, 12.0, 10.0, 8.0, 7.0, 9.0, 5.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-11.109375, -10.78466796875, -10.4599609375, -10.13525390625, -9.810546875, -9.48583984375, -9.1611328125, -8.83642578125, -8.51171875, -8.18701171875, -7.8623046875, -7.53759765625, -7.212890625, -6.88818359375, -6.5634765625, -6.23876953125, -5.9140625, -5.58935546875, -5.2646484375, -4.93994140625, -4.615234375, -4.29052734375, -3.9658203125, -3.64111328125, -3.31640625, -2.99169921875, -2.6669921875, -2.34228515625, -2.017578125, -1.69287109375, -1.3681640625, -1.04345703125, -0.71875, -0.39404296875, -0.0693359375, 0.25537109375, 0.580078125, 0.90478515625, 1.2294921875, 1.55419921875, 1.87890625, 2.20361328125, 2.5283203125, 2.85302734375, 3.177734375, 3.50244140625, 3.8271484375, 4.15185546875, 4.4765625, 4.80126953125, 5.1259765625, 5.45068359375, 5.775390625, 6.10009765625, 6.4248046875, 6.74951171875, 7.07421875, 7.39892578125, 7.7236328125, 8.04833984375, 8.373046875, 8.69775390625, 9.0224609375, 9.34716796875, 9.671875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 8.0, 9.0, 8.0, 13.0, 16.0, 24.0, 30.0, 23.0, 47.0, 49.0, 68.0, 79.0, 136.0, 159.0, 237.0, 329.0, 483.0, 944.0, 3506.0, 1327980.0, 1804930.0, 3904.0, 970.0, 523.0, 323.0, 255.0, 154.0, 114.0, 90.0, 64.0, 54.0, 33.0, 34.0, 28.0, 24.0, 13.0, 18.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46875, -34.20263671875, -32.9365234375, -31.67041015625, -30.404296875, -29.13818359375, -27.8720703125, -26.60595703125, -25.33984375, -24.07373046875, -22.8076171875, -21.54150390625, -20.275390625, -19.00927734375, -17.7431640625, -16.47705078125, -15.2109375, -13.94482421875, -12.6787109375, -11.41259765625, -10.146484375, -8.88037109375, -7.6142578125, -6.34814453125, -5.08203125, -3.81591796875, -2.5498046875, -1.28369140625, -0.017578125, 1.24853515625, 2.5146484375, 3.78076171875, 5.046875, 6.31298828125, 7.5791015625, 8.84521484375, 10.111328125, 11.37744140625, 12.6435546875, 13.90966796875, 15.17578125, 16.44189453125, 17.7080078125, 18.97412109375, 20.240234375, 21.50634765625, 22.7724609375, 24.03857421875, 25.3046875, 26.57080078125, 27.8369140625, 29.10302734375, 30.369140625, 31.63525390625, 32.9013671875, 34.16748046875, 35.43359375, 36.69970703125, 37.9658203125, 39.23193359375, 40.498046875, 41.76416015625, 43.0302734375, 44.29638671875, 45.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 105.0, 482.0, 358.0, 61.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.85488891601562, -139.4613800048828, -135.06788635253906, -130.67437744140625, -126.28086853027344, -121.88736724853516, -117.49386596679688, -113.10035705566406, -108.70684814453125, -104.31334686279297, -99.91983795166016, -95.52633666992188, -91.13282775878906, -86.73932647705078, -82.3458251953125, -77.95231628417969, -73.5588150024414, -69.16531372070312, -64.77180480957031, -60.37830352783203, -55.98479461669922, -51.59129333496094, -47.19778823852539, -42.804283142089844, -38.4107780456543, -34.01727294921875, -29.623767852783203, -25.23026466369629, -20.836759567260742, -16.443254470825195, -12.049751281738281, -7.656246185302734, -3.2627410888671875, 1.1307635307312012, 5.52426815032959, 9.91777229309082, 14.311277389526367, 18.704782485961914, 23.098285675048828, 27.491790771484375, 31.885295867919922, 36.27880096435547, 40.672306060791016, 45.06581115722656, 49.459312438964844, 53.852821350097656, 58.24632263183594, 62.639827728271484, 67.03333282470703, 71.42683410644531, 75.82034301757812, 80.2138442993164, 84.60735321044922, 89.0008544921875, 93.39436340332031, 97.7878646850586, 102.18136596679688, 106.57486724853516, 110.96837615966797, 115.36187744140625, 119.75538635253906, 124.14888763427734, 128.54238891601562, 132.93589782714844, 137.32940673828125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 10.0, 13.0, 7.0, 19.0, 20.0, 21.0, 15.0, 24.0, 31.0, 23.0, 35.0, 33.0, 43.0, 51.0, 32.0, 41.0, 44.0, 45.0, 36.0, 23.0, 42.0, 39.0, 40.0, 41.0, 39.0, 28.0, 32.0, 26.0, 23.0, 24.0, 9.0, 23.0, 11.0, 9.0, 11.0, 7.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.688982009887695, -29.621551513671875, -28.554119110107422, -27.4866886138916, -26.41925811767578, -25.351825714111328, -24.284395217895508, -23.216964721679688, -22.149532318115234, -21.082101821899414, -20.01466941833496, -18.94723892211914, -17.879806518554688, -16.812376022338867, -15.744945526123047, -14.67751407623291, -13.610082626342773, -12.542651176452637, -11.4752197265625, -10.40778923034668, -9.340357780456543, -8.272926330566406, -7.205495357513428, -6.138064384460449, -5.0706329345703125, -4.003201484680176, -2.9357705116271973, -1.8683393001556396, -0.800908088684082, 0.2665233612060547, 1.3339543342590332, 2.4013853073120117, 3.4688186645507812, 4.536250114440918, 5.6036810874938965, 6.671112060546875, 7.738543510437012, 8.805974960327148, 9.873405456542969, 10.940836906433105, 12.008268356323242, 13.075699806213379, 14.143131256103516, 15.210561752319336, 16.277992248535156, 17.34542465209961, 18.41285514831543, 19.48028564453125, 20.547718048095703, 21.615148544311523, 22.682580947875977, 23.750011444091797, 24.81744384765625, 25.88487434387207, 26.95230484008789, 28.019737243652344, 29.087167739868164, 30.154598236083984, 31.222030639648438, 32.28946304321289, 33.35689163208008, 34.42432403564453, 35.491756439208984, 36.55918502807617, 37.626617431640625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 8.0, 9.0, 5.0, 8.0, 10.0, 11.0, 17.0, 26.0, 22.0, 20.0, 21.0, 26.0, 26.0, 27.0, 36.0, 44.0, 37.0, 32.0, 49.0, 46.0, 30.0, 39.0, 32.0, 42.0, 30.0, 32.0, 37.0, 37.0, 31.0, 29.0, 26.0, 18.0, 21.0, 18.0, 10.0, 12.0, 18.0, 12.0, 6.0, 6.0, 6.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.31768798828125, -4.1705322265625, -4.02337646484375, -3.876220703125, -3.72906494140625, -3.5819091796875, -3.43475341796875, -3.28759765625, -3.14044189453125, -2.9932861328125, -2.84613037109375, -2.698974609375, -2.55181884765625, -2.4046630859375, -2.25750732421875, -2.1103515625, -1.96319580078125, -1.8160400390625, -1.66888427734375, -1.521728515625, -1.37457275390625, -1.2274169921875, -1.08026123046875, -0.93310546875, -0.78594970703125, -0.6387939453125, -0.49163818359375, -0.344482421875, -0.19732666015625, -0.0501708984375, 0.09698486328125, 0.244140625, 0.39129638671875, 0.5384521484375, 0.68560791015625, 0.832763671875, 0.97991943359375, 1.1270751953125, 1.27423095703125, 1.42138671875, 1.56854248046875, 1.7156982421875, 1.86285400390625, 2.010009765625, 2.15716552734375, 2.3043212890625, 2.45147705078125, 2.5986328125, 2.74578857421875, 2.8929443359375, 3.04010009765625, 3.187255859375, 3.33441162109375, 3.4815673828125, 3.62872314453125, 3.77587890625, 3.92303466796875, 4.0701904296875, 4.21734619140625, 4.364501953125, 4.51165771484375, 4.6588134765625, 4.80596923828125, 4.953125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 7.0, 7.0, 8.0, 7.0, 9.0, 19.0, 17.0, 21.0, 27.0, 28.0, 64.0, 87.0, 125.0, 190.0, 366.0, 695.0, 1419.0, 3124.0, 8031.0, 29471.0, 208519.0, 1589012.0, 2006253.0, 292801.0, 37123.0, 9748.0, 3620.0, 1621.0, 780.0, 401.0, 217.0, 123.0, 71.0, 46.0, 39.0, 31.0, 23.0, 30.0, 20.0, 14.0, 11.0, 9.0, 8.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0], "bins": [-10.421875, -10.1068115234375, -9.791748046875, -9.4766845703125, -9.16162109375, -8.8465576171875, -8.531494140625, -8.2164306640625, -7.9013671875, -7.5863037109375, -7.271240234375, -6.9561767578125, -6.64111328125, -6.3260498046875, -6.010986328125, -5.6959228515625, -5.380859375, -5.0657958984375, -4.750732421875, -4.4356689453125, -4.12060546875, -3.8055419921875, -3.490478515625, -3.1754150390625, -2.8603515625, -2.5452880859375, -2.230224609375, -1.9151611328125, -1.60009765625, -1.2850341796875, -0.969970703125, -0.6549072265625, -0.33984375, -0.0247802734375, 0.290283203125, 0.6053466796875, 0.92041015625, 1.2354736328125, 1.550537109375, 1.8656005859375, 2.1806640625, 2.4957275390625, 2.810791015625, 3.1258544921875, 3.44091796875, 3.7559814453125, 4.071044921875, 4.3861083984375, 4.701171875, 5.0162353515625, 5.331298828125, 5.6463623046875, 5.96142578125, 6.2764892578125, 6.591552734375, 6.9066162109375, 7.2216796875, 7.5367431640625, 7.851806640625, 8.1668701171875, 8.48193359375, 8.7969970703125, 9.112060546875, 9.4271240234375, 9.7421875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 15.0, 16.0, 24.0, 28.0, 28.0, 44.0, 61.0, 68.0, 86.0, 118.0, 144.0, 197.0, 265.0, 350.0, 460.0, 461.0, 391.0, 282.0, 234.0, 201.0, 122.0, 96.0, 75.0, 66.0, 56.0, 36.0, 28.0, 27.0, 16.0, 16.0, 7.0, 9.0, 7.0, 2.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0, -7.77874755859375, -7.5574951171875, -7.33624267578125, -7.114990234375, -6.89373779296875, -6.6724853515625, -6.45123291015625, -6.22998046875, -6.00872802734375, -5.7874755859375, -5.56622314453125, -5.344970703125, -5.12371826171875, -4.9024658203125, -4.68121337890625, -4.4599609375, -4.23870849609375, -4.0174560546875, -3.79620361328125, -3.574951171875, -3.35369873046875, -3.1324462890625, -2.91119384765625, -2.68994140625, -2.46868896484375, -2.2474365234375, -2.02618408203125, -1.804931640625, -1.58367919921875, -1.3624267578125, -1.14117431640625, -0.919921875, -0.69866943359375, -0.4774169921875, -0.25616455078125, -0.034912109375, 0.18634033203125, 0.4075927734375, 0.62884521484375, 0.85009765625, 1.07135009765625, 1.2926025390625, 1.51385498046875, 1.735107421875, 1.95635986328125, 2.1776123046875, 2.39886474609375, 2.6201171875, 2.84136962890625, 3.0626220703125, 3.28387451171875, 3.505126953125, 3.72637939453125, 3.9476318359375, 4.16888427734375, 4.39013671875, 4.61138916015625, 4.8326416015625, 5.05389404296875, 5.275146484375, 5.49639892578125, 5.7176513671875, 5.93890380859375, 6.16015625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 6.0, 8.0, 9.0, 16.0, 34.0, 38.0, 40.0, 75.0, 133.0, 224.0, 498.0, 1460.0, 6517.0, 68381.0, 2766180.0, 1306341.0, 37535.0, 4530.0, 1220.0, 436.0, 215.0, 125.0, 77.0, 55.0, 26.0, 26.0, 17.0, 11.0, 12.0, 8.0, 6.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5625, -21.916015625, -21.26953125, -20.623046875, -19.9765625, -19.330078125, -18.68359375, -18.037109375, -17.390625, -16.744140625, -16.09765625, -15.451171875, -14.8046875, -14.158203125, -13.51171875, -12.865234375, -12.21875, -11.572265625, -10.92578125, -10.279296875, -9.6328125, -8.986328125, -8.33984375, -7.693359375, -7.046875, -6.400390625, -5.75390625, -5.107421875, -4.4609375, -3.814453125, -3.16796875, -2.521484375, -1.875, -1.228515625, -0.58203125, 0.064453125, 0.7109375, 1.357421875, 2.00390625, 2.650390625, 3.296875, 3.943359375, 4.58984375, 5.236328125, 5.8828125, 6.529296875, 7.17578125, 7.822265625, 8.46875, 9.115234375, 9.76171875, 10.408203125, 11.0546875, 11.701171875, 12.34765625, 12.994140625, 13.640625, 14.287109375, 14.93359375, 15.580078125, 16.2265625, 16.873046875, 17.51953125, 18.166015625, 18.8125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 864.0, 148.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-634.5588989257812, -619.3680419921875, -604.1771850585938, -588.986328125, -573.7955322265625, -558.6046752929688, -543.413818359375, -528.2229614257812, -513.0321044921875, -497.84124755859375, -482.6504211425781, -467.4595642089844, -452.2687072753906, -437.077880859375, -421.88702392578125, -406.6961669921875, -391.5053405761719, -376.3144836425781, -361.1236572265625, -345.93280029296875, -330.741943359375, -315.55108642578125, -300.3602600097656, -285.1694030761719, -269.97857666015625, -254.78773498535156, -239.5968780517578, -224.40603637695312, -209.21517944335938, -194.0243377685547, -178.83349609375, -163.64263916015625, -148.45181274414062, -133.26097106933594, -118.07011413574219, -102.8792724609375, -87.68842315673828, -72.49757385253906, -57.306732177734375, -42.115882873535156, -26.925033569335938, -11.734186172485352, 3.4566612243652344, 18.647506713867188, 33.838356018066406, 49.029205322265625, 64.22004699707031, 79.41089630126953, 94.60174560546875, 109.79259490966797, 124.98344421386719, 140.17428588867188, 155.36514282226562, 170.5559844970703, 185.746826171875, 200.93768310546875, 216.12852478027344, 231.31936645507812, 246.51022338867188, 261.7010498046875, 276.89190673828125, 292.082763671875, 307.27362060546875, 322.4644470214844, 337.6553039550781]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 8.0, 15.0, 17.0, 12.0, 22.0, 17.0, 31.0, 22.0, 37.0, 43.0, 49.0, 36.0, 40.0, 55.0, 53.0, 54.0, 39.0, 47.0, 48.0, 50.0, 36.0, 36.0, 32.0, 33.0, 31.0, 18.0, 24.0, 18.0, 17.0, 13.0, 8.0, 7.0, 9.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.37283706665039, -25.29002571105957, -24.20721435546875, -23.124401092529297, -22.041589736938477, -20.958778381347656, -19.875965118408203, -18.793153762817383, -17.710342407226562, -16.627531051635742, -15.544718742370605, -14.461906433105469, -13.379095077514648, -12.296283721923828, -11.213471412658691, -10.130659103393555, -9.047847747802734, -7.965035915374756, -6.882224082946777, -5.799412250518799, -4.71660041809082, -3.633788585662842, -2.5509767532348633, -1.4681649208068848, -0.38535308837890625, 0.6974587440490723, 1.7802705764770508, 2.8630824089050293, 3.945894241333008, 5.028706073760986, 6.111517906188965, 7.194329738616943, 8.277137756347656, 9.359949111938477, 10.442761421203613, 11.52557373046875, 12.60838508605957, 13.69119644165039, 14.774008750915527, 15.856821060180664, 16.939632415771484, 18.022443771362305, 19.105255126953125, 20.188068389892578, 21.2708797454834, 22.35369110107422, 23.436504364013672, 24.519315719604492, 25.602127075195312, 26.684938430786133, 27.767749786376953, 28.850563049316406, 29.933374404907227, 31.016185760498047, 32.0989990234375, 33.18180847167969, 34.26462173461914, 35.347434997558594, 36.43024444580078, 37.513057708740234, 38.59587097167969, 39.678680419921875, 40.76149368286133, 41.844303131103516, 42.92711639404297]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 7.0, 2.0, 8.0, 10.0, 12.0, 16.0, 21.0, 22.0, 34.0, 22.0, 30.0, 30.0, 42.0, 35.0, 40.0, 42.0, 46.0, 43.0, 40.0, 41.0, 42.0, 45.0, 29.0, 32.0, 41.0, 44.0, 29.0, 33.0, 19.0, 15.0, 25.0, 16.0, 11.0, 17.0, 7.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 6.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.57421875, -4.43798828125, -4.3017578125, -4.16552734375, -4.029296875, -3.89306640625, -3.7568359375, -3.62060546875, -3.484375, -3.34814453125, -3.2119140625, -3.07568359375, -2.939453125, -2.80322265625, -2.6669921875, -2.53076171875, -2.39453125, -2.25830078125, -2.1220703125, -1.98583984375, -1.849609375, -1.71337890625, -1.5771484375, -1.44091796875, -1.3046875, -1.16845703125, -1.0322265625, -0.89599609375, -0.759765625, -0.62353515625, -0.4873046875, -0.35107421875, -0.21484375, -0.07861328125, 0.0576171875, 0.19384765625, 0.330078125, 0.46630859375, 0.6025390625, 0.73876953125, 0.875, 1.01123046875, 1.1474609375, 1.28369140625, 1.419921875, 1.55615234375, 1.6923828125, 1.82861328125, 1.96484375, 2.10107421875, 2.2373046875, 2.37353515625, 2.509765625, 2.64599609375, 2.7822265625, 2.91845703125, 3.0546875, 3.19091796875, 3.3271484375, 3.46337890625, 3.599609375, 3.73583984375, 3.8720703125, 4.00830078125, 4.14453125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 7.0, 7.0, 13.0, 20.0, 33.0, 43.0, 76.0, 93.0, 144.0, 255.0, 330.0, 502.0, 776.0, 1139.0, 1872.0, 3062.0, 4953.0, 8911.0, 15221.0, 27697.0, 51881.0, 97292.0, 171753.0, 234053.0, 187743.0, 109376.0, 58773.0, 31183.0, 16927.0, 9422.0, 5617.0, 3527.0, 2038.0, 1274.0, 869.0, 551.0, 368.0, 228.0, 176.0, 118.0, 81.0, 50.0, 35.0, 20.0, 14.0, 10.0, 10.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.66796875, -0.6480865478515625, -0.628204345703125, -0.6083221435546875, -0.58843994140625, -0.5685577392578125, -0.548675537109375, -0.5287933349609375, -0.5089111328125, -0.4890289306640625, -0.469146728515625, -0.4492645263671875, -0.42938232421875, -0.4095001220703125, -0.389617919921875, -0.3697357177734375, -0.349853515625, -0.3299713134765625, -0.310089111328125, -0.2902069091796875, -0.27032470703125, -0.2504425048828125, -0.230560302734375, -0.2106781005859375, -0.1907958984375, -0.1709136962890625, -0.151031494140625, -0.1311492919921875, -0.11126708984375, -0.0913848876953125, -0.071502685546875, -0.0516204833984375, -0.03173828125, -0.0118560791015625, 0.008026123046875, 0.0279083251953125, 0.04779052734375, 0.0676727294921875, 0.087554931640625, 0.1074371337890625, 0.1273193359375, 0.1472015380859375, 0.167083740234375, 0.1869659423828125, 0.20684814453125, 0.2267303466796875, 0.246612548828125, 0.2664947509765625, 0.286376953125, 0.3062591552734375, 0.326141357421875, 0.3460235595703125, 0.36590576171875, 0.3857879638671875, 0.405670166015625, 0.4255523681640625, 0.4454345703125, 0.4653167724609375, 0.485198974609375, 0.5050811767578125, 0.52496337890625, 0.5448455810546875, 0.564727783203125, 0.5846099853515625, 0.6044921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 10.0, 13.0, 10.0, 22.0, 20.0, 27.0, 25.0, 27.0, 28.0, 20.0, 32.0, 36.0, 36.0, 26.0, 60.0, 49.0, 1065.0, 43.0, 35.0, 46.0, 44.0, 28.0, 38.0, 31.0, 28.0, 27.0, 26.0, 16.0, 20.0, 16.0, 17.0, 10.0, 10.0, 8.0, 12.0, 10.0, 5.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4609375, -2.37091064453125, -2.2808837890625, -2.19085693359375, -2.100830078125, -2.01080322265625, -1.9207763671875, -1.83074951171875, -1.74072265625, -1.65069580078125, -1.5606689453125, -1.47064208984375, -1.380615234375, -1.29058837890625, -1.2005615234375, -1.11053466796875, -1.0205078125, -0.93048095703125, -0.8404541015625, -0.75042724609375, -0.660400390625, -0.57037353515625, -0.4803466796875, -0.39031982421875, -0.30029296875, -0.21026611328125, -0.1202392578125, -0.03021240234375, 0.059814453125, 0.14984130859375, 0.2398681640625, 0.32989501953125, 0.419921875, 0.50994873046875, 0.5999755859375, 0.69000244140625, 0.780029296875, 0.87005615234375, 0.9600830078125, 1.05010986328125, 1.14013671875, 1.23016357421875, 1.3201904296875, 1.41021728515625, 1.500244140625, 1.59027099609375, 1.6802978515625, 1.77032470703125, 1.8603515625, 1.95037841796875, 2.0404052734375, 2.13043212890625, 2.220458984375, 2.31048583984375, 2.4005126953125, 2.49053955078125, 2.58056640625, 2.67059326171875, 2.7606201171875, 2.85064697265625, 2.940673828125, 3.03070068359375, 3.1207275390625, 3.21075439453125, 3.30078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 10.0, 12.0, 17.0, 26.0, 46.0, 65.0, 83.0, 149.0, 195.0, 320.0, 469.0, 765.0, 1244.0, 2369.0, 4632.0, 9680.0, 22737.0, 59279.0, 165845.0, 923274.0, 662998.0, 149610.0, 53582.0, 20924.0, 8943.0, 4326.0, 2226.0, 1216.0, 769.0, 432.0, 273.0, 198.0, 124.0, 68.0, 58.0, 46.0, 35.0, 30.0, 12.0, 18.0, 10.0, 5.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62890625, -0.609222412109375, -0.58953857421875, -0.569854736328125, -0.5501708984375, -0.530487060546875, -0.51080322265625, -0.491119384765625, -0.471435546875, -0.451751708984375, -0.43206787109375, -0.412384033203125, -0.3927001953125, -0.373016357421875, -0.35333251953125, -0.333648681640625, -0.31396484375, -0.294281005859375, -0.27459716796875, -0.254913330078125, -0.2352294921875, -0.215545654296875, -0.19586181640625, -0.176177978515625, -0.156494140625, -0.136810302734375, -0.11712646484375, -0.097442626953125, -0.0777587890625, -0.058074951171875, -0.03839111328125, -0.018707275390625, 0.0009765625, 0.020660400390625, 0.04034423828125, 0.060028076171875, 0.0797119140625, 0.099395751953125, 0.11907958984375, 0.138763427734375, 0.158447265625, 0.178131103515625, 0.19781494140625, 0.217498779296875, 0.2371826171875, 0.256866455078125, 0.27655029296875, 0.296234130859375, 0.31591796875, 0.335601806640625, 0.35528564453125, 0.374969482421875, 0.3946533203125, 0.414337158203125, 0.43402099609375, 0.453704833984375, 0.473388671875, 0.493072509765625, 0.51275634765625, 0.532440185546875, 0.5521240234375, 0.571807861328125, 0.59149169921875, 0.611175537109375, 0.630859375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 18.0, 23.0, 28.0, 41.0, 59.0, 81.0, 113.0, 138.0, 143.0, 99.0, 52.0, 56.0, 35.0, 18.0, 23.0, 14.0, 10.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.13953876495361328, -0.13564491271972656, -0.13175106048583984, -0.12785720825195312, -0.1239633560180664, -0.12006950378417969, -0.11617565155029297, -0.11228179931640625, -0.10838794708251953, -0.10449409484863281, -0.1006002426147461, -0.09670639038085938, -0.09281253814697266, -0.08891868591308594, -0.08502483367919922, -0.0811309814453125, -0.07723712921142578, -0.07334327697753906, -0.06944942474365234, -0.06555557250976562, -0.061661720275878906, -0.05776786804199219, -0.05387401580810547, -0.04998016357421875, -0.04608631134033203, -0.04219245910644531, -0.038298606872558594, -0.034404754638671875, -0.030510902404785156, -0.026617050170898438, -0.02272319793701172, -0.018829345703125, -0.014935493469238281, -0.011041641235351562, -0.007147789001464844, -0.003253936767578125, 0.0006399154663085938, 0.0045337677001953125, 0.008427619934082031, 0.01232147216796875, 0.01621532440185547, 0.020109176635742188, 0.024003028869628906, 0.027896881103515625, 0.031790733337402344, 0.03568458557128906, 0.03957843780517578, 0.0434722900390625, 0.04736614227294922, 0.05125999450683594, 0.055153846740722656, 0.059047698974609375, 0.0629415512084961, 0.06683540344238281, 0.07072925567626953, 0.07462310791015625, 0.07851696014404297, 0.08241081237792969, 0.0863046646118164, 0.09019851684570312, 0.09409236907958984, 0.09798622131347656, 0.10188007354736328, 0.10577392578125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 20.0, 14.0, 33.0, 46.0, 60.0, 71.0, 139.0, 212.0, 487.0, 2305.0, 1041239.0, 2620.0, 576.0, 225.0, 152.0, 96.0, 63.0, 38.0, 32.0, 27.0, 19.0, 10.0, 10.0, 5.0, 9.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.924652099609375, -1.84930419921875, -1.773956298828125, -1.6986083984375, -1.623260498046875, -1.54791259765625, -1.472564697265625, -1.397216796875, -1.321868896484375, -1.24652099609375, -1.171173095703125, -1.0958251953125, -1.020477294921875, -0.94512939453125, -0.869781494140625, -0.79443359375, -0.719085693359375, -0.64373779296875, -0.568389892578125, -0.4930419921875, -0.417694091796875, -0.34234619140625, -0.266998291015625, -0.191650390625, -0.116302490234375, -0.04095458984375, 0.034393310546875, 0.1097412109375, 0.185089111328125, 0.26043701171875, 0.335784912109375, 0.4111328125, 0.486480712890625, 0.56182861328125, 0.637176513671875, 0.7125244140625, 0.787872314453125, 0.86322021484375, 0.938568115234375, 1.013916015625, 1.089263916015625, 1.16461181640625, 1.239959716796875, 1.3153076171875, 1.390655517578125, 1.46600341796875, 1.541351318359375, 1.61669921875, 1.692047119140625, 1.76739501953125, 1.842742919921875, 1.9180908203125, 1.993438720703125, 2.06878662109375, 2.144134521484375, 2.219482421875, 2.294830322265625, 2.37017822265625, 2.445526123046875, 2.5208740234375, 2.596221923828125, 2.67156982421875, 2.746917724609375, 2.822265625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 20.0, 480.0, 490.0, 19.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30912306904792786, -0.29194191098213196, -0.27476075291633606, -0.2575795650482178, -0.24039840698242188, -0.22321724891662598, -0.20603609085083008, -0.18885493278503418, -0.1716737598180771, -0.1544926017522812, -0.1373114287853241, -0.1201302707195282, -0.1029491052031517, -0.08576793968677521, -0.06858678162097931, -0.051405616104602814, -0.03422445058822632, -0.017043286934494972, 0.0001378767192363739, 0.01731903851032257, 0.034500204026699066, 0.05168136954307556, 0.06886252760887146, 0.08604369312524796, 0.10322485864162445, 0.12040602415800095, 0.13758718967437744, 0.15476834774017334, 0.17194950580596924, 0.18913067877292633, 0.20631183683872223, 0.22349300980567932, 0.2406741976737976, 0.2578553557395935, 0.2750365138053894, 0.2922176718711853, 0.3093988597393036, 0.3265800178050995, 0.3437611758708954, 0.3609423339366913, 0.37812352180480957, 0.39530467987060547, 0.41248583793640137, 0.42966699600219727, 0.44684818387031555, 0.46402934193611145, 0.48121050000190735, 0.49839165806770325, 0.5155727863311768, 0.5327539443969727, 0.5499351024627686, 0.5671162605285645, 0.5842974185943604, 0.6014785766601562, 0.6186597347259521, 0.6358409523963928, 0.6530221104621887, 0.6702032685279846, 0.6873844265937805, 0.7045655846595764, 0.7217467427253723, 0.738927960395813, 0.7561091184616089, 0.7732902765274048, 0.7904714345932007]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 17.0, 15.0, 8.0, 11.0, 17.0, 26.0, 27.0, 31.0, 28.0, 22.0, 23.0, 39.0, 43.0, 40.0, 37.0, 37.0, 43.0, 41.0, 38.0, 36.0, 53.0, 45.0, 27.0, 29.0, 30.0, 28.0, 29.0, 24.0, 24.0, 16.0, 18.0, 14.0, 13.0, 8.0, 10.0, 8.0, 7.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0856671929359436, -0.08294132351875305, -0.0802154541015625, -0.07748958468437195, -0.0747637152671814, -0.07203785330057144, -0.06931198388338089, -0.06658611446619034, -0.06386024504899979, -0.061134375631809235, -0.05840850621461868, -0.05568264052271843, -0.05295677110552788, -0.050230901688337326, -0.04750503599643707, -0.04477916657924652, -0.04205329716205597, -0.03932742774486542, -0.036601558327674866, -0.03387569263577461, -0.03114982321858406, -0.02842395380139351, -0.025698086246848106, -0.022972218692302704, -0.020246349275112152, -0.0175204798579216, -0.014794612303376198, -0.01206874381750822, -0.009342875331640244, -0.006617006845772266, -0.0038911383599042892, -0.0011652708053588867, 0.001560598611831665, 0.004286467097699642, 0.007012335583567619, 0.009738204069435596, 0.012464072555303574, 0.01518994104117155, 0.017915809527039528, 0.02064167708158493, 0.023367546498775482, 0.026093415915966034, 0.028819283470511436, 0.03154515102505684, 0.03427102044224739, 0.03699688985943794, 0.039722755551338196, 0.04244862496852875, 0.0451744943857193, 0.04790036380290985, 0.0506262332201004, 0.053352098912000656, 0.05607796832919121, 0.05880383774638176, 0.06152970343828201, 0.06425557285547256, 0.06698144227266312, 0.06970731168985367, 0.07243318110704422, 0.07515905052423477, 0.07788491249084473, 0.08061078190803528, 0.08333665132522583, 0.08606252074241638, 0.08878839015960693]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 2.0, 9.0, 9.0, 4.0, 8.0, 16.0, 12.0, 20.0, 32.0, 27.0, 20.0, 16.0, 25.0, 43.0, 50.0, 59.0, 56.0, 44.0, 44.0, 47.0, 42.0, 42.0, 38.0, 36.0, 35.0, 42.0, 24.0, 29.0, 31.0, 19.0, 21.0, 20.0, 18.0, 9.0, 5.0, 10.0, 5.0, 6.0, 7.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-5.359375, -5.2156982421875, -5.072021484375, -4.9283447265625, -4.78466796875, -4.6409912109375, -4.497314453125, -4.3536376953125, -4.2099609375, -4.0662841796875, -3.922607421875, -3.7789306640625, -3.63525390625, -3.4915771484375, -3.347900390625, -3.2042236328125, -3.060546875, -2.9168701171875, -2.773193359375, -2.6295166015625, -2.48583984375, -2.3421630859375, -2.198486328125, -2.0548095703125, -1.9111328125, -1.7674560546875, -1.623779296875, -1.4801025390625, -1.33642578125, -1.1927490234375, -1.049072265625, -0.9053955078125, -0.76171875, -0.6180419921875, -0.474365234375, -0.3306884765625, -0.18701171875, -0.0433349609375, 0.100341796875, 0.2440185546875, 0.3876953125, 0.5313720703125, 0.675048828125, 0.8187255859375, 0.96240234375, 1.1060791015625, 1.249755859375, 1.3934326171875, 1.537109375, 1.6807861328125, 1.824462890625, 1.9681396484375, 2.11181640625, 2.2554931640625, 2.399169921875, 2.5428466796875, 2.6865234375, 2.8302001953125, 2.973876953125, 3.1175537109375, 3.26123046875, 3.4049072265625, 3.548583984375, 3.6922607421875, 3.8359375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 13.0, 9.0, 12.0, 29.0, 51.0, 56.0, 99.0, 104.0, 171.0, 298.0, 388.0, 607.0, 927.0, 1603.0, 2801.0, 5012.0, 10529.0, 27296.0, 88482.0, 346261.0, 404621.0, 102564.0, 31667.0, 11908.0, 5466.0, 2903.0, 1717.0, 1083.0, 623.0, 396.0, 273.0, 188.0, 133.0, 80.0, 47.0, 46.0, 26.0, 13.0, 18.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.28765869140625, -6.0635986328125, -5.83953857421875, -5.615478515625, -5.39141845703125, -5.1673583984375, -4.94329833984375, -4.71923828125, -4.49517822265625, -4.2711181640625, -4.04705810546875, -3.822998046875, -3.59893798828125, -3.3748779296875, -3.15081787109375, -2.9267578125, -2.70269775390625, -2.4786376953125, -2.25457763671875, -2.030517578125, -1.80645751953125, -1.5823974609375, -1.35833740234375, -1.13427734375, -0.91021728515625, -0.6861572265625, -0.46209716796875, -0.238037109375, -0.01397705078125, 0.2100830078125, 0.43414306640625, 0.658203125, 0.88226318359375, 1.1063232421875, 1.33038330078125, 1.554443359375, 1.77850341796875, 2.0025634765625, 2.22662353515625, 2.45068359375, 2.67474365234375, 2.8988037109375, 3.12286376953125, 3.346923828125, 3.57098388671875, 3.7950439453125, 4.01910400390625, 4.2431640625, 4.46722412109375, 4.6912841796875, 4.91534423828125, 5.139404296875, 5.36346435546875, 5.5875244140625, 5.81158447265625, 6.03564453125, 6.25970458984375, 6.4837646484375, 6.70782470703125, 6.931884765625, 7.15594482421875, 7.3800048828125, 7.60406494140625, 7.828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 8.0, 7.0, 7.0, 14.0, 8.0, 14.0, 17.0, 15.0, 17.0, 28.0, 34.0, 35.0, 41.0, 57.0, 73.0, 92.0, 134.0, 255.0, 1374.0, 216.0, 146.0, 79.0, 53.0, 38.0, 32.0, 42.0, 35.0, 23.0, 17.0, 26.0, 9.0, 11.0, 9.0, 8.0, 11.0, 13.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-9.578125, -9.291259765625, -9.00439453125, -8.717529296875, -8.4306640625, -8.143798828125, -7.85693359375, -7.570068359375, -7.283203125, -6.996337890625, -6.70947265625, -6.422607421875, -6.1357421875, -5.848876953125, -5.56201171875, -5.275146484375, -4.98828125, -4.701416015625, -4.41455078125, -4.127685546875, -3.8408203125, -3.553955078125, -3.26708984375, -2.980224609375, -2.693359375, -2.406494140625, -2.11962890625, -1.832763671875, -1.5458984375, -1.259033203125, -0.97216796875, -0.685302734375, -0.3984375, -0.111572265625, 0.17529296875, 0.462158203125, 0.7490234375, 1.035888671875, 1.32275390625, 1.609619140625, 1.896484375, 2.183349609375, 2.47021484375, 2.757080078125, 3.0439453125, 3.330810546875, 3.61767578125, 3.904541015625, 4.19140625, 4.478271484375, 4.76513671875, 5.052001953125, 5.3388671875, 5.625732421875, 5.91259765625, 6.199462890625, 6.486328125, 6.773193359375, 7.06005859375, 7.346923828125, 7.6337890625, 7.920654296875, 8.20751953125, 8.494384765625, 8.78125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 15.0, 14.0, 18.0, 35.0, 32.0, 41.0, 74.0, 101.0, 138.0, 215.0, 373.0, 591.0, 1323.0, 17789.0, 3112071.0, 10034.0, 1252.0, 550.0, 321.0, 196.0, 158.0, 101.0, 59.0, 49.0, 39.0, 18.0, 16.0, 18.0, 17.0, 9.0, 7.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.84375, -35.63330078125, -34.4228515625, -33.21240234375, -32.001953125, -30.79150390625, -29.5810546875, -28.37060546875, -27.16015625, -25.94970703125, -24.7392578125, -23.52880859375, -22.318359375, -21.10791015625, -19.8974609375, -18.68701171875, -17.4765625, -16.26611328125, -15.0556640625, -13.84521484375, -12.634765625, -11.42431640625, -10.2138671875, -9.00341796875, -7.79296875, -6.58251953125, -5.3720703125, -4.16162109375, -2.951171875, -1.74072265625, -0.5302734375, 0.68017578125, 1.890625, 3.10107421875, 4.3115234375, 5.52197265625, 6.732421875, 7.94287109375, 9.1533203125, 10.36376953125, 11.57421875, 12.78466796875, 13.9951171875, 15.20556640625, 16.416015625, 17.62646484375, 18.8369140625, 20.04736328125, 21.2578125, 22.46826171875, 23.6787109375, 24.88916015625, 26.099609375, 27.31005859375, 28.5205078125, 29.73095703125, 30.94140625, 32.15185546875, 33.3623046875, 34.57275390625, 35.783203125, 36.99365234375, 38.2041015625, 39.41455078125, 40.625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 12.0, 58.0, 136.0, 257.0, 289.0, 171.0, 63.0, 15.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.46492004394531, -65.42806243896484, -63.39120864868164, -61.35435485839844, -59.31749725341797, -57.280643463134766, -55.24378967285156, -53.206932067871094, -51.17007827758789, -49.13322448730469, -47.09636688232422, -45.059513092041016, -43.02265930175781, -40.985801696777344, -38.94894790649414, -36.91209411621094, -34.87523651123047, -32.838382720947266, -30.801525115966797, -28.764671325683594, -26.727815628051758, -24.690959930419922, -22.65410614013672, -20.617250442504883, -18.580394744873047, -16.54353904724121, -14.506684303283691, -12.469829559326172, -10.432973861694336, -8.3961181640625, -6.3592634201049805, -4.322408676147461, -2.2855453491210938, -0.24869012832641602, 1.7881650924682617, 3.8250203132629395, 5.861875534057617, 7.898731231689453, 9.935585975646973, 11.972440719604492, 14.009296417236328, 16.046152114868164, 18.0830078125, 20.119861602783203, 22.15671730041504, 24.193572998046875, 26.230426788330078, 28.267282485961914, 30.30413818359375, 32.34099197387695, 34.37784957885742, 36.414703369140625, 38.451560974121094, 40.4884147644043, 42.5252685546875, 44.56212615966797, 46.59897994995117, 48.635833740234375, 50.672691345214844, 52.70954513549805, 54.74639892578125, 56.78325653076172, 58.82011032104492, 60.856964111328125, 62.893821716308594]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 5.0, 15.0, 12.0, 13.0, 10.0, 19.0, 18.0, 29.0, 32.0, 25.0, 30.0, 31.0, 33.0, 34.0, 45.0, 40.0, 55.0, 46.0, 34.0, 42.0, 40.0, 53.0, 47.0, 26.0, 30.0, 38.0, 19.0, 26.0, 22.0, 16.0, 22.0, 20.0, 8.0, 8.0, 8.0, 5.0, 11.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-40.56049728393555, -39.519813537597656, -38.479129791259766, -37.438446044921875, -36.397762298583984, -35.357078552246094, -34.3163948059082, -33.27571105957031, -32.23503112792969, -31.194347381591797, -30.153663635253906, -29.112979888916016, -28.072296142578125, -27.031612396240234, -25.990930557250977, -24.950246810913086, -23.909561157226562, -22.868877410888672, -21.82819366455078, -20.78750991821289, -19.746826171875, -18.70614242553711, -17.66546058654785, -16.62477684020996, -15.58409309387207, -14.54340934753418, -13.502725601196289, -12.462042808532715, -11.421359062194824, -10.380675315856934, -9.33999252319336, -8.299308776855469, -7.258628845214844, -6.217945098876953, -5.177261829376221, -4.136578559875488, -3.0958948135375977, -2.055211067199707, -1.0145277976989746, 0.026155471801757812, 1.0668392181396484, 2.10752272605896, 3.1482062339782715, 4.188889503479004, 5.2295732498168945, 6.270256996154785, 7.310940265655518, 8.35162353515625, 9.39230728149414, 10.432991027832031, 11.473674774169922, 12.514357566833496, 13.555041313171387, 14.595725059509277, 15.636407852172852, 16.677091598510742, 17.717775344848633, 18.758459091186523, 19.799142837524414, 20.839826583862305, 21.880508422851562, 22.921192169189453, 23.961875915527344, 25.002559661865234, 26.043243408203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 19.0, 16.0, 21.0, 21.0, 24.0, 29.0, 21.0, 20.0, 32.0, 30.0, 33.0, 41.0, 42.0, 44.0, 49.0, 38.0, 43.0, 43.0, 25.0, 47.0, 37.0, 30.0, 33.0, 27.0, 23.0, 25.0, 25.0, 13.0, 22.0, 10.0, 17.0, 14.0, 12.0, 9.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.540252685546875, -3.40667724609375, -3.273101806640625, -3.1395263671875, -3.005950927734375, -2.87237548828125, -2.738800048828125, -2.605224609375, -2.471649169921875, -2.33807373046875, -2.204498291015625, -2.0709228515625, -1.937347412109375, -1.80377197265625, -1.670196533203125, -1.53662109375, -1.403045654296875, -1.26947021484375, -1.135894775390625, -1.0023193359375, -0.868743896484375, -0.73516845703125, -0.601593017578125, -0.468017578125, -0.334442138671875, -0.20086669921875, -0.067291259765625, 0.0662841796875, 0.199859619140625, 0.33343505859375, 0.467010498046875, 0.6005859375, 0.734161376953125, 0.86773681640625, 1.001312255859375, 1.1348876953125, 1.268463134765625, 1.40203857421875, 1.535614013671875, 1.669189453125, 1.802764892578125, 1.93634033203125, 2.069915771484375, 2.2034912109375, 2.337066650390625, 2.47064208984375, 2.604217529296875, 2.73779296875, 2.871368408203125, 3.00494384765625, 3.138519287109375, 3.2720947265625, 3.405670166015625, 3.53924560546875, 3.672821044921875, 3.806396484375, 3.939971923828125, 4.07354736328125, 4.207122802734375, 4.3406982421875, 4.474273681640625, 4.60784912109375, 4.741424560546875, 4.875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 17.0, 19.0, 25.0, 29.0, 42.0, 82.0, 98.0, 145.0, 229.0, 354.0, 627.0, 1113.0, 2072.0, 4552.0, 12891.0, 70010.0, 990185.0, 2717210.0, 348349.0, 31169.0, 8062.0, 3255.0, 1532.0, 853.0, 476.0, 303.0, 184.0, 115.0, 70.0, 63.0, 43.0, 39.0, 7.0, 18.0, 12.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5234375, -12.168701171875, -11.81396484375, -11.459228515625, -11.1044921875, -10.749755859375, -10.39501953125, -10.040283203125, -9.685546875, -9.330810546875, -8.97607421875, -8.621337890625, -8.2666015625, -7.911865234375, -7.55712890625, -7.202392578125, -6.84765625, -6.492919921875, -6.13818359375, -5.783447265625, -5.4287109375, -5.073974609375, -4.71923828125, -4.364501953125, -4.009765625, -3.655029296875, -3.30029296875, -2.945556640625, -2.5908203125, -2.236083984375, -1.88134765625, -1.526611328125, -1.171875, -0.817138671875, -0.46240234375, -0.107666015625, 0.2470703125, 0.601806640625, 0.95654296875, 1.311279296875, 1.666015625, 2.020751953125, 2.37548828125, 2.730224609375, 3.0849609375, 3.439697265625, 3.79443359375, 4.149169921875, 4.50390625, 4.858642578125, 5.21337890625, 5.568115234375, 5.9228515625, 6.277587890625, 6.63232421875, 6.987060546875, 7.341796875, 7.696533203125, 8.05126953125, 8.406005859375, 8.7607421875, 9.115478515625, 9.47021484375, 9.824951171875, 10.1796875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 4.0, 5.0, 9.0, 16.0, 18.0, 21.0, 42.0, 41.0, 58.0, 83.0, 132.0, 139.0, 213.0, 281.0, 370.0, 481.0, 451.0, 394.0, 308.0, 248.0, 183.0, 143.0, 102.0, 79.0, 53.0, 42.0, 38.0, 25.0, 23.0, 15.0, 5.0, 8.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.9169921875, -6.693359375, -6.4697265625, -6.24609375, -6.0224609375, -5.798828125, -5.5751953125, -5.3515625, -5.1279296875, -4.904296875, -4.6806640625, -4.45703125, -4.2333984375, -4.009765625, -3.7861328125, -3.5625, -3.3388671875, -3.115234375, -2.8916015625, -2.66796875, -2.4443359375, -2.220703125, -1.9970703125, -1.7734375, -1.5498046875, -1.326171875, -1.1025390625, -0.87890625, -0.6552734375, -0.431640625, -0.2080078125, 0.015625, 0.2392578125, 0.462890625, 0.6865234375, 0.91015625, 1.1337890625, 1.357421875, 1.5810546875, 1.8046875, 2.0283203125, 2.251953125, 2.4755859375, 2.69921875, 2.9228515625, 3.146484375, 3.3701171875, 3.59375, 3.8173828125, 4.041015625, 4.2646484375, 4.48828125, 4.7119140625, 4.935546875, 5.1591796875, 5.3828125, 5.6064453125, 5.830078125, 6.0537109375, 6.27734375, 6.5009765625, 6.724609375, 6.9482421875, 7.171875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 11.0, 8.0, 10.0, 13.0, 11.0, 19.0, 25.0, 43.0, 56.0, 63.0, 98.0, 156.0, 261.0, 424.0, 637.0, 1354.0, 3473.0, 13554.0, 130726.0, 2830723.0, 1146555.0, 53420.0, 7872.0, 2326.0, 996.0, 519.0, 291.0, 196.0, 110.0, 89.0, 72.0, 48.0, 27.0, 19.0, 20.0, 9.0, 10.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.593505859375, -12.17138671875, -11.749267578125, -11.3271484375, -10.905029296875, -10.48291015625, -10.060791015625, -9.638671875, -9.216552734375, -8.79443359375, -8.372314453125, -7.9501953125, -7.528076171875, -7.10595703125, -6.683837890625, -6.26171875, -5.839599609375, -5.41748046875, -4.995361328125, -4.5732421875, -4.151123046875, -3.72900390625, -3.306884765625, -2.884765625, -2.462646484375, -2.04052734375, -1.618408203125, -1.1962890625, -0.774169921875, -0.35205078125, 0.070068359375, 0.4921875, 0.914306640625, 1.33642578125, 1.758544921875, 2.1806640625, 2.602783203125, 3.02490234375, 3.447021484375, 3.869140625, 4.291259765625, 4.71337890625, 5.135498046875, 5.5576171875, 5.979736328125, 6.40185546875, 6.823974609375, 7.24609375, 7.668212890625, 8.09033203125, 8.512451171875, 8.9345703125, 9.356689453125, 9.77880859375, 10.200927734375, 10.623046875, 11.045166015625, 11.46728515625, 11.889404296875, 12.3115234375, 12.733642578125, 13.15576171875, 13.577880859375, 14.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 829.0, 112.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-513.6961059570312, -504.27490234375, -494.85369873046875, -485.4325256347656, -476.0113220214844, -466.5901184082031, -457.1689147949219, -447.7477111816406, -438.3265380859375, -428.90533447265625, -419.484130859375, -410.0629577636719, -400.6417541503906, -391.2205505371094, -381.7993469238281, -372.3781433105469, -362.9569396972656, -353.5357360839844, -344.1145324707031, -334.693359375, -325.27215576171875, -315.8509521484375, -306.42974853515625, -297.008544921875, -287.58734130859375, -278.1661376953125, -268.74493408203125, -259.3237609863281, -249.90255737304688, -240.48135375976562, -231.06015014648438, -221.63894653320312, -212.21780395507812, -202.79660034179688, -193.3754119873047, -183.95420837402344, -174.53302001953125, -165.11181640625, -155.69061279296875, -146.2694091796875, -136.84820556640625, -127.42700958251953, -118.00581359863281, -108.58460998535156, -99.16341400146484, -89.74221801757812, -80.32101440429688, -70.89981842041016, -61.47863006591797, -52.05743408203125, -42.636234283447266, -33.21503448486328, -23.793838500976562, -14.372642517089844, -4.951442718505859, 4.469757080078125, 13.890953063964844, 23.312150955200195, 32.73334884643555, 42.15454864501953, 51.57574462890625, 60.99694061279297, 70.41813659667969, 79.83934020996094, 89.26053619384766]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 3.0, 9.0, 12.0, 11.0, 29.0, 40.0, 37.0, 45.0, 66.0, 55.0, 69.0, 55.0, 82.0, 56.0, 79.0, 56.0, 54.0, 51.0, 49.0, 52.0, 33.0, 14.0, 19.0, 12.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.30732727050781, -40.75027847290039, -39.19322967529297, -37.63618469238281, -36.07913589477539, -34.52208709716797, -32.96504211425781, -31.40799331665039, -29.85094451904297, -28.293895721435547, -26.736848831176758, -25.17980194091797, -23.622753143310547, -22.065704345703125, -20.508657455444336, -18.951610565185547, -17.394561767578125, -15.83751392364502, -14.280466079711914, -12.723418235778809, -11.166370391845703, -9.609322547912598, -8.052274703979492, -6.495226860046387, -4.938179016113281, -3.381131172180176, -1.8240833282470703, -0.26703548431396484, 1.2900123596191406, 2.847060203552246, 4.404108047485352, 5.961155891418457, 7.518199920654297, 9.075247764587402, 10.632295608520508, 12.189343452453613, 13.746391296386719, 15.303439140319824, 16.86048698425293, 18.41753387451172, 19.97458267211914, 21.531631469726562, 23.08867835998535, 24.64572525024414, 26.202774047851562, 27.759822845458984, 29.316869735717773, 30.873916625976562, 32.430965423583984, 33.988014221191406, 35.54505920410156, 37.102108001708984, 38.659156799316406, 40.21620559692383, 41.77325439453125, 43.330299377441406, 44.88734817504883, 46.44439697265625, 48.001441955566406, 49.55849075317383, 51.11553955078125, 52.67258834838867, 54.229637145996094, 55.78668212890625, 57.34373092651367]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 5.0, 8.0, 8.0, 9.0, 6.0, 18.0, 7.0, 16.0, 10.0, 25.0, 20.0, 30.0, 23.0, 30.0, 27.0, 32.0, 44.0, 27.0, 37.0, 42.0, 42.0, 34.0, 42.0, 43.0, 34.0, 33.0, 34.0, 33.0, 36.0, 41.0, 32.0, 21.0, 15.0, 18.0, 18.0, 17.0, 11.0, 10.0, 9.0, 12.0, 6.0, 10.0, 1.0, 3.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.611328125, -3.503875732421875, -3.39642333984375, -3.288970947265625, -3.1815185546875, -3.074066162109375, -2.96661376953125, -2.859161376953125, -2.751708984375, -2.644256591796875, -2.53680419921875, -2.429351806640625, -2.3218994140625, -2.214447021484375, -2.10699462890625, -1.999542236328125, -1.89208984375, -1.784637451171875, -1.67718505859375, -1.569732666015625, -1.4622802734375, -1.354827880859375, -1.24737548828125, -1.139923095703125, -1.032470703125, -0.925018310546875, -0.81756591796875, -0.710113525390625, -0.6026611328125, -0.495208740234375, -0.38775634765625, -0.280303955078125, -0.1728515625, -0.065399169921875, 0.04205322265625, 0.149505615234375, 0.2569580078125, 0.364410400390625, 0.47186279296875, 0.579315185546875, 0.686767578125, 0.794219970703125, 0.90167236328125, 1.009124755859375, 1.1165771484375, 1.224029541015625, 1.33148193359375, 1.438934326171875, 1.54638671875, 1.653839111328125, 1.76129150390625, 1.868743896484375, 1.9761962890625, 2.083648681640625, 2.19110107421875, 2.298553466796875, 2.406005859375, 2.513458251953125, 2.62091064453125, 2.728363037109375, 2.8358154296875, 2.943267822265625, 3.05072021484375, 3.158172607421875, 3.265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 7.0, 10.0, 16.0, 19.0, 24.0, 35.0, 59.0, 119.0, 183.0, 235.0, 354.0, 655.0, 1074.0, 1886.0, 3207.0, 5817.0, 11323.0, 27058.0, 83335.0, 339567.0, 407300.0, 105794.0, 31968.0, 13187.0, 6660.0, 3608.0, 1953.0, 1204.0, 669.0, 452.0, 280.0, 181.0, 115.0, 69.0, 39.0, 32.0, 19.0, 13.0, 11.0, 8.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5732421875, -1.53082275390625, -1.4884033203125, -1.44598388671875, -1.403564453125, -1.36114501953125, -1.3187255859375, -1.27630615234375, -1.23388671875, -1.19146728515625, -1.1490478515625, -1.10662841796875, -1.064208984375, -1.02178955078125, -0.9793701171875, -0.93695068359375, -0.89453125, -0.85211181640625, -0.8096923828125, -0.76727294921875, -0.724853515625, -0.68243408203125, -0.6400146484375, -0.59759521484375, -0.55517578125, -0.51275634765625, -0.4703369140625, -0.42791748046875, -0.385498046875, -0.34307861328125, -0.3006591796875, -0.25823974609375, -0.2158203125, -0.17340087890625, -0.1309814453125, -0.08856201171875, -0.046142578125, -0.00372314453125, 0.0386962890625, 0.08111572265625, 0.12353515625, 0.16595458984375, 0.2083740234375, 0.25079345703125, 0.293212890625, 0.33563232421875, 0.3780517578125, 0.42047119140625, 0.462890625, 0.50531005859375, 0.5477294921875, 0.59014892578125, 0.632568359375, 0.67498779296875, 0.7174072265625, 0.75982666015625, 0.80224609375, 0.84466552734375, 0.8870849609375, 0.92950439453125, 0.971923828125, 1.01434326171875, 1.0567626953125, 1.09918212890625, 1.1416015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 10.0, 11.0, 7.0, 14.0, 14.0, 10.0, 22.0, 24.0, 21.0, 28.0, 30.0, 29.0, 36.0, 29.0, 54.0, 43.0, 45.0, 38.0, 1073.0, 32.0, 40.0, 45.0, 33.0, 31.0, 30.0, 36.0, 31.0, 18.0, 33.0, 27.0, 18.0, 18.0, 15.0, 20.0, 6.0, 7.0, 4.0, 13.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.63067626953125, -2.5465087890625, -2.46234130859375, -2.378173828125, -2.29400634765625, -2.2098388671875, -2.12567138671875, -2.04150390625, -1.95733642578125, -1.8731689453125, -1.78900146484375, -1.704833984375, -1.62066650390625, -1.5364990234375, -1.45233154296875, -1.3681640625, -1.28399658203125, -1.1998291015625, -1.11566162109375, -1.031494140625, -0.94732666015625, -0.8631591796875, -0.77899169921875, -0.69482421875, -0.61065673828125, -0.5264892578125, -0.44232177734375, -0.358154296875, -0.27398681640625, -0.1898193359375, -0.10565185546875, -0.021484375, 0.06268310546875, 0.1468505859375, 0.23101806640625, 0.315185546875, 0.39935302734375, 0.4835205078125, 0.56768798828125, 0.65185546875, 0.73602294921875, 0.8201904296875, 0.90435791015625, 0.988525390625, 1.07269287109375, 1.1568603515625, 1.24102783203125, 1.3251953125, 1.40936279296875, 1.4935302734375, 1.57769775390625, 1.661865234375, 1.74603271484375, 1.8302001953125, 1.91436767578125, 1.99853515625, 2.08270263671875, 2.1668701171875, 2.25103759765625, 2.335205078125, 2.41937255859375, 2.5035400390625, 2.58770751953125, 2.671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 9.0, 16.0, 21.0, 16.0, 30.0, 35.0, 56.0, 81.0, 109.0, 167.0, 252.0, 379.0, 522.0, 764.0, 1227.0, 1965.0, 3071.0, 5216.0, 10115.0, 24106.0, 83710.0, 577216.0, 1223907.0, 108795.0, 28755.0, 11538.0, 5838.0, 3217.0, 2012.0, 1299.0, 859.0, 565.0, 353.0, 260.0, 166.0, 133.0, 95.0, 72.0, 47.0, 41.0, 17.0, 20.0, 15.0, 13.0, 7.0, 3.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.9921875, -0.9621963500976562, -0.9322052001953125, -0.9022140502929688, -0.872222900390625, -0.8422317504882812, -0.8122406005859375, -0.7822494506835938, -0.75225830078125, -0.7222671508789062, -0.6922760009765625, -0.6622848510742188, -0.632293701171875, -0.6023025512695312, -0.5723114013671875, -0.5423202514648438, -0.5123291015625, -0.48233795166015625, -0.4523468017578125, -0.42235565185546875, -0.392364501953125, -0.36237335205078125, -0.3323822021484375, -0.30239105224609375, -0.27239990234375, -0.24240875244140625, -0.2124176025390625, -0.18242645263671875, -0.152435302734375, -0.12244415283203125, -0.0924530029296875, -0.06246185302734375, -0.032470703125, -0.00247955322265625, 0.0275115966796875, 0.05750274658203125, 0.087493896484375, 0.11748504638671875, 0.1474761962890625, 0.17746734619140625, 0.20745849609375, 0.23744964599609375, 0.2674407958984375, 0.29743194580078125, 0.327423095703125, 0.35741424560546875, 0.3874053955078125, 0.41739654541015625, 0.4473876953125, 0.47737884521484375, 0.5073699951171875, 0.5373611450195312, 0.567352294921875, 0.5973434448242188, 0.6273345947265625, 0.6573257446289062, 0.68731689453125, 0.7173080444335938, 0.7472991943359375, 0.7772903442382812, 0.807281494140625, 0.8372726440429688, 0.8672637939453125, 0.8972549438476562, 0.92724609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 13.0, 21.0, 53.0, 564.0, 243.0, 47.0, 16.0, 8.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5131759643554688, -0.4975433349609375, -0.48191070556640625, -0.466278076171875, -0.45064544677734375, -0.4350128173828125, -0.41938018798828125, -0.40374755859375, -0.38811492919921875, -0.3724822998046875, -0.35684967041015625, -0.341217041015625, -0.32558441162109375, -0.3099517822265625, -0.29431915283203125, -0.2786865234375, -0.26305389404296875, -0.2474212646484375, -0.23178863525390625, -0.216156005859375, -0.20052337646484375, -0.1848907470703125, -0.16925811767578125, -0.15362548828125, -0.13799285888671875, -0.1223602294921875, -0.10672760009765625, -0.091094970703125, -0.07546234130859375, -0.0598297119140625, -0.04419708251953125, -0.028564453125, -0.01293182373046875, 0.0027008056640625, 0.01833343505859375, 0.033966064453125, 0.04959869384765625, 0.0652313232421875, 0.08086395263671875, 0.09649658203125, 0.11212921142578125, 0.1277618408203125, 0.14339447021484375, 0.159027099609375, 0.17465972900390625, 0.1902923583984375, 0.20592498779296875, 0.2215576171875, 0.23719024658203125, 0.2528228759765625, 0.26845550537109375, 0.284088134765625, 0.29972076416015625, 0.3153533935546875, 0.33098602294921875, 0.34661865234375, 0.36225128173828125, 0.3778839111328125, 0.39351654052734375, 0.409149169921875, 0.42478179931640625, 0.4404144287109375, 0.45604705810546875, 0.4716796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 3.0, 11.0, 9.0, 9.0, 8.0, 12.0, 15.0, 21.0, 37.0, 64.0, 214.0, 1569.0, 15985.0, 1025634.0, 4189.0, 505.0, 93.0, 43.0, 20.0, 18.0, 12.0, 9.0, 6.0, 10.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.45458984375, -8.1748046875, -7.89501953125, -7.615234375, -7.33544921875, -7.0556640625, -6.77587890625, -6.49609375, -6.21630859375, -5.9365234375, -5.65673828125, -5.376953125, -5.09716796875, -4.8173828125, -4.53759765625, -4.2578125, -3.97802734375, -3.6982421875, -3.41845703125, -3.138671875, -2.85888671875, -2.5791015625, -2.29931640625, -2.01953125, -1.73974609375, -1.4599609375, -1.18017578125, -0.900390625, -0.62060546875, -0.3408203125, -0.06103515625, 0.21875, 0.49853515625, 0.7783203125, 1.05810546875, 1.337890625, 1.61767578125, 1.8974609375, 2.17724609375, 2.45703125, 2.73681640625, 3.0166015625, 3.29638671875, 3.576171875, 3.85595703125, 4.1357421875, 4.41552734375, 4.6953125, 4.97509765625, 5.2548828125, 5.53466796875, 5.814453125, 6.09423828125, 6.3740234375, 6.65380859375, 6.93359375, 7.21337890625, 7.4931640625, 7.77294921875, 8.052734375, 8.33251953125, 8.6123046875, 8.89208984375, 9.171875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 40.0, 80.0, 518.0, 264.0, 68.0, 24.0, 10.0, 6.0, 0.0, 2.0], "bins": [-3.009080410003662, -2.956098794937134, -2.9031171798706055, -2.850135564804077, -2.797153949737549, -2.7441723346710205, -2.691190719604492, -2.638209104537964, -2.5852274894714355, -2.5322458744049072, -2.479264259338379, -2.4262826442718506, -2.3733010292053223, -2.320319414138794, -2.2673377990722656, -2.2143561840057373, -2.161374568939209, -2.1083929538726807, -2.0554113388061523, -2.002429723739624, -1.9494481086730957, -1.8964664936065674, -1.843484878540039, -1.7905032634735107, -1.7375214099884033, -1.684539794921875, -1.6315581798553467, -1.5785765647888184, -1.52559494972229, -1.4726133346557617, -1.4196317195892334, -1.366650104522705, -1.3136684894561768, -1.2606868743896484, -1.2077052593231201, -1.1547236442565918, -1.1017420291900635, -1.0487604141235352, -0.9957787394523621, -0.9427971243858337, -0.8898155689239502, -0.8368339538574219, -0.7838523387908936, -0.7308707237243652, -0.6778891086578369, -0.6249074935913086, -0.5719258189201355, -0.5189442038536072, -0.46596258878707886, -0.41298097372055054, -0.3599993586540222, -0.3070177137851715, -0.2540360987186432, -0.20105448365211487, -0.14807283878326416, -0.09509122371673584, -0.04210960865020752, 0.010872013866901398, 0.06385363638401031, 0.11683526635169983, 0.16981688141822815, 0.22279849648475647, 0.2757801413536072, 0.3287617564201355, 0.3817433714866638]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 7.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 20.0, 12.0, 11.0, 18.0, 19.0, 26.0, 16.0, 24.0, 34.0, 27.0, 35.0, 45.0, 42.0, 28.0, 41.0, 41.0, 52.0, 38.0, 29.0, 41.0, 36.0, 39.0, 30.0, 31.0, 25.0, 28.0, 33.0, 16.0, 22.0, 22.0, 20.0, 17.0, 7.0, 9.0, 5.0, 5.0, 4.0, 10.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.26025938987731934, -0.25271737575531006, -0.2451753467321396, -0.23763331770896912, -0.23009130358695984, -0.22254927456378937, -0.2150072455406189, -0.20746523141860962, -0.19992320239543915, -0.19238117337226868, -0.1848391592502594, -0.17729713022708893, -0.16975510120391846, -0.16221308708190918, -0.1546710580587387, -0.14712902903556824, -0.13958701491355896, -0.1320449858903885, -0.12450297176837921, -0.11696094274520874, -0.10941892117261887, -0.10187689960002899, -0.09433487057685852, -0.08679284900426865, -0.07925082743167877, -0.0717088058590889, -0.06416678428649902, -0.05662475526332855, -0.04908273369073868, -0.041540712118148804, -0.03399868682026863, -0.026456661522388458, -0.018914639949798584, -0.01137261651456356, -0.003830593079328537, 0.0037114303559064865, 0.01125345379114151, 0.018795475363731384, 0.026337500661611557, 0.03387952595949173, 0.041421547532081604, 0.04896356910467148, 0.05650559440255165, 0.06404761970043182, 0.0715896412730217, 0.07913166284561157, 0.08667369186878204, 0.09421571344137192, 0.10175773501396179, 0.10929975658655167, 0.11684177815914154, 0.12438380718231201, 0.1319258213043213, 0.13946785032749176, 0.14700987935066223, 0.1545518934726715, 0.16209392249584198, 0.16963595151901245, 0.17717796564102173, 0.1847199946641922, 0.19226202368736267, 0.19980403780937195, 0.20734606683254242, 0.2148880958557129, 0.22243010997772217]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 5.0, 12.0, 11.0, 8.0, 4.0, 6.0, 15.0, 16.0, 17.0, 21.0, 31.0, 19.0, 36.0, 28.0, 28.0, 32.0, 31.0, 48.0, 38.0, 35.0, 38.0, 38.0, 41.0, 40.0, 37.0, 30.0, 47.0, 37.0, 33.0, 27.0, 19.0, 22.0, 21.0, 25.0, 21.0, 13.0, 11.0, 12.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.783203125, -3.672149658203125, -3.56109619140625, -3.450042724609375, -3.3389892578125, -3.227935791015625, -3.11688232421875, -3.005828857421875, -2.894775390625, -2.783721923828125, -2.67266845703125, -2.561614990234375, -2.4505615234375, -2.339508056640625, -2.22845458984375, -2.117401123046875, -2.00634765625, -1.895294189453125, -1.78424072265625, -1.673187255859375, -1.5621337890625, -1.451080322265625, -1.34002685546875, -1.228973388671875, -1.117919921875, -1.006866455078125, -0.89581298828125, -0.784759521484375, -0.6737060546875, -0.562652587890625, -0.45159912109375, -0.340545654296875, -0.2294921875, -0.118438720703125, -0.00738525390625, 0.103668212890625, 0.2147216796875, 0.325775146484375, 0.43682861328125, 0.547882080078125, 0.658935546875, 0.769989013671875, 0.88104248046875, 0.992095947265625, 1.1031494140625, 1.214202880859375, 1.32525634765625, 1.436309814453125, 1.54736328125, 1.658416748046875, 1.76947021484375, 1.880523681640625, 1.9915771484375, 2.102630615234375, 2.21368408203125, 2.324737548828125, 2.435791015625, 2.546844482421875, 2.65789794921875, 2.768951416015625, 2.8800048828125, 2.991058349609375, 3.10211181640625, 3.213165283203125, 3.32421875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 10.0, 12.0, 11.0, 15.0, 29.0, 29.0, 38.0, 58.0, 86.0, 101.0, 126.0, 202.0, 288.0, 466.0, 735.0, 1321.0, 2236.0, 4727.0, 10480.0, 27993.0, 93345.0, 349316.0, 392021.0, 110230.0, 31431.0, 11730.0, 5158.0, 2519.0, 1400.0, 878.0, 523.0, 289.0, 200.0, 152.0, 108.0, 78.0, 50.0, 43.0, 26.0, 32.0, 15.0, 10.0, 5.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.75, -4.6063232421875, -4.462646484375, -4.3189697265625, -4.17529296875, -4.0316162109375, -3.887939453125, -3.7442626953125, -3.6005859375, -3.4569091796875, -3.313232421875, -3.1695556640625, -3.02587890625, -2.8822021484375, -2.738525390625, -2.5948486328125, -2.451171875, -2.3074951171875, -2.163818359375, -2.0201416015625, -1.87646484375, -1.7327880859375, -1.589111328125, -1.4454345703125, -1.3017578125, -1.1580810546875, -1.014404296875, -0.8707275390625, -0.72705078125, -0.5833740234375, -0.439697265625, -0.2960205078125, -0.15234375, -0.0086669921875, 0.135009765625, 0.2786865234375, 0.42236328125, 0.5660400390625, 0.709716796875, 0.8533935546875, 0.9970703125, 1.1407470703125, 1.284423828125, 1.4281005859375, 1.57177734375, 1.7154541015625, 1.859130859375, 2.0028076171875, 2.146484375, 2.2901611328125, 2.433837890625, 2.5775146484375, 2.72119140625, 2.8648681640625, 3.008544921875, 3.1522216796875, 3.2958984375, 3.4395751953125, 3.583251953125, 3.7269287109375, 3.87060546875, 4.0142822265625, 4.157958984375, 4.3016357421875, 4.4453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 7.0, 16.0, 14.0, 15.0, 23.0, 28.0, 30.0, 33.0, 25.0, 46.0, 65.0, 62.0, 108.0, 202.0, 1420.0, 281.0, 150.0, 111.0, 62.0, 41.0, 52.0, 26.0, 25.0, 23.0, 21.0, 16.0, 22.0, 11.0, 15.0, 12.0, 12.0, 6.0, 12.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.3446044921875, -8.064208984375, -7.7838134765625, -7.50341796875, -7.2230224609375, -6.942626953125, -6.6622314453125, -6.3818359375, -6.1014404296875, -5.821044921875, -5.5406494140625, -5.26025390625, -4.9798583984375, -4.699462890625, -4.4190673828125, -4.138671875, -3.8582763671875, -3.577880859375, -3.2974853515625, -3.01708984375, -2.7366943359375, -2.456298828125, -2.1759033203125, -1.8955078125, -1.6151123046875, -1.334716796875, -1.0543212890625, -0.77392578125, -0.4935302734375, -0.213134765625, 0.0672607421875, 0.34765625, 0.6280517578125, 0.908447265625, 1.1888427734375, 1.46923828125, 1.7496337890625, 2.030029296875, 2.3104248046875, 2.5908203125, 2.8712158203125, 3.151611328125, 3.4320068359375, 3.71240234375, 3.9927978515625, 4.273193359375, 4.5535888671875, 4.833984375, 5.1143798828125, 5.394775390625, 5.6751708984375, 5.95556640625, 6.2359619140625, 6.516357421875, 6.7967529296875, 7.0771484375, 7.3575439453125, 7.637939453125, 7.9183349609375, 8.19873046875, 8.4791259765625, 8.759521484375, 9.0399169921875, 9.3203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 22.0, 12.0, 21.0, 23.0, 28.0, 40.0, 45.0, 47.0, 59.0, 80.0, 149.0, 201.0, 305.0, 626.0, 1679.0, 20379.0, 3006916.0, 110254.0, 2824.0, 799.0, 364.0, 238.0, 154.0, 98.0, 76.0, 56.0, 40.0, 28.0, 26.0, 23.0, 16.0, 15.0, 11.0, 11.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.4578857421875, -13.970458984375, -13.4830322265625, -12.99560546875, -12.5081787109375, -12.020751953125, -11.5333251953125, -11.0458984375, -10.5584716796875, -10.071044921875, -9.5836181640625, -9.09619140625, -8.6087646484375, -8.121337890625, -7.6339111328125, -7.146484375, -6.6590576171875, -6.171630859375, -5.6842041015625, -5.19677734375, -4.7093505859375, -4.221923828125, -3.7344970703125, -3.2470703125, -2.7596435546875, -2.272216796875, -1.7847900390625, -1.29736328125, -0.8099365234375, -0.322509765625, 0.1649169921875, 0.65234375, 1.1397705078125, 1.627197265625, 2.1146240234375, 2.60205078125, 3.0894775390625, 3.576904296875, 4.0643310546875, 4.5517578125, 5.0391845703125, 5.526611328125, 6.0140380859375, 6.50146484375, 6.9888916015625, 7.476318359375, 7.9637451171875, 8.451171875, 8.9385986328125, 9.426025390625, 9.9134521484375, 10.40087890625, 10.8883056640625, 11.375732421875, 11.8631591796875, 12.3505859375, 12.8380126953125, 13.325439453125, 13.8128662109375, 14.30029296875, 14.7877197265625, 15.275146484375, 15.7625732421875, 16.25]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 11.0, 45.0, 118.0, 262.0, 309.0, 191.0, 55.0, 15.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.02979278564453, -63.557804107666016, -62.085819244384766, -60.61383056640625, -59.141845703125, -57.669857025146484, -56.19786834716797, -54.72588348388672, -53.2538948059082, -51.78190612792969, -50.30992126464844, -48.83793258666992, -47.365943908691406, -45.893959045410156, -44.42197036743164, -42.949981689453125, -41.477996826171875, -40.00600814819336, -38.53402328491211, -37.062034606933594, -35.590049743652344, -34.11806106567383, -32.64607238769531, -31.17408561706543, -29.702098846435547, -28.230112075805664, -26.75812530517578, -25.286136627197266, -23.814149856567383, -22.3421630859375, -20.870174407958984, -19.3981876373291, -17.926197052001953, -16.45421028137207, -14.982222557067871, -13.510234832763672, -12.038248062133789, -10.566261291503906, -9.094273567199707, -7.622285842895508, -6.150299072265625, -4.678311824798584, -3.206324577331543, -1.734337329864502, -0.26235008239746094, 1.20963716506958, 2.681624412536621, 4.15361213684082, 5.625598907470703, 7.097586154937744, 8.569573402404785, 10.041561126708984, 11.513547897338867, 12.98553466796875, 14.45752239227295, 15.929510116577148, 17.40149688720703, 18.873483657836914, 20.345470428466797, 21.817459106445312, 23.289445877075195, 24.761432647705078, 26.233421325683594, 27.705408096313477, 29.17739486694336]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 10.0, 5.0, 17.0, 8.0, 12.0, 17.0, 14.0, 17.0, 19.0, 26.0, 27.0, 31.0, 35.0, 32.0, 34.0, 34.0, 35.0, 35.0, 38.0, 40.0, 41.0, 45.0, 37.0, 31.0, 38.0, 30.0, 24.0, 33.0, 28.0, 26.0, 23.0, 17.0, 23.0, 17.0, 12.0, 7.0, 9.0, 12.0, 8.0, 5.0, 3.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-20.757801055908203, -20.126150131225586, -19.4945011138916, -18.862850189208984, -18.231201171875, -17.599550247192383, -16.9679012298584, -16.33625030517578, -15.704601287841797, -15.072951316833496, -14.441301345825195, -13.809651374816895, -13.178001403808594, -12.546351432800293, -11.914701461791992, -11.283050537109375, -10.651400566101074, -10.019750595092773, -9.388100624084473, -8.756450653076172, -8.124800682067871, -7.49315071105957, -6.861500263214111, -6.2298502922058105, -5.59820032119751, -4.966550350189209, -4.334900379180908, -3.7032501697540283, -3.0716001987457275, -2.4399502277374268, -1.8083000183105469, -1.176650047302246, -0.5450000762939453, 0.08664995431900024, 0.7182999849319458, 1.3499500751495361, 1.981600046157837, 2.6132500171661377, 3.2449002265930176, 3.8765501976013184, 4.508200168609619, 5.13985013961792, 5.771500110626221, 6.40315055847168, 7.0348005294799805, 7.666450500488281, 8.298100471496582, 8.929750442504883, 9.561400413513184, 10.193050384521484, 10.824700355529785, 11.456350326538086, 12.088000297546387, 12.719650268554688, 13.351301193237305, 13.982950210571289, 14.614601135253906, 15.246251106262207, 15.877901077270508, 16.509552001953125, 17.14120101928711, 17.772851943969727, 18.40450096130371, 19.036151885986328, 19.667800903320312]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 13.0, 8.0, 14.0, 30.0, 18.0, 18.0, 22.0, 22.0, 21.0, 30.0, 26.0, 23.0, 30.0, 24.0, 29.0, 42.0, 41.0, 41.0, 48.0, 44.0, 36.0, 32.0, 26.0, 30.0, 37.0, 34.0, 27.0, 34.0, 18.0, 21.0, 17.0, 24.0, 15.0, 12.0, 2.0, 9.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0], "bins": [-3.8046875, -3.6904296875, -3.576171875, -3.4619140625, -3.34765625, -3.2333984375, -3.119140625, -3.0048828125, -2.890625, -2.7763671875, -2.662109375, -2.5478515625, -2.43359375, -2.3193359375, -2.205078125, -2.0908203125, -1.9765625, -1.8623046875, -1.748046875, -1.6337890625, -1.51953125, -1.4052734375, -1.291015625, -1.1767578125, -1.0625, -0.9482421875, -0.833984375, -0.7197265625, -0.60546875, -0.4912109375, -0.376953125, -0.2626953125, -0.1484375, -0.0341796875, 0.080078125, 0.1943359375, 0.30859375, 0.4228515625, 0.537109375, 0.6513671875, 0.765625, 0.8798828125, 0.994140625, 1.1083984375, 1.22265625, 1.3369140625, 1.451171875, 1.5654296875, 1.6796875, 1.7939453125, 1.908203125, 2.0224609375, 2.13671875, 2.2509765625, 2.365234375, 2.4794921875, 2.59375, 2.7080078125, 2.822265625, 2.9365234375, 3.05078125, 3.1650390625, 3.279296875, 3.3935546875, 3.5078125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 3.0, 8.0, 13.0, 13.0, 19.0, 35.0, 28.0, 37.0, 42.0, 62.0, 118.0, 151.0, 210.0, 311.0, 408.0, 651.0, 1014.0, 1621.0, 3281.0, 7892.0, 31385.0, 328782.0, 3016625.0, 734865.0, 48019.0, 10065.0, 3728.0, 1873.0, 998.0, 703.0, 399.0, 269.0, 194.0, 132.0, 95.0, 51.0, 40.0, 29.0, 21.0, 16.0, 12.0, 15.0, 4.0, 12.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-16.375, -15.887939453125, -15.40087890625, -14.913818359375, -14.4267578125, -13.939697265625, -13.45263671875, -12.965576171875, -12.478515625, -11.991455078125, -11.50439453125, -11.017333984375, -10.5302734375, -10.043212890625, -9.55615234375, -9.069091796875, -8.58203125, -8.094970703125, -7.60791015625, -7.120849609375, -6.6337890625, -6.146728515625, -5.65966796875, -5.172607421875, -4.685546875, -4.198486328125, -3.71142578125, -3.224365234375, -2.7373046875, -2.250244140625, -1.76318359375, -1.276123046875, -0.7890625, -0.302001953125, 0.18505859375, 0.672119140625, 1.1591796875, 1.646240234375, 2.13330078125, 2.620361328125, 3.107421875, 3.594482421875, 4.08154296875, 4.568603515625, 5.0556640625, 5.542724609375, 6.02978515625, 6.516845703125, 7.00390625, 7.490966796875, 7.97802734375, 8.465087890625, 8.9521484375, 9.439208984375, 9.92626953125, 10.413330078125, 10.900390625, 11.387451171875, 11.87451171875, 12.361572265625, 12.8486328125, 13.335693359375, 13.82275390625, 14.309814453125, 14.796875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 6.0, 14.0, 20.0, 15.0, 19.0, 18.0, 51.0, 42.0, 64.0, 61.0, 86.0, 109.0, 149.0, 161.0, 183.0, 228.0, 282.0, 308.0, 327.0, 332.0, 307.0, 236.0, 219.0, 145.0, 116.0, 135.0, 81.0, 68.0, 66.0, 34.0, 35.0, 25.0, 32.0, 21.0, 16.0, 14.0, 4.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.20703125, -5.03582763671875, -4.8646240234375, -4.69342041015625, -4.522216796875, -4.35101318359375, -4.1798095703125, -4.00860595703125, -3.83740234375, -3.66619873046875, -3.4949951171875, -3.32379150390625, -3.152587890625, -2.98138427734375, -2.8101806640625, -2.63897705078125, -2.4677734375, -2.29656982421875, -2.1253662109375, -1.95416259765625, -1.782958984375, -1.61175537109375, -1.4405517578125, -1.26934814453125, -1.09814453125, -0.92694091796875, -0.7557373046875, -0.58453369140625, -0.413330078125, -0.24212646484375, -0.0709228515625, 0.10028076171875, 0.271484375, 0.44268798828125, 0.6138916015625, 0.78509521484375, 0.956298828125, 1.12750244140625, 1.2987060546875, 1.46990966796875, 1.64111328125, 1.81231689453125, 1.9835205078125, 2.15472412109375, 2.325927734375, 2.49713134765625, 2.6683349609375, 2.83953857421875, 3.0107421875, 3.18194580078125, 3.3531494140625, 3.52435302734375, 3.695556640625, 3.86676025390625, 4.0379638671875, 4.20916748046875, 4.38037109375, 4.55157470703125, 4.7227783203125, 4.89398193359375, 5.065185546875, 5.23638916015625, 5.4075927734375, 5.57879638671875, 5.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 11.0, 22.0, 46.0, 95.0, 231.0, 507.0, 1273.0, 3345.0, 10046.0, 35585.0, 169234.0, 1033111.0, 2278446.0, 535812.0, 93414.0, 22201.0, 6773.0, 2410.0, 947.0, 414.0, 192.0, 85.0, 32.0, 16.0, 6.0, 3.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8359375, -8.5784912109375, -8.321044921875, -8.0635986328125, -7.80615234375, -7.5487060546875, -7.291259765625, -7.0338134765625, -6.7763671875, -6.5189208984375, -6.261474609375, -6.0040283203125, -5.74658203125, -5.4891357421875, -5.231689453125, -4.9742431640625, -4.716796875, -4.4593505859375, -4.201904296875, -3.9444580078125, -3.68701171875, -3.4295654296875, -3.172119140625, -2.9146728515625, -2.6572265625, -2.3997802734375, -2.142333984375, -1.8848876953125, -1.62744140625, -1.3699951171875, -1.112548828125, -0.8551025390625, -0.59765625, -0.3402099609375, -0.082763671875, 0.1746826171875, 0.43212890625, 0.6895751953125, 0.947021484375, 1.2044677734375, 1.4619140625, 1.7193603515625, 1.976806640625, 2.2342529296875, 2.49169921875, 2.7491455078125, 3.006591796875, 3.2640380859375, 3.521484375, 3.7789306640625, 4.036376953125, 4.2938232421875, 4.55126953125, 4.8087158203125, 5.066162109375, 5.3236083984375, 5.5810546875, 5.8385009765625, 6.095947265625, 6.3533935546875, 6.61083984375, 6.8682861328125, 7.125732421875, 7.3831787109375, 7.640625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 4.0, 13.0, 7.0, 16.0, 13.0, 20.0, 16.0, 23.0, 27.0, 33.0, 27.0, 50.0, 53.0, 61.0, 51.0, 53.0, 53.0, 66.0, 52.0, 59.0, 48.0, 45.0, 42.0, 25.0, 33.0, 16.0, 17.0, 18.0, 9.0, 13.0, 7.0, 12.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.12446212768555, -38.00209426879883, -36.87972640991211, -35.75735855102539, -34.63499450683594, -33.51262664794922, -32.3902587890625, -31.26789093017578, -30.145523071289062, -29.023155212402344, -27.900787353515625, -26.77842140197754, -25.65605354309082, -24.5336856842041, -23.411319732666016, -22.288951873779297, -21.166584014892578, -20.04421615600586, -18.92184829711914, -17.799482345581055, -16.677114486694336, -15.554746627807617, -14.432379722595215, -13.310012817382812, -12.187644958496094, -11.065277099609375, -9.942910194396973, -8.82054328918457, -7.698175430297852, -6.575808048248291, -5.4534406661987305, -4.33107328414917, -3.2087020874023438, -2.086334705352783, -0.9639673233032227, 0.1584000587463379, 1.2807674407958984, 2.403134822845459, 3.5255022048950195, 4.64786958694458, 5.770236968994141, 6.892604351043701, 8.014971733093262, 9.137338638305664, 10.259706497192383, 11.382074356079102, 12.504441261291504, 13.626808166503906, 14.749176025390625, 15.871543884277344, 16.993911743164062, 18.11627769470215, 19.238645553588867, 20.361013412475586, 21.483379364013672, 22.60574722290039, 23.72811508178711, 24.850482940673828, 25.972850799560547, 27.095216751098633, 28.21758460998535, 29.33995246887207, 30.462318420410156, 31.584686279296875, 32.707054138183594]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 5.0, 4.0, 6.0, 4.0, 4.0, 11.0, 25.0, 17.0, 19.0, 21.0, 25.0, 41.0, 31.0, 29.0, 44.0, 32.0, 38.0, 43.0, 55.0, 49.0, 45.0, 49.0, 39.0, 47.0, 37.0, 35.0, 39.0, 30.0, 29.0, 28.0, 22.0, 24.0, 18.0, 11.0, 12.0, 7.0, 7.0, 1.0, 5.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.117645263671875, -33.04658508300781, -31.975522994995117, -30.904462814331055, -29.83340072631836, -28.762340545654297, -27.691280364990234, -26.620220184326172, -25.549158096313477, -24.478097915649414, -23.40703582763672, -22.335975646972656, -21.264915466308594, -20.1938533782959, -19.122793197631836, -18.05173110961914, -16.980670928955078, -15.9096097946167, -14.83854866027832, -13.767488479614258, -12.696427345275879, -11.6253662109375, -10.554306030273438, -9.483244895935059, -8.41218376159668, -7.341122627258301, -6.27006196975708, -5.199001312255859, -4.1279401779174805, -3.0568790435791016, -1.9858183860778809, -0.9147577285766602, 0.15629959106445312, 1.227360486984253, 2.2984213829040527, 3.3694822788238525, 4.440543174743652, 5.511604309082031, 6.582664966583252, 7.653725624084473, 8.724786758422852, 9.79584789276123, 10.86690902709961, 11.937969207763672, 13.00903034210205, 14.08009147644043, 15.151151657104492, 16.222213745117188, 17.29327392578125, 18.364334106445312, 19.435396194458008, 20.50645637512207, 21.577518463134766, 22.648578643798828, 23.71963882446289, 24.790699005126953, 25.86176109313965, 26.93282127380371, 28.003883361816406, 29.07494354248047, 30.14600372314453, 31.217065811157227, 32.28812789916992, 33.359188079833984, 34.43024826049805]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 4.0, 9.0, 10.0, 12.0, 14.0, 15.0, 16.0, 33.0, 37.0, 56.0, 49.0, 39.0, 56.0, 58.0, 58.0, 72.0, 49.0, 58.0, 62.0, 56.0, 44.0, 44.0, 23.0, 31.0, 21.0, 17.0, 23.0, 5.0, 11.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.875, -97.03515625, -94.1953125, -91.35546875, -88.515625, -85.67578125, -82.8359375, -79.99609375, -77.15625, -74.31640625, -71.4765625, -68.63671875, -65.796875, -62.95703125, -60.1171875, -57.27734375, -54.4375, -51.59765625, -48.7578125, -45.91796875, -43.078125, -40.23828125, -37.3984375, -34.55859375, -31.71875, -28.87890625, -26.0390625, -23.19921875, -20.359375, -17.51953125, -14.6796875, -11.83984375, -9.0, -6.16015625, -3.3203125, -0.48046875, 2.359375, 5.19921875, 8.0390625, 10.87890625, 13.71875, 16.55859375, 19.3984375, 22.23828125, 25.078125, 27.91796875, 30.7578125, 33.59765625, 36.4375, 39.27734375, 42.1171875, 44.95703125, 47.796875, 50.63671875, 53.4765625, 56.31640625, 59.15625, 61.99609375, 64.8359375, 67.67578125, 70.515625, 73.35546875, 76.1953125, 79.03515625, 81.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 15.0, 15.0, 31.0, 26.0, 47.0, 87.0, 137.0, 242.0, 455.0, 842.0, 1479.0, 2987.0, 5524.0, 11176.0, 22003.0, 45367.0, 92581.0, 179907.0, 264209.0, 205143.0, 109545.0, 53621.0, 25969.0, 13184.0, 6641.0, 3370.0, 1787.0, 960.0, 501.0, 261.0, 167.0, 100.0, 67.0, 35.0, 18.0, 16.0, 12.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.058837890625, -3.92626953125, -3.793701171875, -3.6611328125, -3.528564453125, -3.39599609375, -3.263427734375, -3.130859375, -2.998291015625, -2.86572265625, -2.733154296875, -2.6005859375, -2.468017578125, -2.33544921875, -2.202880859375, -2.0703125, -1.937744140625, -1.80517578125, -1.672607421875, -1.5400390625, -1.407470703125, -1.27490234375, -1.142333984375, -1.009765625, -0.877197265625, -0.74462890625, -0.612060546875, -0.4794921875, -0.346923828125, -0.21435546875, -0.081787109375, 0.05078125, 0.183349609375, 0.31591796875, 0.448486328125, 0.5810546875, 0.713623046875, 0.84619140625, 0.978759765625, 1.111328125, 1.243896484375, 1.37646484375, 1.509033203125, 1.6416015625, 1.774169921875, 1.90673828125, 2.039306640625, 2.171875, 2.304443359375, 2.43701171875, 2.569580078125, 2.7021484375, 2.834716796875, 2.96728515625, 3.099853515625, 3.232421875, 3.364990234375, 3.49755859375, 3.630126953125, 3.7626953125, 3.895263671875, 4.02783203125, 4.160400390625, 4.29296875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 10.0, 12.0, 8.0, 16.0, 13.0, 21.0, 15.0, 17.0, 25.0, 22.0, 27.0, 22.0, 25.0, 27.0, 25.0, 36.0, 32.0, 38.0, 56.0, 1057.0, 36.0, 47.0, 40.0, 30.0, 43.0, 37.0, 31.0, 36.0, 20.0, 25.0, 21.0, 23.0, 22.0, 22.0, 16.0, 13.0, 14.0, 8.0, 6.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.96875, -35.81201171875, -34.6552734375, -33.49853515625, -32.341796875, -31.18505859375, -30.0283203125, -28.87158203125, -27.71484375, -26.55810546875, -25.4013671875, -24.24462890625, -23.087890625, -21.93115234375, -20.7744140625, -19.61767578125, -18.4609375, -17.30419921875, -16.1474609375, -14.99072265625, -13.833984375, -12.67724609375, -11.5205078125, -10.36376953125, -9.20703125, -8.05029296875, -6.8935546875, -5.73681640625, -4.580078125, -3.42333984375, -2.2666015625, -1.10986328125, 0.046875, 1.20361328125, 2.3603515625, 3.51708984375, 4.673828125, 5.83056640625, 6.9873046875, 8.14404296875, 9.30078125, 10.45751953125, 11.6142578125, 12.77099609375, 13.927734375, 15.08447265625, 16.2412109375, 17.39794921875, 18.5546875, 19.71142578125, 20.8681640625, 22.02490234375, 23.181640625, 24.33837890625, 25.4951171875, 26.65185546875, 27.80859375, 28.96533203125, 30.1220703125, 31.27880859375, 32.435546875, 33.59228515625, 34.7490234375, 35.90576171875, 37.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 11.0, 11.0, 23.0, 27.0, 41.0, 70.0, 120.0, 176.0, 252.0, 383.0, 556.0, 872.0, 1372.0, 2050.0, 3208.0, 4842.0, 7794.0, 11937.0, 18385.0, 28566.0, 44112.0, 67451.0, 100047.0, 152004.0, 1169062.0, 173046.0, 106157.0, 72025.0, 46769.0, 30277.0, 19646.0, 12667.0, 8073.0, 5242.0, 3449.0, 2205.0, 1487.0, 900.0, 644.0, 402.0, 265.0, 176.0, 117.0, 73.0, 47.0, 28.0, 21.0, 19.0, 13.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.375, -2.299774169921875, -2.22454833984375, -2.149322509765625, -2.0740966796875, -1.998870849609375, -1.92364501953125, -1.848419189453125, -1.773193359375, -1.697967529296875, -1.62274169921875, -1.547515869140625, -1.4722900390625, -1.397064208984375, -1.32183837890625, -1.246612548828125, -1.17138671875, -1.096160888671875, -1.02093505859375, -0.945709228515625, -0.8704833984375, -0.795257568359375, -0.72003173828125, -0.644805908203125, -0.569580078125, -0.494354248046875, -0.41912841796875, -0.343902587890625, -0.2686767578125, -0.193450927734375, -0.11822509765625, -0.042999267578125, 0.0322265625, 0.107452392578125, 0.18267822265625, 0.257904052734375, 0.3331298828125, 0.408355712890625, 0.48358154296875, 0.558807373046875, 0.634033203125, 0.709259033203125, 0.78448486328125, 0.859710693359375, 0.9349365234375, 1.010162353515625, 1.08538818359375, 1.160614013671875, 1.23583984375, 1.311065673828125, 1.38629150390625, 1.461517333984375, 1.5367431640625, 1.611968994140625, 1.68719482421875, 1.762420654296875, 1.837646484375, 1.912872314453125, 1.98809814453125, 2.063323974609375, 2.1385498046875, 2.213775634765625, 2.28900146484375, 2.364227294921875, 2.439453125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 3.0, 4.0, 13.0, 14.0, 11.0, 13.0, 22.0, 28.0, 22.0, 24.0, 37.0, 51.0, 45.0, 48.0, 50.0, 72.0, 58.0, 70.0, 58.0, 55.0, 39.0, 40.0, 43.0, 20.0, 17.0, 18.0, 21.0, 18.0, 15.0, 11.0, 12.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05255126953125, -0.05106306076049805, -0.049574851989746094, -0.04808664321899414, -0.04659843444824219, -0.045110225677490234, -0.04362201690673828, -0.04213380813598633, -0.040645599365234375, -0.03915739059448242, -0.03766918182373047, -0.036180973052978516, -0.03469276428222656, -0.03320455551147461, -0.031716346740722656, -0.030228137969970703, -0.02873992919921875, -0.027251720428466797, -0.025763511657714844, -0.02427530288696289, -0.022787094116210938, -0.021298885345458984, -0.01981067657470703, -0.018322467803955078, -0.016834259033203125, -0.015346050262451172, -0.013857841491699219, -0.012369632720947266, -0.010881423950195312, -0.00939321517944336, -0.007905006408691406, -0.006416797637939453, -0.0049285888671875, -0.003440380096435547, -0.0019521713256835938, -0.0004639625549316406, 0.0010242462158203125, 0.0025124549865722656, 0.004000663757324219, 0.005488872528076172, 0.006977081298828125, 0.008465290069580078, 0.009953498840332031, 0.011441707611083984, 0.012929916381835938, 0.01441812515258789, 0.015906333923339844, 0.017394542694091797, 0.01888275146484375, 0.020370960235595703, 0.021859169006347656, 0.02334737777709961, 0.024835586547851562, 0.026323795318603516, 0.02781200408935547, 0.029300212860107422, 0.030788421630859375, 0.03227663040161133, 0.03376483917236328, 0.035253047943115234, 0.03674125671386719, 0.03822946548461914, 0.039717674255371094, 0.04120588302612305, 0.042694091796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 4.0, 21.0, 30.0, 25.0, 40.0, 85.0, 129.0, 250.0, 363.0, 706.0, 1246.0, 2569.0, 5693.0, 12438.0, 29710.0, 74621.0, 187221.0, 331854.0, 235491.0, 97657.0, 38686.0, 16041.0, 6940.0, 3253.0, 1564.0, 797.0, 458.0, 251.0, 161.0, 79.0, 60.0, 31.0, 29.0, 17.0, 13.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2249755859375, -0.21738624572753906, -0.20979690551757812, -0.2022075653076172, -0.19461822509765625, -0.1870288848876953, -0.17943954467773438, -0.17185020446777344, -0.1642608642578125, -0.15667152404785156, -0.14908218383789062, -0.1414928436279297, -0.13390350341796875, -0.1263141632080078, -0.11872482299804688, -0.11113548278808594, -0.103546142578125, -0.09595680236816406, -0.08836746215820312, -0.08077812194824219, -0.07318878173828125, -0.06559944152832031, -0.058010101318359375, -0.05042076110839844, -0.0428314208984375, -0.03524208068847656, -0.027652740478515625, -0.020063400268554688, -0.01247406005859375, -0.0048847198486328125, 0.002704620361328125, 0.010293960571289062, 0.01788330078125, 0.025472640991210938, 0.033061981201171875, 0.04065132141113281, 0.04824066162109375, 0.05583000183105469, 0.06341934204101562, 0.07100868225097656, 0.0785980224609375, 0.08618736267089844, 0.09377670288085938, 0.10136604309082031, 0.10895538330078125, 0.11654472351074219, 0.12413406372070312, 0.13172340393066406, 0.139312744140625, 0.14690208435058594, 0.15449142456054688, 0.1620807647705078, 0.16967010498046875, 0.1772594451904297, 0.18484878540039062, 0.19243812561035156, 0.2000274658203125, 0.20761680603027344, 0.21520614624023438, 0.2227954864501953, 0.23038482666015625, 0.2379741668701172, 0.24556350708007812, 0.25315284729003906, 0.2607421875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 11.0, 22.0, 37.0, 51.0, 66.0, 108.0, 137.0, 127.0, 118.0, 98.0, 79.0, 53.0, 32.0, 18.0, 15.0, 11.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.24691200256347656, -0.24205948412418365, -0.23720695078372955, -0.23235443234443665, -0.22750189900398254, -0.22264938056468964, -0.21779684722423553, -0.21294432878494263, -0.20809179544448853, -0.20323927700519562, -0.19838674366474152, -0.1935342252254486, -0.1886816918849945, -0.1838291734457016, -0.1789766401052475, -0.1741241216659546, -0.16927160322666168, -0.16441908478736877, -0.15956655144691467, -0.15471403300762177, -0.14986149966716766, -0.14500898122787476, -0.14015644788742065, -0.13530392944812775, -0.13045141100883484, -0.12559889256954193, -0.12074635922908783, -0.11589383333921432, -0.11104130744934082, -0.10618878901004791, -0.10133626312017441, -0.0964837372303009, -0.0916312113404274, -0.0867786854505539, -0.08192615956068039, -0.07707363367080688, -0.07222111523151398, -0.06736858189105988, -0.06251606345176697, -0.05766353756189346, -0.05281101167201996, -0.047958485782146454, -0.04310595989227295, -0.03825343772768974, -0.03340091183781624, -0.028548385947942734, -0.02369586192071438, -0.018843337893486023, -0.013990812003612518, -0.009138287045061588, -0.004285762086510658, 0.0005667628720402718, 0.005419287830591202, 0.010271813720464706, 0.015124337747693062, 0.019976861774921417, 0.024829387664794922, 0.029681913554668427, 0.03453443944454193, 0.03938696160912514, 0.04423948749899864, 0.04909201338887215, 0.05394453555345535, 0.05879706144332886, 0.06364958733320236]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 8.0, 7.0, 8.0, 18.0, 11.0, 22.0, 28.0, 20.0, 28.0, 30.0, 21.0, 42.0, 39.0, 31.0, 48.0, 46.0, 35.0, 41.0, 36.0, 25.0, 35.0, 41.0, 46.0, 39.0, 32.0, 29.0, 22.0, 31.0, 27.0, 25.0, 25.0, 12.0, 9.0, 18.0, 10.0, 13.0, 7.0, 5.0, 6.0, 10.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0], "bins": [-0.056616365909576416, -0.055010199546813965, -0.053404029458761215, -0.051797859370708466, -0.050191693007946014, -0.04858552664518356, -0.046979356557130814, -0.045373186469078064, -0.04376702010631561, -0.04216085374355316, -0.04055468365550041, -0.03894851356744766, -0.03734234720468521, -0.03573618084192276, -0.03413001075387001, -0.03252384066581726, -0.03091767430305481, -0.02931150607764721, -0.02770533785223961, -0.02609916962683201, -0.024493001401424408, -0.022886833176016808, -0.021280664950609207, -0.019674496725201607, -0.018068328499794006, -0.016462160274386406, -0.014855992048978806, -0.013249823823571205, -0.011643655598163605, -0.010037487372756004, -0.008431319147348404, -0.0068251509219408035, -0.005218982696533203, -0.0036128144711256027, -0.0020066462457180023, -0.0004004780203104019, 0.0012056902050971985, 0.002811858430504799, 0.004418026655912399, 0.00602419488132, 0.0076303631067276, 0.0092365313321352, 0.010842699557542801, 0.012448867782950401, 0.014055036008358002, 0.015661204233765602, 0.017267372459173203, 0.018873540684580803, 0.020479708909988403, 0.022085877135396004, 0.023692045360803604, 0.025298213586211205, 0.026904381811618805, 0.028510550037026405, 0.030116718262434006, 0.031722888350486755, 0.03332905471324921, 0.03493522107601166, 0.03654139116406441, 0.03814756125211716, 0.03975372761487961, 0.04135989397764206, 0.04296606406569481, 0.04457223415374756, 0.04617840051651001]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 12.0, 17.0, 15.0, 27.0, 23.0, 44.0, 49.0, 53.0, 54.0, 63.0, 72.0, 86.0, 65.0, 62.0, 46.0, 60.0, 56.0, 48.0, 37.0, 22.0, 18.0, 22.0, 10.0, 9.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.0, -102.84765625, -99.6953125, -96.54296875, -93.390625, -90.23828125, -87.0859375, -83.93359375, -80.78125, -77.62890625, -74.4765625, -71.32421875, -68.171875, -65.01953125, -61.8671875, -58.71484375, -55.5625, -52.41015625, -49.2578125, -46.10546875, -42.953125, -39.80078125, -36.6484375, -33.49609375, -30.34375, -27.19140625, -24.0390625, -20.88671875, -17.734375, -14.58203125, -11.4296875, -8.27734375, -5.125, -1.97265625, 1.1796875, 4.33203125, 7.484375, 10.63671875, 13.7890625, 16.94140625, 20.09375, 23.24609375, 26.3984375, 29.55078125, 32.703125, 35.85546875, 39.0078125, 42.16015625, 45.3125, 48.46484375, 51.6171875, 54.76953125, 57.921875, 61.07421875, 64.2265625, 67.37890625, 70.53125, 73.68359375, 76.8359375, 79.98828125, 83.140625, 86.29296875, 89.4453125, 92.59765625, 95.75]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 11.0, 15.0, 19.0, 25.0, 59.0, 74.0, 100.0, 256.0, 438.0, 1129.0, 9639.0, 553401.0, 473367.0, 7973.0, 1015.0, 440.0, 223.0, 129.0, 76.0, 44.0, 29.0, 26.0, 20.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.734375, -22.065185546875, -21.39599609375, -20.726806640625, -20.0576171875, -19.388427734375, -18.71923828125, -18.050048828125, -17.380859375, -16.711669921875, -16.04248046875, -15.373291015625, -14.7041015625, -14.034912109375, -13.36572265625, -12.696533203125, -12.02734375, -11.358154296875, -10.68896484375, -10.019775390625, -9.3505859375, -8.681396484375, -8.01220703125, -7.343017578125, -6.673828125, -6.004638671875, -5.33544921875, -4.666259765625, -3.9970703125, -3.327880859375, -2.65869140625, -1.989501953125, -1.3203125, -0.651123046875, 0.01806640625, 0.687255859375, 1.3564453125, 2.025634765625, 2.69482421875, 3.364013671875, 4.033203125, 4.702392578125, 5.37158203125, 6.040771484375, 6.7099609375, 7.379150390625, 8.04833984375, 8.717529296875, 9.38671875, 10.055908203125, 10.72509765625, 11.394287109375, 12.0634765625, 12.732666015625, 13.40185546875, 14.071044921875, 14.740234375, 15.409423828125, 16.07861328125, 16.747802734375, 17.4169921875, 18.086181640625, 18.75537109375, 19.424560546875, 20.09375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 9.0, 9.0, 13.0, 19.0, 24.0, 31.0, 46.0, 54.0, 58.0, 86.0, 83.0, 115.0, 2104.0, 82.0, 60.0, 75.0, 43.0, 50.0, 26.0, 18.0, 12.0, 11.0, 5.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.5, -138.73828125, -133.9765625, -129.21484375, -124.453125, -119.69140625, -114.9296875, -110.16796875, -105.40625, -100.64453125, -95.8828125, -91.12109375, -86.359375, -81.59765625, -76.8359375, -72.07421875, -67.3125, -62.55078125, -57.7890625, -53.02734375, -48.265625, -43.50390625, -38.7421875, -33.98046875, -29.21875, -24.45703125, -19.6953125, -14.93359375, -10.171875, -5.41015625, -0.6484375, 4.11328125, 8.875, 13.63671875, 18.3984375, 23.16015625, 27.921875, 32.68359375, 37.4453125, 42.20703125, 46.96875, 51.73046875, 56.4921875, 61.25390625, 66.015625, 70.77734375, 75.5390625, 80.30078125, 85.0625, 89.82421875, 94.5859375, 99.34765625, 104.109375, 108.87109375, 113.6328125, 118.39453125, 123.15625, 127.91796875, 132.6796875, 137.44140625, 142.203125, 146.96484375, 151.7265625, 156.48828125, 161.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 7.0, 2.0, 9.0, 16.0, 12.0, 38.0, 46.0, 82.0, 130.0, 243.0, 487.0, 975.0, 2293.0, 7618.0, 66202.0, 2692635.0, 340130.0, 27013.0, 4491.0, 1589.0, 795.0, 392.0, 191.0, 122.0, 68.0, 36.0, 31.0, 23.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.890625, -9.5697021484375, -9.248779296875, -8.9278564453125, -8.60693359375, -8.2860107421875, -7.965087890625, -7.6441650390625, -7.3232421875, -7.0023193359375, -6.681396484375, -6.3604736328125, -6.03955078125, -5.7186279296875, -5.397705078125, -5.0767822265625, -4.755859375, -4.4349365234375, -4.114013671875, -3.7930908203125, -3.47216796875, -3.1512451171875, -2.830322265625, -2.5093994140625, -2.1884765625, -1.8675537109375, -1.546630859375, -1.2257080078125, -0.90478515625, -0.5838623046875, -0.262939453125, 0.0579833984375, 0.37890625, 0.6998291015625, 1.020751953125, 1.3416748046875, 1.66259765625, 1.9835205078125, 2.304443359375, 2.6253662109375, 2.9462890625, 3.2672119140625, 3.588134765625, 3.9090576171875, 4.22998046875, 4.5509033203125, 4.871826171875, 5.1927490234375, 5.513671875, 5.8345947265625, 6.155517578125, 6.4764404296875, 6.79736328125, 7.1182861328125, 7.439208984375, 7.7601318359375, 8.0810546875, 8.4019775390625, 8.722900390625, 9.0438232421875, 9.36474609375, 9.6856689453125, 10.006591796875, 10.3275146484375, 10.6484375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 14.0, 13.0, 17.0, 24.0, 54.0, 64.0, 103.0, 109.0, 124.0, 114.0, 103.0, 55.0, 51.0, 38.0, 21.0, 18.0, 9.0, 7.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-100.47003936767578, -97.3014144897461, -94.13278198242188, -90.96415710449219, -87.7955322265625, -84.62690734863281, -81.4582748413086, -78.2896499633789, -75.12102508544922, -71.95240020751953, -68.78376770019531, -65.61514282226562, -62.44651794433594, -59.277889251708984, -56.10926055908203, -52.940635681152344, -49.77200698852539, -46.60337829589844, -43.43475341796875, -40.2661247253418, -37.09749984741211, -33.928871154785156, -30.760244369506836, -27.591617584228516, -24.422990798950195, -21.254364013671875, -18.085737228393555, -14.917109489440918, -11.748482704162598, -8.579855918884277, -5.411228179931641, -2.2426013946533203, 0.926025390625, 4.09465217590332, 7.263279438018799, 10.431906700134277, 13.600533485412598, 16.769161224365234, 19.937788009643555, 23.106414794921875, 26.275041580200195, 29.443668365478516, 32.61229705810547, 35.780921936035156, 38.94955062866211, 42.1181755065918, 45.28680419921875, 48.45542907714844, 51.62405776977539, 54.792686462402344, 57.96131134033203, 61.129940032958984, 64.29856872558594, 67.46719360351562, 70.63581848144531, 73.804443359375, 76.97307586669922, 80.1417007446289, 83.31033325195312, 86.47895812988281, 89.6475830078125, 92.81620788574219, 95.9848403930664, 99.1534652709961, 102.32209014892578]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 4.0, 5.0, 9.0, 6.0, 9.0, 9.0, 16.0, 11.0, 13.0, 19.0, 18.0, 22.0, 17.0, 30.0, 35.0, 26.0, 37.0, 41.0, 40.0, 39.0, 38.0, 37.0, 42.0, 26.0, 42.0, 39.0, 34.0, 39.0, 32.0, 24.0, 31.0, 24.0, 27.0, 23.0, 21.0, 21.0, 18.0, 11.0, 16.0, 10.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.87315368652344, -113.34082794189453, -109.8084945678711, -106.27616882324219, -102.74384307861328, -99.21151733398438, -95.67918395996094, -92.14685821533203, -88.61453247070312, -85.08220672607422, -81.54987335205078, -78.01754760742188, -74.48522186279297, -70.95289611816406, -67.42056274414062, -63.88823699951172, -60.35590744018555, -56.823577880859375, -53.29125213623047, -49.7589225769043, -46.22659683227539, -42.69426727294922, -39.16194152832031, -35.62961196899414, -32.09728240966797, -28.56495475769043, -25.03262710571289, -21.50029754638672, -17.967971801757812, -14.43564224243164, -10.903314590454102, -7.3709869384765625, -3.8386611938476562, -0.3063333034515381, 3.22599458694458, 6.758322715759277, 10.290650367736816, 13.822978973388672, 17.35530662536621, 20.88763427734375, 24.41996192932129, 27.952289581298828, 31.484617233276367, 35.016944885253906, 38.54927444458008, 42.08160400390625, 45.613929748535156, 49.14625549316406, 52.678585052490234, 56.210914611816406, 59.74324035644531, 63.275569915771484, 66.80789947509766, 70.34022521972656, 73.87255096435547, 77.40487670898438, 80.93721008300781, 84.46953582763672, 88.00186920166016, 91.53419494628906, 95.06652069091797, 98.59884643554688, 102.13117980957031, 105.66350555419922, 109.19583129882812]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 10.0, 12.0, 13.0, 26.0, 53.0, 47.0, 65.0, 121.0, 230.0, 433.0, 948.0, 2844.0, 11634.0, 1019818.0, 8548.0, 2098.0, 744.0, 362.0, 212.0, 97.0, 97.0, 55.0, 33.0, 19.0, 17.0, 10.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4934310913086, -65.82247924804688, -64.15152740478516, -62.48057174682617, -60.80961608886719, -59.13866424560547, -57.46771240234375, -55.796756744384766, -54.12580108642578, -52.45484924316406, -50.78389358520508, -49.11294174194336, -47.441986083984375, -45.771034240722656, -44.10008239746094, -42.42912673950195, -40.758174896240234, -39.087223052978516, -37.41626739501953, -35.74531555175781, -34.07435989379883, -32.40340805053711, -30.732454299926758, -29.061500549316406, -27.390546798706055, -25.719593048095703, -24.04863929748535, -22.377685546875, -20.70673370361328, -19.035778045654297, -17.364826202392578, -15.693872451782227, -14.02292251586914, -12.351968765258789, -10.681015014648438, -9.010062217712402, -7.339108467102051, -5.668154716491699, -3.997201919555664, -2.3262481689453125, -0.6552944183349609, 1.0156590938568115, 2.686612606048584, 4.357565879821777, 6.028519630432129, 7.6994733810424805, 9.370426177978516, 11.041379928588867, 12.712333679199219, 14.38328742980957, 16.054241180419922, 17.72519302368164, 19.396148681640625, 21.067100524902344, 22.738054275512695, 24.409008026123047, 26.0799617767334, 27.75091552734375, 29.4218692779541, 31.092823028564453, 32.76377487182617, 34.434730529785156, 36.105682373046875, 37.776634216308594, 39.44758987426758]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 11.0, 9.0, 19.0, 81.0, 8189.0, 51454612.0, 183.0, 29.0, 16.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2258.0, -2171.503662109375, -2085.00732421875, -1998.5108642578125, -1912.0145263671875, -1825.51806640625, -1739.021728515625, -1652.525390625, -1566.029052734375, -1479.53271484375, -1393.0362548828125, -1306.5399169921875, -1220.0435791015625, -1133.547119140625, -1047.05078125, -960.554443359375, -874.0579833984375, -787.5615844726562, -701.0652465820312, -614.56884765625, -528.072509765625, -441.57611083984375, -355.0797119140625, -268.5833740234375, -182.08697509765625, -95.5905990600586, -9.094223022460938, 77.40216064453125, 163.89852905273438, 250.3948974609375, 336.89129638671875, 423.38763427734375, 509.884033203125, 596.3804321289062, 682.8767700195312, 769.3731689453125, 855.8695068359375, 942.3659057617188, 1028.8623046875, 1115.358642578125, 1201.85498046875, 1288.351318359375, 1374.8477783203125, 1461.3441162109375, 1547.8404541015625, 1634.3369140625, 1720.833251953125, 1807.32958984375, 1893.8260498046875, 1980.3223876953125, 2066.81884765625, 2153.315185546875, 2239.8115234375, 2326.307861328125, 2412.80419921875, 2499.30078125, 2585.797119140625, 2672.29345703125, 2758.789794921875, 2845.2861328125, 2931.78271484375, 3018.279052734375, 3104.775390625, 3191.271728515625, 3277.76806640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 9.0, 12.0, 10.0, 24.0, 28.0, 45.0, 66.0, 77.0, 143.0, 162.0, 261.0, 389.0, 610.0, 854.0, 1289.0, 1900.0, 2819.0, 4301.0, 6645.0, 10567.0, 16863.0, 27191.0, 44843.0, 75720.0, 130720.0, 234125.0, 453435.0, 1231171.0, 2419411.0, 812010.0, 353744.0, 189844.0, 108082.0, 63337.0, 37621.0, 23009.0, 14193.0, 8831.0, 5825.0, 3735.0, 2517.0, 1548.0, 1073.0, 775.0, 476.0, 367.0, 234.0, 160.0, 104.0, 89.0, 64.0, 38.0, 25.0, 19.0, 17.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.7578125, -9.4462890625, -9.134765625, -8.8232421875, -8.51171875, -8.2001953125, -7.888671875, -7.5771484375, -7.265625, -6.9541015625, -6.642578125, -6.3310546875, -6.01953125, -5.7080078125, -5.396484375, -5.0849609375, -4.7734375, -4.4619140625, -4.150390625, -3.8388671875, -3.52734375, -3.2158203125, -2.904296875, -2.5927734375, -2.28125, -1.9697265625, -1.658203125, -1.3466796875, -1.03515625, -0.7236328125, -0.412109375, -0.1005859375, 0.2109375, 0.5224609375, 0.833984375, 1.1455078125, 1.45703125, 1.7685546875, 2.080078125, 2.3916015625, 2.703125, 3.0146484375, 3.326171875, 3.6376953125, 3.94921875, 4.2607421875, 4.572265625, 4.8837890625, 5.1953125, 5.5068359375, 5.818359375, 6.1298828125, 6.44140625, 6.7529296875, 7.064453125, 7.3759765625, 7.6875, 7.9990234375, 8.310546875, 8.6220703125, 8.93359375, 9.2451171875, 9.556640625, 9.8681640625, 10.1796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 1.0, 3.0, 6.0, 5.0, 5.0, 8.0, 11.0, 9.0, 17.0, 21.0, 20.0, 25.0, 23.0, 27.0, 26.0, 35.0, 40.0, 41.0, 40.0, 51.0, 150.0, 402.0, 442.0, 166.0, 55.0, 41.0, 44.0, 31.0, 38.0, 28.0, 25.0, 29.0, 23.0, 21.0, 21.0, 18.0, 14.0, 11.0, 8.0, 10.0, 8.0, 5.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.3125, -26.3740234375, -25.435546875, -24.4970703125, -23.55859375, -22.6201171875, -21.681640625, -20.7431640625, -19.8046875, -18.8662109375, -17.927734375, -16.9892578125, -16.05078125, -15.1123046875, -14.173828125, -13.2353515625, -12.296875, -11.3583984375, -10.419921875, -9.4814453125, -8.54296875, -7.6044921875, -6.666015625, -5.7275390625, -4.7890625, -3.8505859375, -2.912109375, -1.9736328125, -1.03515625, -0.0966796875, 0.841796875, 1.7802734375, 2.71875, 3.6572265625, 4.595703125, 5.5341796875, 6.47265625, 7.4111328125, 8.349609375, 9.2880859375, 10.2265625, 11.1650390625, 12.103515625, 13.0419921875, 13.98046875, 14.9189453125, 15.857421875, 16.7958984375, 17.734375, 18.6728515625, 19.611328125, 20.5498046875, 21.48828125, 22.4267578125, 23.365234375, 24.3037109375, 25.2421875, 26.1806640625, 27.119140625, 28.0576171875, 28.99609375, 29.9345703125, 30.873046875, 31.8115234375, 32.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 11.0, 26.0, 45.0, 52.0, 99.0, 173.0, 220.0, 370.0, 526.0, 821.0, 1367.0, 2050.0, 3209.0, 4812.0, 7786.0, 11952.0, 18815.0, 29463.0, 44856.0, 68782.0, 105294.0, 154164.0, 222443.0, 325382.0, 669295.0, 2178313.0, 1216517.0, 418009.0, 261377.0, 183096.0, 124692.0, 83023.0, 54577.0, 35507.0, 22592.0, 14680.0, 9669.0, 6126.0, 3981.0, 2526.0, 1712.0, 1109.0, 741.0, 437.0, 273.0, 185.0, 94.0, 53.0, 37.0, 36.0, 17.0, 13.0, 11.0, 8.0, 6.0, 0.0, 1.0], "bins": [-4.85546875, -4.70709228515625, -4.5587158203125, -4.41033935546875, -4.261962890625, -4.11358642578125, -3.9652099609375, -3.81683349609375, -3.66845703125, -3.52008056640625, -3.3717041015625, -3.22332763671875, -3.074951171875, -2.92657470703125, -2.7781982421875, -2.62982177734375, -2.4814453125, -2.33306884765625, -2.1846923828125, -2.03631591796875, -1.887939453125, -1.73956298828125, -1.5911865234375, -1.44281005859375, -1.29443359375, -1.14605712890625, -0.9976806640625, -0.84930419921875, -0.700927734375, -0.55255126953125, -0.4041748046875, -0.25579833984375, -0.107421875, 0.04095458984375, 0.1893310546875, 0.33770751953125, 0.486083984375, 0.63446044921875, 0.7828369140625, 0.93121337890625, 1.07958984375, 1.22796630859375, 1.3763427734375, 1.52471923828125, 1.673095703125, 1.82147216796875, 1.9698486328125, 2.11822509765625, 2.2666015625, 2.41497802734375, 2.5633544921875, 2.71173095703125, 2.860107421875, 3.00848388671875, 3.1568603515625, 3.30523681640625, 3.45361328125, 3.60198974609375, 3.7503662109375, 3.89874267578125, 4.047119140625, 4.19549560546875, 4.3438720703125, 4.49224853515625, 4.640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 12.0, 9.0, 9.0, 18.0, 12.0, 12.0, 16.0, 21.0, 21.0, 29.0, 31.0, 26.0, 26.0, 39.0, 36.0, 49.0, 33.0, 92.0, 288.0, 552.0, 203.0, 72.0, 39.0, 41.0, 40.0, 33.0, 25.0, 33.0, 22.0, 27.0, 20.0, 18.0, 15.0, 14.0, 13.0, 12.0, 8.0, 11.0, 5.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-45.5625, -44.20458984375, -42.8466796875, -41.48876953125, -40.130859375, -38.77294921875, -37.4150390625, -36.05712890625, -34.69921875, -33.34130859375, -31.9833984375, -30.62548828125, -29.267578125, -27.90966796875, -26.5517578125, -25.19384765625, -23.8359375, -22.47802734375, -21.1201171875, -19.76220703125, -18.404296875, -17.04638671875, -15.6884765625, -14.33056640625, -12.97265625, -11.61474609375, -10.2568359375, -8.89892578125, -7.541015625, -6.18310546875, -4.8251953125, -3.46728515625, -2.109375, -0.75146484375, 0.6064453125, 1.96435546875, 3.322265625, 4.68017578125, 6.0380859375, 7.39599609375, 8.75390625, 10.11181640625, 11.4697265625, 12.82763671875, 14.185546875, 15.54345703125, 16.9013671875, 18.25927734375, 19.6171875, 20.97509765625, 22.3330078125, 23.69091796875, 25.048828125, 26.40673828125, 27.7646484375, 29.12255859375, 30.48046875, 31.83837890625, 33.1962890625, 34.55419921875, 35.912109375, 37.27001953125, 38.6279296875, 39.98583984375, 41.34375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 9.0, 8.0, 6.0, 11.0, 7.0, 19.0, 21.0, 38.0, 51.0, 87.0, 129.0, 185.0, 240.0, 328.0, 410.0, 583.0, 983.0, 1271.0, 1757.0, 2498.0, 3671.0, 6245.0, 11723.0, 24628.0, 54651.0, 125034.0, 5649571.0, 245535.0, 83890.0, 36847.0, 17074.0, 8647.0, 4952.0, 3040.0, 2155.0, 1547.0, 1007.0, 715.0, 521.0, 418.0, 298.0, 171.0, 125.0, 109.0, 52.0, 51.0, 33.0, 30.0, 21.0, 10.0, 13.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.078125, -26.197998046875, -25.31787109375, -24.437744140625, -23.5576171875, -22.677490234375, -21.79736328125, -20.917236328125, -20.037109375, -19.156982421875, -18.27685546875, -17.396728515625, -16.5166015625, -15.636474609375, -14.75634765625, -13.876220703125, -12.99609375, -12.115966796875, -11.23583984375, -10.355712890625, -9.4755859375, -8.595458984375, -7.71533203125, -6.835205078125, -5.955078125, -5.074951171875, -4.19482421875, -3.314697265625, -2.4345703125, -1.554443359375, -0.67431640625, 0.205810546875, 1.0859375, 1.966064453125, 2.84619140625, 3.726318359375, 4.6064453125, 5.486572265625, 6.36669921875, 7.246826171875, 8.126953125, 9.007080078125, 9.88720703125, 10.767333984375, 11.6474609375, 12.527587890625, 13.40771484375, 14.287841796875, 15.16796875, 16.048095703125, 16.92822265625, 17.808349609375, 18.6884765625, 19.568603515625, 20.44873046875, 21.328857421875, 22.208984375, 23.089111328125, 23.96923828125, 24.849365234375, 25.7294921875, 26.609619140625, 27.48974609375, 28.369873046875, 29.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 7.0, 8.0, 4.0, 6.0, 11.0, 12.0, 6.0, 17.0, 13.0, 20.0, 16.0, 22.0, 11.0, 24.0, 29.0, 20.0, 20.0, 28.0, 25.0, 35.0, 42.0, 35.0, 77.0, 604.0, 449.0, 47.0, 29.0, 41.0, 29.0, 32.0, 44.0, 28.0, 28.0, 30.0, 26.0, 23.0, 11.0, 16.0, 19.0, 10.0, 10.0, 11.0, 14.0, 9.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-87.3125, -84.7490234375, -82.185546875, -79.6220703125, -77.05859375, -74.4951171875, -71.931640625, -69.3681640625, -66.8046875, -64.2412109375, -61.677734375, -59.1142578125, -56.55078125, -53.9873046875, -51.423828125, -48.8603515625, -46.296875, -43.7333984375, -41.169921875, -38.6064453125, -36.04296875, -33.4794921875, -30.916015625, -28.3525390625, -25.7890625, -23.2255859375, -20.662109375, -18.0986328125, -15.53515625, -12.9716796875, -10.408203125, -7.8447265625, -5.28125, -2.7177734375, -0.154296875, 2.4091796875, 4.97265625, 7.5361328125, 10.099609375, 12.6630859375, 15.2265625, 17.7900390625, 20.353515625, 22.9169921875, 25.48046875, 28.0439453125, 30.607421875, 33.1708984375, 35.734375, 38.2978515625, 40.861328125, 43.4248046875, 45.98828125, 48.5517578125, 51.115234375, 53.6787109375, 56.2421875, 58.8056640625, 61.369140625, 63.9326171875, 66.49609375, 69.0595703125, 71.623046875, 74.1865234375, 76.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 7.0, 15.0, 43.0, 79.0, 641.0, 147.0, 21.0, 9.0, 8.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-565.7207641601562, -550.6943359375, -535.6678466796875, -520.6414184570312, -505.61492919921875, -490.5885009765625, -475.5620422363281, -460.53558349609375, -445.5091247558594, -430.482666015625, -415.4562072753906, -400.42974853515625, -385.4033203125, -370.3768310546875, -355.35040283203125, -340.3239440917969, -325.2974853515625, -310.2710266113281, -295.24456787109375, -280.2181091308594, -265.191650390625, -250.1652069091797, -235.13876342773438, -220.1123046875, -205.08584594726562, -190.05938720703125, -175.03292846679688, -160.00648498535156, -144.9800262451172, -129.9535675048828, -114.92711639404297, -99.90066528320312, -84.87423706054688, -69.8477783203125, -54.821327209472656, -39.79487228393555, -24.768417358398438, -9.741958618164062, 5.284492492675781, 20.310943603515625, 35.33740234375, 50.36385726928711, 65.39031219482422, 80.41676330566406, 95.44322204589844, 110.46968078613281, 125.49613189697266, 140.5225830078125, 155.54904174804688, 170.57550048828125, 185.60195922851562, 200.62840270996094, 215.6548614501953, 230.6813201904297, 245.707763671875, 260.7342224121094, 275.76068115234375, 290.7871398925781, 305.8135986328125, 320.8400573730469, 335.86651611328125, 350.8929443359375, 365.9194030761719, 380.94586181640625, 395.9723205566406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 7.0, 12.0, 8.0, 14.0, 12.0, 19.0, 29.0, 20.0, 132.0, 487.0, 130.0, 18.0, 15.0, 16.0, 17.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-713.6857299804688, -694.1215209960938, -674.5572509765625, -654.9930419921875, -635.4288330078125, -615.8646240234375, -596.3004150390625, -576.7361450195312, -557.1719360351562, -537.6077270507812, -518.04345703125, -498.479248046875, -478.9150390625, -459.350830078125, -439.7865905761719, -420.22235107421875, -400.65814208984375, -381.09393310546875, -361.5296936035156, -341.9654541015625, -322.4012451171875, -302.8370361328125, -283.2727966308594, -263.70855712890625, -244.14434814453125, -224.5801239013672, -205.01589965820312, -185.45167541503906, -165.887451171875, -146.32322692871094, -126.75900268554688, -107.19477844238281, -87.63055419921875, -68.06632995605469, -48.502105712890625, -28.937881469726562, -9.3736572265625, 10.190567016601562, 29.754791259765625, 49.31901550292969, 68.88323974609375, 88.44746398925781, 108.01168823242188, 127.57591247558594, 147.14013671875, 166.70436096191406, 186.26858520507812, 205.8328094482422, 225.39703369140625, 244.9612579345703, 264.5254821777344, 284.0897216796875, 303.6539306640625, 323.2181396484375, 342.7823791503906, 362.34661865234375, 381.91082763671875, 401.47503662109375, 421.0392761230469, 440.603515625, 460.167724609375, 479.73193359375, 499.2961730957031, 518.8604125976562, 538.4246215820312]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 20.0, 12.0, 34.0, 29.0, 49.0, 68.0, 108.0, 148.0, 193.0, 325.0, 510.0, 788.0, 1310.0, 2285.0, 4439.0, 9803.0, 27832.0, 293903.0, 3798314.0, 32518.0, 10595.0, 4679.0, 2406.0, 1387.0, 866.0, 540.0, 335.0, 223.0, 168.0, 113.0, 79.0, 43.0, 33.0, 23.0, 15.0, 16.0, 16.0, 8.0, 5.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.1875, -2.114776611328125, -2.04205322265625, -1.969329833984375, -1.8966064453125, -1.823883056640625, -1.75115966796875, -1.678436279296875, -1.605712890625, -1.532989501953125, -1.46026611328125, -1.387542724609375, -1.3148193359375, -1.242095947265625, -1.16937255859375, -1.096649169921875, -1.02392578125, -0.951202392578125, -0.87847900390625, -0.805755615234375, -0.7330322265625, -0.660308837890625, -0.58758544921875, -0.514862060546875, -0.442138671875, -0.369415283203125, -0.29669189453125, -0.223968505859375, -0.1512451171875, -0.078521728515625, -0.00579833984375, 0.066925048828125, 0.1396484375, 0.212371826171875, 0.28509521484375, 0.357818603515625, 0.4305419921875, 0.503265380859375, 0.57598876953125, 0.648712158203125, 0.721435546875, 0.794158935546875, 0.86688232421875, 0.939605712890625, 1.0123291015625, 1.085052490234375, 1.15777587890625, 1.230499267578125, 1.30322265625, 1.375946044921875, 1.44866943359375, 1.521392822265625, 1.5941162109375, 1.666839599609375, 1.73956298828125, 1.812286376953125, 1.885009765625, 1.957733154296875, 2.03045654296875, 2.103179931640625, 2.1759033203125, 2.248626708984375, 2.32135009765625, 2.394073486328125, 2.466796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 7.0, 11.0, 7.0, 5.0, 11.0, 8.0, 6.0, 13.0, 19.0, 27.0, 730.0, 39.0, 14.0, 11.0, 10.0, 12.0, 7.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2509765625, -1.2113037109375, -1.171630859375, -1.1319580078125, -1.09228515625, -1.0526123046875, -1.012939453125, -0.9732666015625, -0.93359375, -0.8939208984375, -0.854248046875, -0.8145751953125, -0.77490234375, -0.7352294921875, -0.695556640625, -0.6558837890625, -0.6162109375, -0.5765380859375, -0.536865234375, -0.4971923828125, -0.45751953125, -0.4178466796875, -0.378173828125, -0.3385009765625, -0.298828125, -0.2591552734375, -0.219482421875, -0.1798095703125, -0.14013671875, -0.1004638671875, -0.060791015625, -0.0211181640625, 0.0185546875, 0.0582275390625, 0.097900390625, 0.1375732421875, 0.17724609375, 0.2169189453125, 0.256591796875, 0.2962646484375, 0.3359375, 0.3756103515625, 0.415283203125, 0.4549560546875, 0.49462890625, 0.5343017578125, 0.573974609375, 0.6136474609375, 0.6533203125, 0.6929931640625, 0.732666015625, 0.7723388671875, 0.81201171875, 0.8516845703125, 0.891357421875, 0.9310302734375, 0.970703125, 1.0103759765625, 1.050048828125, 1.0897216796875, 1.12939453125, 1.1690673828125, 1.208740234375, 1.2484130859375, 1.2880859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 9.0, 16.0, 27.0, 43.0, 98.0, 211.0, 519.0, 1532.0, 5777.0, 31113.0, 659926.0, 3433163.0, 50692.0, 7974.0, 1939.0, 716.0, 243.0, 120.0, 62.0, 32.0, 18.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.55859375, -5.3956298828125, -5.232666015625, -5.0697021484375, -4.90673828125, -4.7437744140625, -4.580810546875, -4.4178466796875, -4.2548828125, -4.0919189453125, -3.928955078125, -3.7659912109375, -3.60302734375, -3.4400634765625, -3.277099609375, -3.1141357421875, -2.951171875, -2.7882080078125, -2.625244140625, -2.4622802734375, -2.29931640625, -2.1363525390625, -1.973388671875, -1.8104248046875, -1.6474609375, -1.4844970703125, -1.321533203125, -1.1585693359375, -0.99560546875, -0.8326416015625, -0.669677734375, -0.5067138671875, -0.34375, -0.1807861328125, -0.017822265625, 0.1451416015625, 0.30810546875, 0.4710693359375, 0.634033203125, 0.7969970703125, 0.9599609375, 1.1229248046875, 1.285888671875, 1.4488525390625, 1.61181640625, 1.7747802734375, 1.937744140625, 2.1007080078125, 2.263671875, 2.4266357421875, 2.589599609375, 2.7525634765625, 2.91552734375, 3.0784912109375, 3.241455078125, 3.4044189453125, 3.5673828125, 3.7303466796875, 3.893310546875, 4.0562744140625, 4.21923828125, 4.3822021484375, 4.545166015625, 4.7081298828125, 4.87109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 4.0, 9.0, 7.0, 13.0, 17.0, 17.0, 33.0, 39.0, 51.0, 86.0, 143.0, 290.0, 1326.0, 1216.0, 293.0, 170.0, 95.0, 63.0, 62.0, 25.0, 28.0, 14.0, 11.0, 13.0, 6.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.267578125, -1.23028564453125, -1.1929931640625, -1.15570068359375, -1.118408203125, -1.08111572265625, -1.0438232421875, -1.00653076171875, -0.96923828125, -0.93194580078125, -0.8946533203125, -0.85736083984375, -0.820068359375, -0.78277587890625, -0.7454833984375, -0.70819091796875, -0.6708984375, -0.63360595703125, -0.5963134765625, -0.55902099609375, -0.521728515625, -0.48443603515625, -0.4471435546875, -0.40985107421875, -0.37255859375, -0.33526611328125, -0.2979736328125, -0.26068115234375, -0.223388671875, -0.18609619140625, -0.1488037109375, -0.11151123046875, -0.07421875, -0.03692626953125, 0.0003662109375, 0.03765869140625, 0.074951171875, 0.11224365234375, 0.1495361328125, 0.18682861328125, 0.22412109375, 0.26141357421875, 0.2987060546875, 0.33599853515625, 0.373291015625, 0.41058349609375, 0.4478759765625, 0.48516845703125, 0.5224609375, 0.55975341796875, 0.5970458984375, 0.63433837890625, 0.671630859375, 0.70892333984375, 0.7462158203125, 0.78350830078125, 0.82080078125, 0.85809326171875, 0.8953857421875, 0.93267822265625, 0.969970703125, 1.00726318359375, 1.0445556640625, 1.08184814453125, 1.119140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 10.0, 12.0, 35.0, 61.0, 119.0, 168.0, 215.0, 181.0, 87.0, 52.0, 21.0, 14.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.666681289672852, -8.434228897094727, -8.201776504516602, -7.969324588775635, -7.736872673034668, -7.504420280456543, -7.271967887878418, -7.039515972137451, -6.807063579559326, -6.574611186981201, -6.342159271240234, -6.109706878662109, -5.877254962921143, -5.644802570343018, -5.412350654602051, -5.179898262023926, -4.947445869445801, -4.714993476867676, -4.482541561126709, -4.250089168548584, -4.017637252807617, -3.785184860229492, -3.5527327060699463, -3.3202805519104004, -3.0878286361694336, -2.8553764820098877, -2.622924327850342, -2.390471935272217, -2.158019781112671, -1.925567626953125, -1.693115472793579, -1.4606631994247437, -1.2282109260559082, -0.9957587122917175, -0.7633064985275269, -0.530854344367981, -0.2984021306037903, -0.06594991683959961, 0.1665022373199463, 0.39895451068878174, 0.6314066648483276, 0.8638588786125183, 1.096311092376709, 1.3287632465362549, 1.5612154006958008, 1.7936676740646362, 2.0261197090148926, 2.2585721015930176, 2.4910242557525635, 2.7234764099121094, 2.9559285640716553, 3.188380718231201, 3.420833110809326, 3.653285264968872, 3.885737419128418, 4.118189811706543, 4.35064172744751, 4.583094120025635, 4.815546035766602, 5.047998428344727, 5.280450344085693, 5.512902736663818, 5.745354652404785, 5.97780704498291, 6.210259437561035]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 8.0, 14.0, 8.0, 15.0, 24.0, 28.0, 32.0, 38.0, 49.0, 45.0, 57.0, 64.0, 63.0, 50.0, 76.0, 57.0, 55.0, 51.0, 40.0, 43.0, 42.0, 29.0, 23.0, 21.0, 11.0, 11.0, 11.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0176849365234375, -3.865354299545288, -3.7130236625671387, -3.5606930255889893, -3.40836238861084, -3.2560315132141113, -3.103700876235962, -2.9513702392578125, -2.799039602279663, -2.6467089653015137, -2.4943783283233643, -2.342047691345215, -2.1897168159484863, -2.037386417388916, -1.8850555419921875, -1.732724905014038, -1.5803942680358887, -1.4280636310577393, -1.2757329940795898, -1.1234022378921509, -0.9710716009140015, -0.818740963935852, -0.6664102673530579, -0.5140795707702637, -0.36174893379211426, -0.20941826701164246, -0.057087600231170654, 0.09524306654930115, 0.24757373332977295, 0.39990437030792236, 0.5522350668907166, 0.7045657634735107, 0.8568964004516602, 1.0092270374298096, 1.161557674407959, 1.313888430595398, 1.4662190675735474, 1.6185497045516968, 1.7708804607391357, 1.9232110977172852, 2.0755417346954346, 2.227872371673584, 2.3802030086517334, 2.532533645629883, 2.6848645210266113, 2.8371949195861816, 2.98952579498291, 3.1418564319610596, 3.294187068939209, 3.4465177059173584, 3.598848342895508, 3.7511789798736572, 3.9035096168518066, 4.055840492248535, 4.2081708908081055, 4.360501766204834, 4.5128326416015625, 4.665163516998291, 4.817493915557861, 4.96982479095459, 5.12215518951416, 5.274486064910889, 5.426816463470459, 5.5791473388671875, 5.731477737426758]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 8.0, 3.0, 9.0, 15.0, 19.0, 36.0, 42.0, 52.0, 84.0, 135.0, 187.0, 277.0, 421.0, 640.0, 965.0, 1466.0, 2357.0, 3996.0, 7152.0, 13241.0, 26334.0, 76841.0, 838088.0, 36063.0, 17703.0, 9235.0, 5023.0, 2943.0, 1784.0, 1177.0, 737.0, 473.0, 345.0, 220.0, 148.0, 112.0, 75.0, 46.0, 42.0, 17.0, 17.0, 6.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.48828125, -2.405914306640625, -2.32354736328125, -2.241180419921875, -2.1588134765625, -2.076446533203125, -1.99407958984375, -1.911712646484375, -1.829345703125, -1.746978759765625, -1.66461181640625, -1.582244873046875, -1.4998779296875, -1.417510986328125, -1.33514404296875, -1.252777099609375, -1.17041015625, -1.088043212890625, -1.00567626953125, -0.923309326171875, -0.8409423828125, -0.758575439453125, -0.67620849609375, -0.593841552734375, -0.511474609375, -0.429107666015625, -0.34674072265625, -0.264373779296875, -0.1820068359375, -0.099639892578125, -0.01727294921875, 0.065093994140625, 0.1474609375, 0.229827880859375, 0.31219482421875, 0.394561767578125, 0.4769287109375, 0.559295654296875, 0.64166259765625, 0.724029541015625, 0.806396484375, 0.888763427734375, 0.97113037109375, 1.053497314453125, 1.1358642578125, 1.218231201171875, 1.30059814453125, 1.382965087890625, 1.46533203125, 1.547698974609375, 1.63006591796875, 1.712432861328125, 1.7947998046875, 1.877166748046875, 1.95953369140625, 2.041900634765625, 2.124267578125, 2.206634521484375, 2.28900146484375, 2.371368408203125, 2.4537353515625, 2.536102294921875, 2.61846923828125, 2.700836181640625, 2.783203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 9.0, 10.0, 11.0, 6.0, 12.0, 12.0, 26.0, 405.0, 361.0, 17.0, 10.0, 15.0, 11.0, 6.0, 11.0, 8.0, 2.0, 3.0, 6.0, 3.0, 6.0, 1.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2744140625, -1.235626220703125, -1.19683837890625, -1.158050537109375, -1.1192626953125, -1.080474853515625, -1.04168701171875, -1.002899169921875, -0.964111328125, -0.925323486328125, -0.88653564453125, -0.847747802734375, -0.8089599609375, -0.770172119140625, -0.73138427734375, -0.692596435546875, -0.65380859375, -0.615020751953125, -0.57623291015625, -0.537445068359375, -0.4986572265625, -0.459869384765625, -0.42108154296875, -0.382293701171875, -0.343505859375, -0.304718017578125, -0.26593017578125, -0.227142333984375, -0.1883544921875, -0.149566650390625, -0.11077880859375, -0.071990966796875, -0.033203125, 0.005584716796875, 0.04437255859375, 0.083160400390625, 0.1219482421875, 0.160736083984375, 0.19952392578125, 0.238311767578125, 0.277099609375, 0.315887451171875, 0.35467529296875, 0.393463134765625, 0.4322509765625, 0.471038818359375, 0.50982666015625, 0.548614501953125, 0.58740234375, 0.626190185546875, 0.66497802734375, 0.703765869140625, 0.7425537109375, 0.781341552734375, 0.82012939453125, 0.858917236328125, 0.897705078125, 0.936492919921875, 0.97528076171875, 1.014068603515625, 1.0528564453125, 1.091644287109375, 1.13043212890625, 1.169219970703125, 1.2080078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 5.0, 3.0, 11.0, 8.0, 12.0, 14.0, 17.0, 13.0, 34.0, 29.0, 49.0, 61.0, 85.0, 133.0, 232.0, 466.0, 857.0, 1955.0, 5269.0, 17777.0, 79203.0, 464344.0, 388677.0, 65477.0, 15440.0, 4742.0, 1798.0, 778.0, 401.0, 218.0, 127.0, 89.0, 45.0, 38.0, 45.0, 16.0, 19.0, 12.0, 9.0, 9.0, 10.0, 5.0, 6.0, 8.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.337890625, -3.236572265625, -3.13525390625, -3.033935546875, -2.9326171875, -2.831298828125, -2.72998046875, -2.628662109375, -2.52734375, -2.426025390625, -2.32470703125, -2.223388671875, -2.1220703125, -2.020751953125, -1.91943359375, -1.818115234375, -1.716796875, -1.615478515625, -1.51416015625, -1.412841796875, -1.3115234375, -1.210205078125, -1.10888671875, -1.007568359375, -0.90625, -0.804931640625, -0.70361328125, -0.602294921875, -0.5009765625, -0.399658203125, -0.29833984375, -0.197021484375, -0.095703125, 0.005615234375, 0.10693359375, 0.208251953125, 0.3095703125, 0.410888671875, 0.51220703125, 0.613525390625, 0.71484375, 0.816162109375, 0.91748046875, 1.018798828125, 1.1201171875, 1.221435546875, 1.32275390625, 1.424072265625, 1.525390625, 1.626708984375, 1.72802734375, 1.829345703125, 1.9306640625, 2.031982421875, 2.13330078125, 2.234619140625, 2.3359375, 2.437255859375, 2.53857421875, 2.639892578125, 2.7412109375, 2.842529296875, 2.94384765625, 3.045166015625, 3.146484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 3.0, 4.0, 3.0, 16.0, 15.0, 17.0, 28.0, 25.0, 30.0, 21.0, 30.0, 36.0, 45.0, 46.0, 46.0, 37.0, 36.0, 48.0, 50.0, 53.0, 50.0, 48.0, 40.0, 38.0, 33.0, 32.0, 24.0, 16.0, 25.0, 18.0, 19.0, 9.0, 13.0, 5.0, 3.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.92578125, -4.766845703125, -4.60791015625, -4.448974609375, -4.2900390625, -4.131103515625, -3.97216796875, -3.813232421875, -3.654296875, -3.495361328125, -3.33642578125, -3.177490234375, -3.0185546875, -2.859619140625, -2.70068359375, -2.541748046875, -2.3828125, -2.223876953125, -2.06494140625, -1.906005859375, -1.7470703125, -1.588134765625, -1.42919921875, -1.270263671875, -1.111328125, -0.952392578125, -0.79345703125, -0.634521484375, -0.4755859375, -0.316650390625, -0.15771484375, 0.001220703125, 0.16015625, 0.319091796875, 0.47802734375, 0.636962890625, 0.7958984375, 0.954833984375, 1.11376953125, 1.272705078125, 1.431640625, 1.590576171875, 1.74951171875, 1.908447265625, 2.0673828125, 2.226318359375, 2.38525390625, 2.544189453125, 2.703125, 2.862060546875, 3.02099609375, 3.179931640625, 3.3388671875, 3.497802734375, 3.65673828125, 3.815673828125, 3.974609375, 4.133544921875, 4.29248046875, 4.451416015625, 4.6103515625, 4.769287109375, 4.92822265625, 5.087158203125, 5.24609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 13.0, 11.0, 35.0, 68.0, 72.0, 146.0, 296.0, 629.0, 1419.0, 3906.0, 13693.0, 80849.0, 643820.0, 261792.0, 30585.0, 7087.0, 2313.0, 926.0, 422.0, 185.0, 95.0, 59.0, 35.0, 23.0, 13.0, 12.0, 6.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9736328125, -1.8998565673828125, -1.826080322265625, -1.7523040771484375, -1.67852783203125, -1.6047515869140625, -1.530975341796875, -1.4571990966796875, -1.3834228515625, -1.3096466064453125, -1.235870361328125, -1.1620941162109375, -1.08831787109375, -1.0145416259765625, -0.940765380859375, -0.8669891357421875, -0.793212890625, -0.7194366455078125, -0.645660400390625, -0.5718841552734375, -0.49810791015625, -0.4243316650390625, -0.350555419921875, -0.2767791748046875, -0.2030029296875, -0.1292266845703125, -0.055450439453125, 0.0183258056640625, 0.09210205078125, 0.1658782958984375, 0.239654541015625, 0.3134307861328125, 0.38720703125, 0.4609832763671875, 0.534759521484375, 0.6085357666015625, 0.68231201171875, 0.7560882568359375, 0.829864501953125, 0.9036407470703125, 0.9774169921875, 1.0511932373046875, 1.124969482421875, 1.1987457275390625, 1.27252197265625, 1.3462982177734375, 1.420074462890625, 1.4938507080078125, 1.567626953125, 1.6414031982421875, 1.715179443359375, 1.7889556884765625, 1.86273193359375, 1.9365081787109375, 2.010284423828125, 2.0840606689453125, 2.1578369140625, 2.2316131591796875, 2.305389404296875, 2.3791656494140625, 2.45294189453125, 2.5267181396484375, 2.600494384765625, 2.6742706298828125, 2.748046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 9.0, 11.0, 9.0, 15.0, 17.0, 13.0, 24.0, 55.0, 71.0, 68.0, 73.0, 67.0, 94.0, 84.0, 74.0, 83.0, 45.0, 40.0, 26.0, 33.0, 19.0, 13.0, 13.0, 14.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.50366598367691e-05, -7.199123501777649e-05, -6.894581019878387e-05, -6.590038537979126e-05, -6.285496056079865e-05, -5.980953574180603e-05, -5.6764110922813416e-05, -5.37186861038208e-05, -5.0673261284828186e-05, -4.762783646583557e-05, -4.4582411646842957e-05, -4.153698682785034e-05, -3.849156200885773e-05, -3.544613718986511e-05, -3.24007123708725e-05, -2.9355287551879883e-05, -2.6309862732887268e-05, -2.3264437913894653e-05, -2.021901309490204e-05, -1.7173588275909424e-05, -1.4128163456916809e-05, -1.1082738637924194e-05, -8.03731381893158e-06, -4.991888999938965e-06, -1.94646418094635e-06, 1.0989606380462646e-06, 4.144385457038879e-06, 7.189810276031494e-06, 1.0235235095024109e-05, 1.3280659914016724e-05, 1.632608473300934e-05, 1.9371509552001953e-05, 2.2416934370994568e-05, 2.5462359189987183e-05, 2.8507784008979797e-05, 3.155320882797241e-05, 3.459863364696503e-05, 3.764405846595764e-05, 4.0689483284950256e-05, 4.373490810394287e-05, 4.6780332922935486e-05, 4.98257577419281e-05, 5.2871182560920715e-05, 5.591660737991333e-05, 5.8962032198905945e-05, 6.200745701789856e-05, 6.505288183689117e-05, 6.809830665588379e-05, 7.11437314748764e-05, 7.418915629386902e-05, 7.723458111286163e-05, 8.028000593185425e-05, 8.332543075084686e-05, 8.637085556983948e-05, 8.941628038883209e-05, 9.246170520782471e-05, 9.550713002681732e-05, 9.855255484580994e-05, 0.00010159797966480255, 0.00010464340448379517, 0.00010768882930278778, 0.0001107342541217804, 0.00011377967894077301, 0.00011682510375976562]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 15.0, 12.0, 20.0, 41.0, 73.0, 144.0, 295.0, 697.0, 2470.0, 12037.0, 148092.0, 806520.0, 67800.0, 7500.0, 1734.0, 574.0, 242.0, 141.0, 51.0, 32.0, 27.0, 14.0, 8.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0], "bins": [-5.28125, -5.1673583984375, -5.053466796875, -4.9395751953125, -4.82568359375, -4.7117919921875, -4.597900390625, -4.4840087890625, -4.3701171875, -4.2562255859375, -4.142333984375, -4.0284423828125, -3.91455078125, -3.8006591796875, -3.686767578125, -3.5728759765625, -3.458984375, -3.3450927734375, -3.231201171875, -3.1173095703125, -3.00341796875, -2.8895263671875, -2.775634765625, -2.6617431640625, -2.5478515625, -2.4339599609375, -2.320068359375, -2.2061767578125, -2.09228515625, -1.9783935546875, -1.864501953125, -1.7506103515625, -1.63671875, -1.5228271484375, -1.408935546875, -1.2950439453125, -1.18115234375, -1.0672607421875, -0.953369140625, -0.8394775390625, -0.7255859375, -0.6116943359375, -0.497802734375, -0.3839111328125, -0.27001953125, -0.1561279296875, -0.042236328125, 0.0716552734375, 0.185546875, 0.2994384765625, 0.413330078125, 0.5272216796875, 0.64111328125, 0.7550048828125, 0.868896484375, 0.9827880859375, 1.0966796875, 1.2105712890625, 1.324462890625, 1.4383544921875, 1.55224609375, 1.6661376953125, 1.780029296875, 1.8939208984375, 2.0078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 11.0, 14.0, 21.0, 40.0, 40.0, 45.0, 68.0, 72.0, 92.0, 83.0, 67.0, 103.0, 72.0, 64.0, 51.0, 47.0, 22.0, 30.0, 15.0, 13.0, 7.0, 6.0, 4.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.76190185546875, -3.6702880859375, -3.57867431640625, -3.487060546875, -3.39544677734375, -3.3038330078125, -3.21221923828125, -3.12060546875, -3.02899169921875, -2.9373779296875, -2.84576416015625, -2.754150390625, -2.66253662109375, -2.5709228515625, -2.47930908203125, -2.3876953125, -2.29608154296875, -2.2044677734375, -2.11285400390625, -2.021240234375, -1.92962646484375, -1.8380126953125, -1.74639892578125, -1.65478515625, -1.56317138671875, -1.4715576171875, -1.37994384765625, -1.288330078125, -1.19671630859375, -1.1051025390625, -1.01348876953125, -0.921875, -0.83026123046875, -0.7386474609375, -0.64703369140625, -0.555419921875, -0.46380615234375, -0.3721923828125, -0.28057861328125, -0.18896484375, -0.09735107421875, -0.0057373046875, 0.08587646484375, 0.177490234375, 0.26910400390625, 0.3607177734375, 0.45233154296875, 0.5439453125, 0.63555908203125, 0.7271728515625, 0.81878662109375, 0.910400390625, 1.00201416015625, 1.0936279296875, 1.18524169921875, 1.27685546875, 1.36846923828125, 1.4600830078125, 1.55169677734375, 1.643310546875, 1.73492431640625, 1.8265380859375, 1.91815185546875, 2.009765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 9.0, 36.0, 122.0, 344.0, 320.0, 97.0, 33.0, 10.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-91.80718231201172, -89.93212127685547, -88.05706024169922, -86.18199920654297, -84.30693054199219, -82.43186950683594, -80.55680847167969, -78.68174743652344, -76.80668640136719, -74.93162536621094, -73.05656433105469, -71.18150329589844, -69.30643463134766, -67.4313735961914, -65.55631256103516, -63.681251525878906, -61.806190490722656, -59.931129455566406, -58.05606460571289, -56.18100357055664, -54.30594253540039, -52.430877685546875, -50.555816650390625, -48.680755615234375, -46.80569076538086, -44.93062973022461, -43.055564880371094, -41.180503845214844, -39.305442810058594, -37.430381774902344, -35.55531692504883, -33.68025588989258, -31.805192947387695, -29.930130004882812, -28.055068969726562, -26.18000602722168, -24.30494499206543, -22.429882049560547, -20.554821014404297, -18.679758071899414, -16.80469512939453, -14.929633140563965, -13.054571151733398, -11.179508209228516, -9.304447174072266, -7.429384231567383, -5.554322242736816, -3.67926025390625, -1.80419921875, 0.07086288928985596, 1.945924997329712, 3.8209872245788574, 5.696049213409424, 7.571111679077148, 9.446173667907715, 11.321235656738281, 13.196297645568848, 15.071359634399414, 16.946422576904297, 18.821483612060547, 20.69654655456543, 22.571609497070312, 24.446670532226562, 26.321731567382812, 28.196794509887695]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 5.0, 5.0, 8.0, 12.0, 24.0, 37.0, 45.0, 85.0, 101.0, 111.0, 144.0, 106.0, 83.0, 61.0, 38.0, 25.0, 14.0, 9.0, 9.0, 10.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-79.60733032226562, -77.14020538330078, -74.67308044433594, -72.2059555053711, -69.73883056640625, -67.27169799804688, -64.80457305908203, -62.33744812011719, -59.870323181152344, -57.4031982421875, -54.936073303222656, -52.46894454956055, -50.0018196105957, -47.53469467163086, -45.06756591796875, -42.600440979003906, -40.13331604003906, -37.66619110107422, -35.199066162109375, -32.731937408447266, -30.264812469482422, -27.797687530517578, -25.3305606842041, -22.863433837890625, -20.39630889892578, -17.929183959960938, -15.462057113647461, -12.9949312210083, -10.52780532836914, -8.06067943572998, -5.59355354309082, -3.1264266967773438, -0.6593093872070312, 1.807816505432129, 4.274942398071289, 6.742068290710449, 9.20919418334961, 11.67632007598877, 14.14344596862793, 16.610572814941406, 19.07769775390625, 21.544822692871094, 24.01194953918457, 26.479076385498047, 28.94620132446289, 31.413326263427734, 33.880455017089844, 36.34757995605469, 38.81470489501953, 41.281829833984375, 43.74895477294922, 46.21608352661133, 48.68320846557617, 51.150333404541016, 53.617462158203125, 56.08458709716797, 58.55171203613281, 61.018836975097656, 63.4859619140625, 65.95308685302734, 68.42021179199219, 70.88734436035156, 73.3544692993164, 75.82159423828125, 78.2887191772461]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 9.0, 18.0, 26.0, 24.0, 44.0, 64.0, 69.0, 98.0, 133.0, 169.0, 287.0, 448.0, 679.0, 1118.0, 1837.0, 3474.0, 6626.0, 15836.0, 51696.0, 3949634.0, 121719.0, 22029.0, 8700.0, 4155.0, 2199.0, 1242.0, 724.0, 432.0, 260.0, 187.0, 95.0, 72.0, 54.0, 33.0, 23.0, 20.0, 7.0, 5.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.6015625, -8.3536376953125, -8.105712890625, -7.8577880859375, -7.60986328125, -7.3619384765625, -7.114013671875, -6.8660888671875, -6.6181640625, -6.3702392578125, -6.122314453125, -5.8743896484375, -5.62646484375, -5.3785400390625, -5.130615234375, -4.8826904296875, -4.634765625, -4.3868408203125, -4.138916015625, -3.8909912109375, -3.64306640625, -3.3951416015625, -3.147216796875, -2.8992919921875, -2.6513671875, -2.4034423828125, -2.155517578125, -1.9075927734375, -1.65966796875, -1.4117431640625, -1.163818359375, -0.9158935546875, -0.66796875, -0.4200439453125, -0.172119140625, 0.0758056640625, 0.32373046875, 0.5716552734375, 0.819580078125, 1.0675048828125, 1.3154296875, 1.5633544921875, 1.811279296875, 2.0592041015625, 2.30712890625, 2.5550537109375, 2.802978515625, 3.0509033203125, 3.298828125, 3.5467529296875, 3.794677734375, 4.0426025390625, 4.29052734375, 4.5384521484375, 4.786376953125, 5.0343017578125, 5.2822265625, 5.5301513671875, 5.778076171875, 6.0260009765625, 6.27392578125, 6.5218505859375, 6.769775390625, 7.0177001953125, 7.265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 8.0, 6.0, 9.0, 12.0, 14.0, 25.0, 27.0, 122.0, 360.0, 243.0, 64.0, 23.0, 12.0, 8.0, 10.0, 6.0, 7.0, 4.0, 7.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.228515625, -1.192047119140625, -1.15557861328125, -1.119110107421875, -1.0826416015625, -1.046173095703125, -1.00970458984375, -0.973236083984375, -0.936767578125, -0.900299072265625, -0.86383056640625, -0.827362060546875, -0.7908935546875, -0.754425048828125, -0.71795654296875, -0.681488037109375, -0.64501953125, -0.608551025390625, -0.57208251953125, -0.535614013671875, -0.4991455078125, -0.462677001953125, -0.42620849609375, -0.389739990234375, -0.353271484375, -0.316802978515625, -0.28033447265625, -0.243865966796875, -0.2073974609375, -0.170928955078125, -0.13446044921875, -0.097991943359375, -0.0615234375, -0.025054931640625, 0.01141357421875, 0.047882080078125, 0.0843505859375, 0.120819091796875, 0.15728759765625, 0.193756103515625, 0.230224609375, 0.266693115234375, 0.30316162109375, 0.339630126953125, 0.3760986328125, 0.412567138671875, 0.44903564453125, 0.485504150390625, 0.52197265625, 0.558441162109375, 0.59490966796875, 0.631378173828125, 0.6678466796875, 0.704315185546875, 0.74078369140625, 0.777252197265625, 0.813720703125, 0.850189208984375, 0.88665771484375, 0.923126220703125, 0.9595947265625, 0.996063232421875, 1.03253173828125, 1.069000244140625, 1.10546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 9.0, 9.0, 15.0, 23.0, 31.0, 34.0, 64.0, 100.0, 171.0, 281.0, 571.0, 1058.0, 2196.0, 4988.0, 13230.0, 46732.0, 297145.0, 3556962.0, 211781.0, 38525.0, 11562.0, 4539.0, 1994.0, 1013.0, 487.0, 287.0, 164.0, 104.0, 63.0, 43.0, 25.0, 17.0, 9.0, 12.0, 6.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.310546875, -4.1640625, -4.017578125, -3.87109375, -3.724609375, -3.578125, -3.431640625, -3.28515625, -3.138671875, -2.9921875, -2.845703125, -2.69921875, -2.552734375, -2.40625, -2.259765625, -2.11328125, -1.966796875, -1.8203125, -1.673828125, -1.52734375, -1.380859375, -1.234375, -1.087890625, -0.94140625, -0.794921875, -0.6484375, -0.501953125, -0.35546875, -0.208984375, -0.0625, 0.083984375, 0.23046875, 0.376953125, 0.5234375, 0.669921875, 0.81640625, 0.962890625, 1.109375, 1.255859375, 1.40234375, 1.548828125, 1.6953125, 1.841796875, 1.98828125, 2.134765625, 2.28125, 2.427734375, 2.57421875, 2.720703125, 2.8671875, 3.013671875, 3.16015625, 3.306640625, 3.453125, 3.599609375, 3.74609375, 3.892578125, 4.0390625, 4.185546875, 4.33203125, 4.478515625, 4.625, 4.771484375, 4.91796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 7.0, 6.0, 9.0, 18.0, 24.0, 15.0, 24.0, 38.0, 44.0, 66.0, 118.0, 147.0, 274.0, 772.0, 1535.0, 305.0, 173.0, 129.0, 85.0, 59.0, 35.0, 44.0, 25.0, 20.0, 19.0, 17.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.69921875, -0.6780929565429688, -0.6569671630859375, -0.6358413696289062, -0.614715576171875, -0.5935897827148438, -0.5724639892578125, -0.5513381958007812, -0.53021240234375, -0.5090866088867188, -0.4879608154296875, -0.46683502197265625, -0.445709228515625, -0.42458343505859375, -0.4034576416015625, -0.38233184814453125, -0.3612060546875, -0.34008026123046875, -0.3189544677734375, -0.29782867431640625, -0.276702880859375, -0.25557708740234375, -0.2344512939453125, -0.21332550048828125, -0.19219970703125, -0.17107391357421875, -0.1499481201171875, -0.12882232666015625, -0.107696533203125, -0.08657073974609375, -0.0654449462890625, -0.04431915283203125, -0.023193359375, -0.00206756591796875, 0.0190582275390625, 0.04018402099609375, 0.061309814453125, 0.08243560791015625, 0.1035614013671875, 0.12468719482421875, 0.14581298828125, 0.16693878173828125, 0.1880645751953125, 0.20919036865234375, 0.230316162109375, 0.25144195556640625, 0.2725677490234375, 0.29369354248046875, 0.3148193359375, 0.33594512939453125, 0.3570709228515625, 0.37819671630859375, 0.399322509765625, 0.42044830322265625, 0.4415740966796875, 0.46269989013671875, 0.48382568359375, 0.5049514770507812, 0.5260772705078125, 0.5472030639648438, 0.568328857421875, 0.5894546508789062, 0.6105804443359375, 0.6317062377929688, 0.65283203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 28.0, 75.0, 239.0, 327.0, 191.0, 82.0, 23.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171844005584717, -3.8986823558807373, -3.625520944595337, -3.3523592948913574, -3.079197883605957, -2.8060362339019775, -2.532874584197998, -2.2597131729125977, -1.9865515232086182, -1.7133899927139282, -1.4402284622192383, -1.1670668125152588, -0.8939052820205688, -0.6207437515258789, -0.3475821018218994, -0.07442057132720947, 0.19874095916748047, 0.4719025194644928, 0.7450640797615051, 1.0182256698608398, 1.2913872003555298, 1.5645487308502197, 1.8377103805541992, 2.1108717918395996, 2.384033441543579, 2.6571950912475586, 2.930356502532959, 3.2035181522369385, 3.476679801940918, 3.7498412132263184, 4.023002624511719, 4.296164512634277, 4.5693254470825195, 4.84248685836792, 5.1156487464904785, 5.388810157775879, 5.661971569061279, 5.93513298034668, 6.208294868469238, 6.481456279754639, 6.754617691040039, 7.0277791023254395, 7.300940990447998, 7.574102401733398, 7.847263813018799, 8.1204252243042, 8.393587112426758, 8.666749000549316, 8.939910888671875, 9.213072776794434, 9.486233711242676, 9.759395599365234, 10.032557487487793, 10.305718421936035, 10.578880310058594, 10.852042198181152, 11.125203132629395, 11.398365020751953, 11.671525955200195, 11.944687843322754, 12.217849731445312, 12.491010665893555, 12.764172554016113, 13.037334442138672, 13.310495376586914]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 10.0, 13.0, 19.0, 20.0, 32.0, 34.0, 49.0, 57.0, 61.0, 55.0, 56.0, 55.0, 80.0, 74.0, 56.0, 55.0, 45.0, 45.0, 24.0, 48.0, 19.0, 17.0, 26.0, 13.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.150112152099609, -4.027915954589844, -3.90571928024292, -3.783522844314575, -3.6613264083862305, -3.5391299724578857, -3.416933536529541, -3.2947373390197754, -3.1725406646728516, -3.050344228744507, -2.928147792816162, -2.8059513568878174, -2.6837549209594727, -2.561558485031128, -2.439362049102783, -2.3171658515930176, -2.194969415664673, -2.072772979736328, -1.9505765438079834, -1.8283801078796387, -1.706183671951294, -1.5839872360229492, -1.461790919303894, -1.3395944833755493, -1.2173980474472046, -1.0952016115188599, -0.9730051755905151, -0.8508087992668152, -0.7286123633384705, -0.6064159274101257, -0.4842195510864258, -0.36202311515808105, -0.23982644081115723, -0.1176300197839737, 0.004566401243209839, 0.12676280736923218, 0.2489592432975769, 0.37115567922592163, 0.4933520555496216, 0.6155484914779663, 0.737744927406311, 0.8599413633346558, 0.9821377992630005, 1.1043341159820557, 1.2265305519104004, 1.3487269878387451, 1.4709234237670898, 1.5931198596954346, 1.7153162956237793, 1.837512731552124, 1.9597091674804688, 2.0819056034088135, 2.204102039337158, 2.326298475265503, 2.4484949111938477, 2.5706911087036133, 2.692887783050537, 2.815084218978882, 2.9372806549072266, 3.0594770908355713, 3.181673526763916, 3.3038699626922607, 3.4260663986206055, 3.548262596130371, 3.670459032058716]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 14.0, 21.0, 9.0, 16.0, 30.0, 53.0, 101.0, 168.0, 248.0, 509.0, 956.0, 2084.0, 4951.0, 15631.0, 80481.0, 884258.0, 41496.0, 10450.0, 3781.0, 1596.0, 716.0, 405.0, 219.0, 132.0, 81.0, 51.0, 34.0, 19.0, 19.0, 8.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.37335205078125, -8.1295166015625, -7.88568115234375, -7.641845703125, -7.39801025390625, -7.1541748046875, -6.91033935546875, -6.66650390625, -6.42266845703125, -6.1788330078125, -5.93499755859375, -5.691162109375, -5.44732666015625, -5.2034912109375, -4.95965576171875, -4.7158203125, -4.47198486328125, -4.2281494140625, -3.98431396484375, -3.740478515625, -3.49664306640625, -3.2528076171875, -3.00897216796875, -2.76513671875, -2.52130126953125, -2.2774658203125, -2.03363037109375, -1.789794921875, -1.54595947265625, -1.3021240234375, -1.05828857421875, -0.814453125, -0.57061767578125, -0.3267822265625, -0.08294677734375, 0.160888671875, 0.40472412109375, 0.6485595703125, 0.89239501953125, 1.13623046875, 1.38006591796875, 1.6239013671875, 1.86773681640625, 2.111572265625, 2.35540771484375, 2.5992431640625, 2.84307861328125, 3.0869140625, 3.33074951171875, 3.5745849609375, 3.81842041015625, 4.062255859375, 4.30609130859375, 4.5499267578125, 4.79376220703125, 5.03759765625, 5.28143310546875, 5.5252685546875, 5.76910400390625, 6.012939453125, 6.25677490234375, 6.5006103515625, 6.74444580078125, 6.98828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 10.0, 11.0, 19.0, 24.0, 120.0, 273.0, 299.0, 104.0, 30.0, 10.0, 15.0, 14.0, 7.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2080078125, -1.171356201171875, -1.13470458984375, -1.098052978515625, -1.0614013671875, -1.024749755859375, -0.98809814453125, -0.951446533203125, -0.914794921875, -0.878143310546875, -0.84149169921875, -0.804840087890625, -0.7681884765625, -0.731536865234375, -0.69488525390625, -0.658233642578125, -0.62158203125, -0.584930419921875, -0.54827880859375, -0.511627197265625, -0.4749755859375, -0.438323974609375, -0.40167236328125, -0.365020751953125, -0.328369140625, -0.291717529296875, -0.25506591796875, -0.218414306640625, -0.1817626953125, -0.145111083984375, -0.10845947265625, -0.071807861328125, -0.03515625, 0.001495361328125, 0.03814697265625, 0.074798583984375, 0.1114501953125, 0.148101806640625, 0.18475341796875, 0.221405029296875, 0.258056640625, 0.294708251953125, 0.33135986328125, 0.368011474609375, 0.4046630859375, 0.441314697265625, 0.47796630859375, 0.514617919921875, 0.55126953125, 0.587921142578125, 0.62457275390625, 0.661224365234375, 0.6978759765625, 0.734527587890625, 0.77117919921875, 0.807830810546875, 0.844482421875, 0.881134033203125, 0.91778564453125, 0.954437255859375, 0.9910888671875, 1.027740478515625, 1.06439208984375, 1.101043701171875, 1.1376953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 3.0, 13.0, 16.0, 29.0, 32.0, 62.0, 83.0, 117.0, 197.0, 356.0, 630.0, 1374.0, 3072.0, 8714.0, 34732.0, 232065.0, 626156.0, 109950.0, 20192.0, 6031.0, 2335.0, 1110.0, 524.0, 278.0, 163.0, 101.0, 69.0, 47.0, 24.0, 24.0, 16.0, 9.0, 7.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.574920654296875, -3.44866943359375, -3.322418212890625, -3.1961669921875, -3.069915771484375, -2.94366455078125, -2.817413330078125, -2.691162109375, -2.564910888671875, -2.43865966796875, -2.312408447265625, -2.1861572265625, -2.059906005859375, -1.93365478515625, -1.807403564453125, -1.68115234375, -1.554901123046875, -1.42864990234375, -1.302398681640625, -1.1761474609375, -1.049896240234375, -0.92364501953125, -0.797393798828125, -0.671142578125, -0.544891357421875, -0.41864013671875, -0.292388916015625, -0.1661376953125, -0.039886474609375, 0.08636474609375, 0.212615966796875, 0.3388671875, 0.465118408203125, 0.59136962890625, 0.717620849609375, 0.8438720703125, 0.970123291015625, 1.09637451171875, 1.222625732421875, 1.348876953125, 1.475128173828125, 1.60137939453125, 1.727630615234375, 1.8538818359375, 1.980133056640625, 2.10638427734375, 2.232635498046875, 2.35888671875, 2.485137939453125, 2.61138916015625, 2.737640380859375, 2.8638916015625, 2.990142822265625, 3.11639404296875, 3.242645263671875, 3.368896484375, 3.495147705078125, 3.62139892578125, 3.747650146484375, 3.8739013671875, 4.000152587890625, 4.12640380859375, 4.252655029296875, 4.37890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 4.0, 14.0, 11.0, 13.0, 10.0, 21.0, 28.0, 30.0, 41.0, 45.0, 38.0, 44.0, 51.0, 64.0, 44.0, 66.0, 51.0, 42.0, 59.0, 42.0, 49.0, 46.0, 44.0, 35.0, 24.0, 18.0, 16.0, 10.0, 15.0, 4.0, 1.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.39453125, -3.294921875, -3.1953125, -3.095703125, -2.99609375, -2.896484375, -2.796875, -2.697265625, -2.59765625, -2.498046875, -2.3984375, -2.298828125, -2.19921875, -2.099609375, -2.0, -1.900390625, -1.80078125, -1.701171875, -1.6015625, -1.501953125, -1.40234375, -1.302734375, -1.203125, -1.103515625, -1.00390625, -0.904296875, -0.8046875, -0.705078125, -0.60546875, -0.505859375, -0.40625, -0.306640625, -0.20703125, -0.107421875, -0.0078125, 0.091796875, 0.19140625, 0.291015625, 0.390625, 0.490234375, 0.58984375, 0.689453125, 0.7890625, 0.888671875, 0.98828125, 1.087890625, 1.1875, 1.287109375, 1.38671875, 1.486328125, 1.5859375, 1.685546875, 1.78515625, 1.884765625, 1.984375, 2.083984375, 2.18359375, 2.283203125, 2.3828125, 2.482421875, 2.58203125, 2.681640625, 2.78125, 2.880859375, 2.98046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 20.0, 41.0, 61.0, 114.0, 226.0, 463.0, 952.0, 2378.0, 6863.0, 26457.0, 157620.0, 597825.0, 208668.0, 33621.0, 8239.0, 2774.0, 1104.0, 518.0, 261.0, 130.0, 71.0, 42.0, 26.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.889984130859375, -3.79168701171875, -3.693389892578125, -3.5950927734375, -3.496795654296875, -3.39849853515625, -3.300201416015625, -3.201904296875, -3.103607177734375, -3.00531005859375, -2.907012939453125, -2.8087158203125, -2.710418701171875, -2.61212158203125, -2.513824462890625, -2.41552734375, -2.317230224609375, -2.21893310546875, -2.120635986328125, -2.0223388671875, -1.924041748046875, -1.82574462890625, -1.727447509765625, -1.629150390625, -1.530853271484375, -1.43255615234375, -1.334259033203125, -1.2359619140625, -1.137664794921875, -1.03936767578125, -0.941070556640625, -0.8427734375, -0.744476318359375, -0.64617919921875, -0.547882080078125, -0.4495849609375, -0.351287841796875, -0.25299072265625, -0.154693603515625, -0.056396484375, 0.041900634765625, 0.14019775390625, 0.238494873046875, 0.3367919921875, 0.435089111328125, 0.53338623046875, 0.631683349609375, 0.72998046875, 0.828277587890625, 0.92657470703125, 1.024871826171875, 1.1231689453125, 1.221466064453125, 1.31976318359375, 1.418060302734375, 1.516357421875, 1.614654541015625, 1.71295166015625, 1.811248779296875, 1.9095458984375, 2.007843017578125, 2.10614013671875, 2.204437255859375, 2.302734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 6.0, 10.0, 9.0, 14.0, 22.0, 17.0, 41.0, 81.0, 114.0, 157.0, 162.0, 124.0, 91.0, 37.0, 30.0, 23.0, 14.0, 13.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0003840923309326172, -0.00037495605647563934, -0.0003658197820186615, -0.00035668350756168365, -0.0003475472331047058, -0.00033841095864772797, -0.0003292746841907501, -0.0003201384097337723, -0.00031100213527679443, -0.0003018658608198166, -0.00029272958636283875, -0.0002835933119058609, -0.00027445703744888306, -0.0002653207629919052, -0.00025618448853492737, -0.0002470482140779495, -0.00023791193962097168, -0.00022877566516399384, -0.000219639390707016, -0.00021050311625003815, -0.0002013668417930603, -0.00019223056733608246, -0.00018309429287910461, -0.00017395801842212677, -0.00016482174396514893, -0.00015568546950817108, -0.00014654919505119324, -0.0001374129205942154, -0.00012827664613723755, -0.0001191403716802597, -0.00011000409722328186, -0.00010086782276630402, -9.173154830932617e-05, -8.259527385234833e-05, -7.345899939537048e-05, -6.432272493839264e-05, -5.5186450481414795e-05, -4.605017602443695e-05, -3.6913901567459106e-05, -2.7777627110481262e-05, -1.8641352653503418e-05, -9.505078196525574e-06, -3.688037395477295e-07, 8.767470717430115e-06, 1.790374517440796e-05, 2.7040019631385803e-05, 3.617629408836365e-05, 4.531256854534149e-05, 5.4448843002319336e-05, 6.358511745929718e-05, 7.272139191627502e-05, 8.185766637325287e-05, 9.099394083023071e-05, 0.00010013021528720856, 0.0001092664897441864, 0.00011840276420116425, 0.0001275390386581421, 0.00013667531311511993, 0.00014581158757209778, 0.00015494786202907562, 0.00016408413648605347, 0.0001732204109430313, 0.00018235668540000916, 0.000191492959856987, 0.00020062923431396484]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 8.0, 11.0, 21.0, 22.0, 33.0, 52.0, 102.0, 151.0, 225.0, 399.0, 688.0, 1159.0, 2172.0, 4539.0, 10820.0, 29567.0, 97519.0, 299478.0, 379951.0, 149010.0, 44790.0, 15144.0, 6206.0, 2901.0, 1509.0, 791.0, 469.0, 319.0, 174.0, 95.0, 62.0, 55.0, 22.0, 24.0, 16.0, 13.0, 11.0, 4.0, 5.0, 1.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.368682861328125, -1.30963134765625, -1.250579833984375, -1.1915283203125, -1.132476806640625, -1.07342529296875, -1.014373779296875, -0.955322265625, -0.896270751953125, -0.83721923828125, -0.778167724609375, -0.7191162109375, -0.660064697265625, -0.60101318359375, -0.541961669921875, -0.48291015625, -0.423858642578125, -0.36480712890625, -0.305755615234375, -0.2467041015625, -0.187652587890625, -0.12860107421875, -0.069549560546875, -0.010498046875, 0.048553466796875, 0.10760498046875, 0.166656494140625, 0.2257080078125, 0.284759521484375, 0.34381103515625, 0.402862548828125, 0.4619140625, 0.520965576171875, 0.58001708984375, 0.639068603515625, 0.6981201171875, 0.757171630859375, 0.81622314453125, 0.875274658203125, 0.934326171875, 0.993377685546875, 1.05242919921875, 1.111480712890625, 1.1705322265625, 1.229583740234375, 1.28863525390625, 1.347686767578125, 1.40673828125, 1.465789794921875, 1.52484130859375, 1.583892822265625, 1.6429443359375, 1.701995849609375, 1.76104736328125, 1.820098876953125, 1.879150390625, 1.938201904296875, 1.99725341796875, 2.056304931640625, 2.1153564453125, 2.174407958984375, 2.23345947265625, 2.292510986328125, 2.3515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 16.0, 19.0, 27.0, 27.0, 41.0, 44.0, 69.0, 78.0, 90.0, 83.0, 77.0, 80.0, 64.0, 64.0, 51.0, 34.0, 38.0, 25.0, 19.0, 14.0, 8.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5512237548828125, -1.494049072265625, -1.4368743896484375, -1.37969970703125, -1.3225250244140625, -1.265350341796875, -1.2081756591796875, -1.1510009765625, -1.0938262939453125, -1.036651611328125, -0.9794769287109375, -0.92230224609375, -0.8651275634765625, -0.807952880859375, -0.7507781982421875, -0.693603515625, -0.6364288330078125, -0.579254150390625, -0.5220794677734375, -0.46490478515625, -0.4077301025390625, -0.350555419921875, -0.2933807373046875, -0.2362060546875, -0.1790313720703125, -0.121856689453125, -0.0646820068359375, -0.00750732421875, 0.0496673583984375, 0.106842041015625, 0.1640167236328125, 0.22119140625, 0.2783660888671875, 0.335540771484375, 0.3927154541015625, 0.44989013671875, 0.5070648193359375, 0.564239501953125, 0.6214141845703125, 0.6785888671875, 0.7357635498046875, 0.792938232421875, 0.8501129150390625, 0.90728759765625, 0.9644622802734375, 1.021636962890625, 1.0788116455078125, 1.135986328125, 1.1931610107421875, 1.250335693359375, 1.3075103759765625, 1.36468505859375, 1.4218597412109375, 1.479034423828125, 1.5362091064453125, 1.5933837890625, 1.6505584716796875, 1.707733154296875, 1.7649078369140625, 1.82208251953125, 1.8792572021484375, 1.936431884765625, 1.9936065673828125, 2.05078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 21.0, 157.0, 446.0, 287.0, 64.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.80026626586914, -34.07546615600586, -32.350669860839844, -30.625869750976562, -28.901073455810547, -27.176273345947266, -25.451475143432617, -23.72667694091797, -22.00187873840332, -20.277080535888672, -18.552282333374023, -16.827484130859375, -15.10268497467041, -13.377886772155762, -11.653087615966797, -9.928289413452148, -8.2034912109375, -6.478693008422852, -4.753894329071045, -3.0290956497192383, -1.3042974472045898, 0.4205007553100586, 2.1452999114990234, 3.870098114013672, 5.59489631652832, 7.319694519042969, 9.044492721557617, 10.769291877746582, 12.49409008026123, 14.218888282775879, 15.943687438964844, 17.668485641479492, 19.393287658691406, 21.118085861206055, 22.842884063720703, 24.567684173583984, 26.29248046875, 28.01728057861328, 29.74207878112793, 31.466876983642578, 33.191673278808594, 34.916473388671875, 36.64126968383789, 38.36606979370117, 40.09086608886719, 41.81566619873047, 43.54046630859375, 45.265262603759766, 46.99006271362305, 48.71486282348633, 50.439659118652344, 52.164459228515625, 53.88925552368164, 55.61405563354492, 57.33885192871094, 59.06365203857422, 60.7884521484375, 62.51325225830078, 64.23805236816406, 65.96284484863281, 67.6876449584961, 69.41244506835938, 71.13724517822266, 72.86204528808594, 74.58683776855469]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 4.0, 21.0, 30.0, 31.0, 54.0, 60.0, 90.0, 88.0, 112.0, 89.0, 89.0, 78.0, 64.0, 46.0, 43.0, 23.0, 9.0, 14.0, 10.0, 1.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.830583572387695, -25.822338104248047, -24.814090728759766, -23.805843353271484, -22.797597885131836, -21.789352416992188, -20.781105041503906, -19.772857666015625, -18.764612197875977, -17.756366729736328, -16.748119354248047, -15.739872932434082, -14.731626510620117, -13.723380088806152, -12.715133666992188, -11.706887245178223, -10.698640823364258, -9.690394401550293, -8.682147979736328, -7.673901557922363, -6.665655136108398, -5.657408714294434, -4.649162292480469, -3.640915870666504, -2.632669448852539, -1.6244230270385742, -0.6161766052246094, 0.39206981658935547, 1.4003162384033203, 2.408562660217285, 3.41680908203125, 4.425055503845215, 5.433300018310547, 6.441546440124512, 7.449792861938477, 8.458039283752441, 9.466285705566406, 10.474532127380371, 11.482778549194336, 12.4910249710083, 13.499271392822266, 14.50751781463623, 15.515764236450195, 16.524009704589844, 17.532257080078125, 18.540504455566406, 19.548749923706055, 20.556995391845703, 21.565242767333984, 22.573490142822266, 23.581735610961914, 24.589981079101562, 25.598228454589844, 26.606475830078125, 27.614721298217773, 28.622966766357422, 29.631214141845703, 30.639461517333984, 31.647706985473633, 32.65595245361328, 33.66419982910156, 34.672447204589844, 35.680694580078125, 36.68893814086914, 37.69718551635742]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 6.0, 18.0, 14.0, 14.0, 16.0, 25.0, 35.0, 29.0, 43.0, 54.0, 66.0, 78.0, 84.0, 115.0, 171.0, 213.0, 316.0, 465.0, 721.0, 1111.0, 1972.0, 3832.0, 9098.0, 31565.0, 855849.0, 3235037.0, 35028.0, 9111.0, 3891.0, 2030.0, 1132.0, 698.0, 438.0, 305.0, 193.0, 129.0, 86.0, 65.0, 52.0, 36.0, 28.0, 21.0, 20.0, 18.0, 13.0, 6.0, 3.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-10.7265625, -10.411376953125, -10.09619140625, -9.781005859375, -9.4658203125, -9.150634765625, -8.83544921875, -8.520263671875, -8.205078125, -7.889892578125, -7.57470703125, -7.259521484375, -6.9443359375, -6.629150390625, -6.31396484375, -5.998779296875, -5.68359375, -5.368408203125, -5.05322265625, -4.738037109375, -4.4228515625, -4.107666015625, -3.79248046875, -3.477294921875, -3.162109375, -2.846923828125, -2.53173828125, -2.216552734375, -1.9013671875, -1.586181640625, -1.27099609375, -0.955810546875, -0.640625, -0.325439453125, -0.01025390625, 0.304931640625, 0.6201171875, 0.935302734375, 1.25048828125, 1.565673828125, 1.880859375, 2.196044921875, 2.51123046875, 2.826416015625, 3.1416015625, 3.456787109375, 3.77197265625, 4.087158203125, 4.40234375, 4.717529296875, 5.03271484375, 5.347900390625, 5.6630859375, 5.978271484375, 6.29345703125, 6.608642578125, 6.923828125, 7.239013671875, 7.55419921875, 7.869384765625, 8.1845703125, 8.499755859375, 8.81494140625, 9.130126953125, 9.4453125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 10.0, 19.0, 34.0, 92.0, 228.0, 264.0, 174.0, 67.0, 18.0, 11.0, 12.0, 9.0, 13.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1659698486328125, -1.129791259765625, -1.0936126708984375, -1.05743408203125, -1.0212554931640625, -0.985076904296875, -0.9488983154296875, -0.9127197265625, -0.8765411376953125, -0.840362548828125, -0.8041839599609375, -0.76800537109375, -0.7318267822265625, -0.695648193359375, -0.6594696044921875, -0.623291015625, -0.5871124267578125, -0.550933837890625, -0.5147552490234375, -0.47857666015625, -0.4423980712890625, -0.406219482421875, -0.3700408935546875, -0.3338623046875, -0.2976837158203125, -0.261505126953125, -0.2253265380859375, -0.18914794921875, -0.1529693603515625, -0.116790771484375, -0.0806121826171875, -0.04443359375, -0.0082550048828125, 0.027923583984375, 0.0641021728515625, 0.10028076171875, 0.1364593505859375, 0.172637939453125, 0.2088165283203125, 0.2449951171875, 0.2811737060546875, 0.317352294921875, 0.3535308837890625, 0.38970947265625, 0.4258880615234375, 0.462066650390625, 0.4982452392578125, 0.534423828125, 0.5706024169921875, 0.606781005859375, 0.6429595947265625, 0.67913818359375, 0.7153167724609375, 0.751495361328125, 0.7876739501953125, 0.8238525390625, 0.8600311279296875, 0.896209716796875, 0.9323883056640625, 0.96856689453125, 1.0047454833984375, 1.040924072265625, 1.0771026611328125, 1.11328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 12.0, 15.0, 20.0, 33.0, 74.0, 119.0, 217.0, 610.0, 1869.0, 8010.0, 50205.0, 2162129.0, 1910442.0, 49552.0, 7909.0, 1887.0, 571.0, 281.0, 121.0, 64.0, 34.0, 34.0, 16.0, 11.0, 13.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.366943359375, -10.06201171875, -9.757080078125, -9.4521484375, -9.147216796875, -8.84228515625, -8.537353515625, -8.232421875, -7.927490234375, -7.62255859375, -7.317626953125, -7.0126953125, -6.707763671875, -6.40283203125, -6.097900390625, -5.79296875, -5.488037109375, -5.18310546875, -4.878173828125, -4.5732421875, -4.268310546875, -3.96337890625, -3.658447265625, -3.353515625, -3.048583984375, -2.74365234375, -2.438720703125, -2.1337890625, -1.828857421875, -1.52392578125, -1.218994140625, -0.9140625, -0.609130859375, -0.30419921875, 0.000732421875, 0.3056640625, 0.610595703125, 0.91552734375, 1.220458984375, 1.525390625, 1.830322265625, 2.13525390625, 2.440185546875, 2.7451171875, 3.050048828125, 3.35498046875, 3.659912109375, 3.96484375, 4.269775390625, 4.57470703125, 4.879638671875, 5.1845703125, 5.489501953125, 5.79443359375, 6.099365234375, 6.404296875, 6.709228515625, 7.01416015625, 7.319091796875, 7.6240234375, 7.928955078125, 8.23388671875, 8.538818359375, 8.84375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 8.0, 12.0, 16.0, 17.0, 30.0, 32.0, 51.0, 97.0, 130.0, 213.0, 401.0, 1559.0, 775.0, 265.0, 158.0, 84.0, 53.0, 37.0, 32.0, 25.0, 13.0, 16.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.05078125, -1.016693115234375, -0.98260498046875, -0.948516845703125, -0.9144287109375, -0.880340576171875, -0.84625244140625, -0.812164306640625, -0.778076171875, -0.743988037109375, -0.70989990234375, -0.675811767578125, -0.6417236328125, -0.607635498046875, -0.57354736328125, -0.539459228515625, -0.50537109375, -0.471282958984375, -0.43719482421875, -0.403106689453125, -0.3690185546875, -0.334930419921875, -0.30084228515625, -0.266754150390625, -0.232666015625, -0.198577880859375, -0.16448974609375, -0.130401611328125, -0.0963134765625, -0.062225341796875, -0.02813720703125, 0.005950927734375, 0.0400390625, 0.074127197265625, 0.10821533203125, 0.142303466796875, 0.1763916015625, 0.210479736328125, 0.24456787109375, 0.278656005859375, 0.312744140625, 0.346832275390625, 0.38092041015625, 0.415008544921875, 0.4490966796875, 0.483184814453125, 0.51727294921875, 0.551361083984375, 0.58544921875, 0.619537353515625, 0.65362548828125, 0.687713623046875, 0.7218017578125, 0.755889892578125, 0.78997802734375, 0.824066162109375, 0.858154296875, 0.892242431640625, 0.92633056640625, 0.960418701171875, 0.9945068359375, 1.028594970703125, 1.06268310546875, 1.096771240234375, 1.130859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 13.0, 45.0, 113.0, 270.0, 302.0, 158.0, 61.0, 20.0, 13.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.459372520446777, -4.064705848693848, -3.670039653778076, -3.2753732204437256, -2.880706787109375, -2.4860403537750244, -2.091373920440674, -1.6967074871063232, -1.3020410537719727, -0.9073746204376221, -0.5127081871032715, -0.1180417537689209, 0.2766246795654297, 0.6712911128997803, 1.0659575462341309, 1.4606239795684814, 1.855290412902832, 2.2499568462371826, 2.644623279571533, 3.039289712905884, 3.4339561462402344, 3.828622579574585, 4.2232890129089355, 4.617955207824707, 5.012621879577637, 5.407288551330566, 5.801954746246338, 6.196620941162109, 6.591287612915039, 6.985954284667969, 7.38062047958374, 7.775286674499512, 8.169954299926758, 8.564620971679688, 8.959287643432617, 9.35395336151123, 9.74862003326416, 10.14328670501709, 10.537952423095703, 10.932619094848633, 11.327285766601562, 11.721952438354492, 12.116619110107422, 12.511284828186035, 12.905951499938965, 13.300618171691895, 13.695283889770508, 14.089950561523438, 14.484617233276367, 14.879283905029297, 15.273950576782227, 15.66861629486084, 16.063282012939453, 16.457948684692383, 16.852615356445312, 17.247282028198242, 17.641948699951172, 18.0366153717041, 18.43128204345703, 18.82594871520996, 19.22061538696289, 19.615280151367188, 20.009946823120117, 20.404613494873047, 20.799280166625977]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 6.0, 9.0, 15.0, 18.0, 28.0, 29.0, 40.0, 32.0, 46.0, 39.0, 42.0, 36.0, 44.0, 43.0, 42.0, 43.0, 49.0, 49.0, 57.0, 34.0, 38.0, 38.0, 45.0, 26.0, 24.0, 25.0, 15.0, 13.0, 11.0, 9.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.964128255844116, -3.844958782196045, -3.7257893085479736, -3.6066198348999023, -3.487450361251831, -3.3682808876037598, -3.2491111755371094, -3.129941701889038, -3.010772228240967, -2.8916027545928955, -2.772433280944824, -2.653263807296753, -2.5340943336486816, -2.4149246215820312, -2.295755386352539, -2.1765856742858887, -2.0574164390563965, -1.9382469654083252, -1.819077491760254, -1.6999080181121826, -1.5807384252548218, -1.4615689516067505, -1.3423994779586792, -1.2232298851013184, -1.104060411453247, -0.9848909378051758, -0.8657214045524597, -0.7465519309043884, -0.6273823976516724, -0.5082129240036011, -0.3890434503555298, -0.2698739171028137, -0.15070438385009766, -0.031534887850284576, 0.0876346081495285, 0.206804096698761, 0.32597360014915466, 0.44514310359954834, 0.5643125772476196, 0.6834821105003357, 0.802651584148407, 0.9218210577964783, 1.0409905910491943, 1.1601600646972656, 1.279329538345337, 1.3984990119934082, 1.5176684856414795, 1.6368380784988403, 1.7560075521469116, 1.875177025794983, 1.9943464994430542, 2.113516092300415, 2.2326855659484863, 2.3518550395965576, 2.471024513244629, 2.5901939868927, 2.7093634605407715, 2.8285329341888428, 2.947702407836914, 3.0668718814849854, 3.1860413551330566, 3.305211067199707, 3.424380302429199, 3.5435500144958496, 3.662719488143921]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 14.0, 17.0, 27.0, 33.0, 36.0, 53.0, 72.0, 134.0, 161.0, 247.0, 440.0, 613.0, 1167.0, 2014.0, 4156.0, 9708.0, 31405.0, 275260.0, 638971.0, 58001.0, 14200.0, 5601.0, 2682.0, 1330.0, 785.0, 466.0, 291.0, 197.0, 130.0, 105.0, 71.0, 41.0, 26.0, 28.0, 18.0, 13.0, 10.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.78125, -7.5467529296875, -7.312255859375, -7.0777587890625, -6.84326171875, -6.6087646484375, -6.374267578125, -6.1397705078125, -5.9052734375, -5.6707763671875, -5.436279296875, -5.2017822265625, -4.96728515625, -4.7327880859375, -4.498291015625, -4.2637939453125, -4.029296875, -3.7947998046875, -3.560302734375, -3.3258056640625, -3.09130859375, -2.8568115234375, -2.622314453125, -2.3878173828125, -2.1533203125, -1.9188232421875, -1.684326171875, -1.4498291015625, -1.21533203125, -0.9808349609375, -0.746337890625, -0.5118408203125, -0.27734375, -0.0428466796875, 0.191650390625, 0.4261474609375, 0.66064453125, 0.8951416015625, 1.129638671875, 1.3641357421875, 1.5986328125, 1.8331298828125, 2.067626953125, 2.3021240234375, 2.53662109375, 2.7711181640625, 3.005615234375, 3.2401123046875, 3.474609375, 3.7091064453125, 3.943603515625, 4.1781005859375, 4.41259765625, 4.6470947265625, 4.881591796875, 5.1160888671875, 5.3505859375, 5.5850830078125, 5.819580078125, 6.0540771484375, 6.28857421875, 6.5230712890625, 6.757568359375, 6.9920654296875, 7.2265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 15.0, 11.0, 23.0, 48.0, 126.0, 219.0, 227.0, 155.0, 81.0, 30.0, 16.0, 5.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1429595947265625, -1.106231689453125, -1.0695037841796875, -1.03277587890625, -0.9960479736328125, -0.959320068359375, -0.9225921630859375, -0.8858642578125, -0.8491363525390625, -0.812408447265625, -0.7756805419921875, -0.73895263671875, -0.7022247314453125, -0.665496826171875, -0.6287689208984375, -0.592041015625, -0.5553131103515625, -0.518585205078125, -0.4818572998046875, -0.44512939453125, -0.4084014892578125, -0.371673583984375, -0.3349456787109375, -0.2982177734375, -0.2614898681640625, -0.224761962890625, -0.1880340576171875, -0.15130615234375, -0.1145782470703125, -0.077850341796875, -0.0411224365234375, -0.00439453125, 0.0323333740234375, 0.069061279296875, 0.1057891845703125, 0.14251708984375, 0.1792449951171875, 0.215972900390625, 0.2527008056640625, 0.2894287109375, 0.3261566162109375, 0.362884521484375, 0.3996124267578125, 0.43634033203125, 0.4730682373046875, 0.509796142578125, 0.5465240478515625, 0.583251953125, 0.6199798583984375, 0.656707763671875, 0.6934356689453125, 0.73016357421875, 0.7668914794921875, 0.803619384765625, 0.8403472900390625, 0.8770751953125, 0.9138031005859375, 0.950531005859375, 0.9872589111328125, 1.02398681640625, 1.0607147216796875, 1.097442626953125, 1.1341705322265625, 1.1708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 10.0, 13.0, 9.0, 20.0, 31.0, 34.0, 45.0, 84.0, 110.0, 208.0, 319.0, 599.0, 1075.0, 2420.0, 6692.0, 25702.0, 146765.0, 573429.0, 236100.0, 39787.0, 9174.0, 2940.0, 1324.0, 644.0, 355.0, 229.0, 139.0, 75.0, 43.0, 34.0, 36.0, 24.0, 14.0, 9.0, 15.0, 8.0, 8.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8359375, -6.61981201171875, -6.4036865234375, -6.18756103515625, -5.971435546875, -5.75531005859375, -5.5391845703125, -5.32305908203125, -5.10693359375, -4.89080810546875, -4.6746826171875, -4.45855712890625, -4.242431640625, -4.02630615234375, -3.8101806640625, -3.59405517578125, -3.3779296875, -3.16180419921875, -2.9456787109375, -2.72955322265625, -2.513427734375, -2.29730224609375, -2.0811767578125, -1.86505126953125, -1.64892578125, -1.43280029296875, -1.2166748046875, -1.00054931640625, -0.784423828125, -0.56829833984375, -0.3521728515625, -0.13604736328125, 0.080078125, 0.29620361328125, 0.5123291015625, 0.72845458984375, 0.944580078125, 1.16070556640625, 1.3768310546875, 1.59295654296875, 1.80908203125, 2.02520751953125, 2.2413330078125, 2.45745849609375, 2.673583984375, 2.88970947265625, 3.1058349609375, 3.32196044921875, 3.5380859375, 3.75421142578125, 3.9703369140625, 4.18646240234375, 4.402587890625, 4.61871337890625, 4.8348388671875, 5.05096435546875, 5.26708984375, 5.48321533203125, 5.6993408203125, 5.91546630859375, 6.131591796875, 6.34771728515625, 6.5638427734375, 6.77996826171875, 6.99609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 10.0, 12.0, 6.0, 19.0, 20.0, 29.0, 28.0, 40.0, 29.0, 32.0, 44.0, 35.0, 47.0, 41.0, 44.0, 50.0, 38.0, 40.0, 46.0, 38.0, 36.0, 35.0, 39.0, 29.0, 24.0, 29.0, 23.0, 17.0, 15.0, 9.0, 10.0, 11.0, 12.0, 9.0, 4.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.9781494140625, -2.884033203125, -2.7899169921875, -2.69580078125, -2.6016845703125, -2.507568359375, -2.4134521484375, -2.3193359375, -2.2252197265625, -2.131103515625, -2.0369873046875, -1.94287109375, -1.8487548828125, -1.754638671875, -1.6605224609375, -1.56640625, -1.4722900390625, -1.378173828125, -1.2840576171875, -1.18994140625, -1.0958251953125, -1.001708984375, -0.9075927734375, -0.8134765625, -0.7193603515625, -0.625244140625, -0.5311279296875, -0.43701171875, -0.3428955078125, -0.248779296875, -0.1546630859375, -0.060546875, 0.0335693359375, 0.127685546875, 0.2218017578125, 0.31591796875, 0.4100341796875, 0.504150390625, 0.5982666015625, 0.6923828125, 0.7864990234375, 0.880615234375, 0.9747314453125, 1.06884765625, 1.1629638671875, 1.257080078125, 1.3511962890625, 1.4453125, 1.5394287109375, 1.633544921875, 1.7276611328125, 1.82177734375, 1.9158935546875, 2.010009765625, 2.1041259765625, 2.1982421875, 2.2923583984375, 2.386474609375, 2.4805908203125, 2.57470703125, 2.6688232421875, 2.762939453125, 2.8570556640625, 2.951171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 19.0, 25.0, 35.0, 54.0, 74.0, 109.0, 183.0, 322.0, 554.0, 951.0, 1905.0, 3859.0, 8053.0, 18830.0, 49886.0, 147762.0, 368893.0, 286866.0, 99083.0, 34620.0, 13793.0, 6171.0, 2934.0, 1502.0, 792.0, 497.0, 287.0, 162.0, 111.0, 61.0, 45.0, 26.0, 14.0, 24.0, 9.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.8515625, -2.764678955078125, -2.67779541015625, -2.590911865234375, -2.5040283203125, -2.417144775390625, -2.33026123046875, -2.243377685546875, -2.156494140625, -2.069610595703125, -1.98272705078125, -1.895843505859375, -1.8089599609375, -1.722076416015625, -1.63519287109375, -1.548309326171875, -1.46142578125, -1.374542236328125, -1.28765869140625, -1.200775146484375, -1.1138916015625, -1.027008056640625, -0.94012451171875, -0.853240966796875, -0.766357421875, -0.679473876953125, -0.59259033203125, -0.505706787109375, -0.4188232421875, -0.331939697265625, -0.24505615234375, -0.158172607421875, -0.0712890625, 0.015594482421875, 0.10247802734375, 0.189361572265625, 0.2762451171875, 0.363128662109375, 0.45001220703125, 0.536895751953125, 0.623779296875, 0.710662841796875, 0.79754638671875, 0.884429931640625, 0.9713134765625, 1.058197021484375, 1.14508056640625, 1.231964111328125, 1.31884765625, 1.405731201171875, 1.49261474609375, 1.579498291015625, 1.6663818359375, 1.753265380859375, 1.84014892578125, 1.927032470703125, 2.013916015625, 2.100799560546875, 2.18768310546875, 2.274566650390625, 2.3614501953125, 2.448333740234375, 2.53521728515625, 2.622100830078125, 2.708984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 13.0, 21.0, 42.0, 43.0, 89.0, 117.0, 148.0, 158.0, 119.0, 67.0, 51.0, 33.0, 24.0, 15.0, 7.0, 10.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000804901123046875, -0.0007818490266799927, -0.0007587969303131104, -0.000735744833946228, -0.0007126927375793457, -0.0006896406412124634, -0.0006665885448455811, -0.0006435364484786987, -0.0006204843521118164, -0.0005974322557449341, -0.0005743801593780518, -0.0005513280630111694, -0.0005282759666442871, -0.0005052238702774048, -0.00048217177391052246, -0.00045911967754364014, -0.0004360675811767578, -0.0004130154848098755, -0.00038996338844299316, -0.00036691129207611084, -0.0003438591957092285, -0.0003208070993423462, -0.00029775500297546387, -0.00027470290660858154, -0.0002516508102416992, -0.0002285987138748169, -0.00020554661750793457, -0.00018249452114105225, -0.00015944242477416992, -0.0001363903284072876, -0.00011333823204040527, -9.028613567352295e-05, -6.723403930664062e-05, -4.41819429397583e-05, -2.1129846572875977e-05, 1.9222497940063477e-06, 2.4974346160888672e-05, 4.8026442527770996e-05, 7.107853889465332e-05, 9.413063526153564e-05, 0.00011718273162841797, 0.0001402348279953003, 0.00016328692436218262, 0.00018633902072906494, 0.00020939111709594727, 0.0002324432134628296, 0.0002554953098297119, 0.00027854740619659424, 0.00030159950256347656, 0.0003246515989303589, 0.0003477036952972412, 0.00037075579166412354, 0.00039380788803100586, 0.0004168599843978882, 0.0004399120807647705, 0.00046296417713165283, 0.00048601627349853516, 0.0005090683698654175, 0.0005321204662322998, 0.0005551725625991821, 0.0005782246589660645, 0.0006012767553329468, 0.0006243288516998291, 0.0006473809480667114, 0.0006704330444335938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 11.0, 5.0, 6.0, 25.0, 17.0, 25.0, 33.0, 49.0, 92.0, 117.0, 189.0, 283.0, 455.0, 821.0, 1499.0, 3210.0, 8174.0, 26818.0, 116443.0, 502370.0, 302082.0, 59764.0, 15642.0, 5353.0, 2325.0, 1137.0, 589.0, 354.0, 220.0, 125.0, 96.0, 54.0, 41.0, 33.0, 27.0, 16.0, 14.0, 11.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.4296875, -4.305908203125, -4.18212890625, -4.058349609375, -3.9345703125, -3.810791015625, -3.68701171875, -3.563232421875, -3.439453125, -3.315673828125, -3.19189453125, -3.068115234375, -2.9443359375, -2.820556640625, -2.69677734375, -2.572998046875, -2.44921875, -2.325439453125, -2.20166015625, -2.077880859375, -1.9541015625, -1.830322265625, -1.70654296875, -1.582763671875, -1.458984375, -1.335205078125, -1.21142578125, -1.087646484375, -0.9638671875, -0.840087890625, -0.71630859375, -0.592529296875, -0.46875, -0.344970703125, -0.22119140625, -0.097412109375, 0.0263671875, 0.150146484375, 0.27392578125, 0.397705078125, 0.521484375, 0.645263671875, 0.76904296875, 0.892822265625, 1.0166015625, 1.140380859375, 1.26416015625, 1.387939453125, 1.51171875, 1.635498046875, 1.75927734375, 1.883056640625, 2.0068359375, 2.130615234375, 2.25439453125, 2.378173828125, 2.501953125, 2.625732421875, 2.74951171875, 2.873291015625, 2.9970703125, 3.120849609375, 3.24462890625, 3.368408203125, 3.4921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 6.0, 2.0, 10.0, 9.0, 8.0, 12.0, 11.0, 22.0, 17.0, 30.0, 21.0, 30.0, 26.0, 32.0, 45.0, 56.0, 54.0, 66.0, 60.0, 57.0, 60.0, 57.0, 38.0, 53.0, 35.0, 27.0, 22.0, 27.0, 11.0, 9.0, 14.0, 14.0, 15.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7353515625, -1.686309814453125, -1.63726806640625, -1.588226318359375, -1.5391845703125, -1.490142822265625, -1.44110107421875, -1.392059326171875, -1.343017578125, -1.293975830078125, -1.24493408203125, -1.195892333984375, -1.1468505859375, -1.097808837890625, -1.04876708984375, -0.999725341796875, -0.95068359375, -0.901641845703125, -0.85260009765625, -0.803558349609375, -0.7545166015625, -0.705474853515625, -0.65643310546875, -0.607391357421875, -0.558349609375, -0.509307861328125, -0.46026611328125, -0.411224365234375, -0.3621826171875, -0.313140869140625, -0.26409912109375, -0.215057373046875, -0.166015625, -0.116973876953125, -0.06793212890625, -0.018890380859375, 0.0301513671875, 0.079193115234375, 0.12823486328125, 0.177276611328125, 0.226318359375, 0.275360107421875, 0.32440185546875, 0.373443603515625, 0.4224853515625, 0.471527099609375, 0.52056884765625, 0.569610595703125, 0.61865234375, 0.667694091796875, 0.71673583984375, 0.765777587890625, 0.8148193359375, 0.863861083984375, 0.91290283203125, 0.961944580078125, 1.010986328125, 1.060028076171875, 1.10906982421875, 1.158111572265625, 1.2071533203125, 1.256195068359375, 1.30523681640625, 1.354278564453125, 1.4033203125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 36.0, 125.0, 327.0, 312.0, 135.0, 34.0, 9.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.84950637817383, -33.287010192871094, -30.724512100219727, -28.16201400756836, -25.599517822265625, -23.03702163696289, -20.474523544311523, -17.912025451660156, -15.349529266357422, -12.787032127380371, -10.22453498840332, -7.6620378494262695, -5.099540710449219, -2.537043571472168, 0.025453567504882812, 2.58795166015625, 5.150447845458984, 7.712944984436035, 10.275442123413086, 12.837939262390137, 15.400436401367188, 17.962932586669922, 20.52543067932129, 23.087928771972656, 25.65042495727539, 28.212921142578125, 30.775419235229492, 33.33791732788086, 35.900413513183594, 38.46290969848633, 41.02540588378906, 43.58790588378906, 46.15040588378906, 48.7129020690918, 51.27539825439453, 53.83789825439453, 56.400394439697266, 58.962890625, 61.525390625, 64.087890625, 66.65038299560547, 69.21288299560547, 71.77537536621094, 74.33787536621094, 76.90037536621094, 79.4628677368164, 82.0253677368164, 84.58786010742188, 87.15036010742188, 89.71286010742188, 92.27535247802734, 94.83785247802734, 97.40034484863281, 99.96284484863281, 102.52534484863281, 105.08784484863281, 107.65033721923828, 110.21283721923828, 112.77532958984375, 115.33782958984375, 117.90032958984375, 120.46282196044922, 123.02532196044922, 125.58781433105469, 128.1503143310547]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 10.0, 5.0, 17.0, 22.0, 19.0, 26.0, 35.0, 52.0, 61.0, 64.0, 69.0, 62.0, 74.0, 72.0, 62.0, 65.0, 50.0, 49.0, 35.0, 41.0, 28.0, 26.0, 21.0, 8.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.126251220703125, -35.01819610595703, -33.91013717651367, -32.80208206176758, -31.69402503967285, -30.585968017578125, -29.47791290283203, -28.369855880737305, -27.261798858642578, -26.15374183654785, -25.045684814453125, -23.93762969970703, -22.829572677612305, -21.721515655517578, -20.613460540771484, -19.505403518676758, -18.39734649658203, -17.289289474487305, -16.181232452392578, -15.073177337646484, -13.965120315551758, -12.857063293457031, -11.749007225036621, -10.640951156616211, -9.532894134521484, -8.424837112426758, -7.316781044006348, -6.208724498748779, -5.100667953491211, -3.9926114082336426, -2.884554862976074, -1.7764983177185059, -0.6684417724609375, 0.43961477279663086, 1.5476713180541992, 2.6557278633117676, 3.763784408569336, 4.871840953826904, 5.979897499084473, 7.087954044342041, 8.19601058959961, 9.304067611694336, 10.412123680114746, 11.520179748535156, 12.628236770629883, 13.73629379272461, 14.84434986114502, 15.95240592956543, 17.060462951660156, 18.168519973754883, 19.27657699584961, 20.384632110595703, 21.49268913269043, 22.600746154785156, 23.70880126953125, 24.816858291625977, 25.924915313720703, 27.03297233581543, 28.141029357910156, 29.24908447265625, 30.357141494750977, 31.465198516845703, 32.5732536315918, 33.681312561035156, 34.78936767578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 13.0, 30.0, 40.0, 86.0, 183.0, 565.0, 2491.0, 44380.0, 4127901.0, 16316.0, 1588.0, 392.0, 154.0, 69.0, 28.0, 15.0, 10.0, 0.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.96875, -29.98193359375, -28.9951171875, -28.00830078125, -27.021484375, -26.03466796875, -25.0478515625, -24.06103515625, -23.07421875, -22.08740234375, -21.1005859375, -20.11376953125, -19.126953125, -18.14013671875, -17.1533203125, -16.16650390625, -15.1796875, -14.19287109375, -13.2060546875, -12.21923828125, -11.232421875, -10.24560546875, -9.2587890625, -8.27197265625, -7.28515625, -6.29833984375, -5.3115234375, -4.32470703125, -3.337890625, -2.35107421875, -1.3642578125, -0.37744140625, 0.609375, 1.59619140625, 2.5830078125, 3.56982421875, 4.556640625, 5.54345703125, 6.5302734375, 7.51708984375, 8.50390625, 9.49072265625, 10.4775390625, 11.46435546875, 12.451171875, 13.43798828125, 14.4248046875, 15.41162109375, 16.3984375, 17.38525390625, 18.3720703125, 19.35888671875, 20.345703125, 21.33251953125, 22.3193359375, 23.30615234375, 24.29296875, 25.27978515625, 26.2666015625, 27.25341796875, 28.240234375, 29.22705078125, 30.2138671875, 31.20068359375, 32.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 16.0, 34.0, 45.0, 131.0, 153.0, 170.0, 179.0, 112.0, 59.0, 32.0, 23.0, 9.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3422088623046875, -1.296722412109375, -1.2512359619140625, -1.20574951171875, -1.1602630615234375, -1.114776611328125, -1.0692901611328125, -1.0238037109375, -0.9783172607421875, -0.932830810546875, -0.8873443603515625, -0.84185791015625, -0.7963714599609375, -0.750885009765625, -0.7053985595703125, -0.659912109375, -0.6144256591796875, -0.568939208984375, -0.5234527587890625, -0.47796630859375, -0.4324798583984375, -0.386993408203125, -0.3415069580078125, -0.2960205078125, -0.2505340576171875, -0.205047607421875, -0.1595611572265625, -0.11407470703125, -0.0685882568359375, -0.023101806640625, 0.0223846435546875, 0.06787109375, 0.1133575439453125, 0.158843994140625, 0.2043304443359375, 0.24981689453125, 0.2953033447265625, 0.340789794921875, 0.3862762451171875, 0.4317626953125, 0.4772491455078125, 0.522735595703125, 0.5682220458984375, 0.61370849609375, 0.6591949462890625, 0.704681396484375, 0.7501678466796875, 0.795654296875, 0.8411407470703125, 0.886627197265625, 0.9321136474609375, 0.97760009765625, 1.0230865478515625, 1.068572998046875, 1.1140594482421875, 1.1595458984375, 1.2050323486328125, 1.250518798828125, 1.2960052490234375, 1.34149169921875, 1.3869781494140625, 1.432464599609375, 1.4779510498046875, 1.5234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 13.0, 17.0, 26.0, 36.0, 65.0, 104.0, 167.0, 283.0, 631.0, 1388.0, 3452.0, 10703.0, 41698.0, 268221.0, 3452413.0, 344594.0, 50404.0, 12739.0, 4092.0, 1603.0, 719.0, 342.0, 204.0, 128.0, 101.0, 44.0, 40.0, 18.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.58697509765625, -5.3497314453125, -5.11248779296875, -4.875244140625, -4.63800048828125, -4.4007568359375, -4.16351318359375, -3.92626953125, -3.68902587890625, -3.4517822265625, -3.21453857421875, -2.977294921875, -2.74005126953125, -2.5028076171875, -2.26556396484375, -2.0283203125, -1.79107666015625, -1.5538330078125, -1.31658935546875, -1.079345703125, -0.84210205078125, -0.6048583984375, -0.36761474609375, -0.13037109375, 0.10687255859375, 0.3441162109375, 0.58135986328125, 0.818603515625, 1.05584716796875, 1.2930908203125, 1.53033447265625, 1.767578125, 2.00482177734375, 2.2420654296875, 2.47930908203125, 2.716552734375, 2.95379638671875, 3.1910400390625, 3.42828369140625, 3.66552734375, 3.90277099609375, 4.1400146484375, 4.37725830078125, 4.614501953125, 4.85174560546875, 5.0889892578125, 5.32623291015625, 5.5634765625, 5.80072021484375, 6.0379638671875, 6.27520751953125, 6.512451171875, 6.74969482421875, 6.9869384765625, 7.22418212890625, 7.46142578125, 7.69866943359375, 7.9359130859375, 8.17315673828125, 8.410400390625, 8.64764404296875, 8.8848876953125, 9.12213134765625, 9.359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 6.0, 10.0, 21.0, 18.0, 40.0, 54.0, 82.0, 141.0, 238.0, 593.0, 1649.0, 538.0, 251.0, 130.0, 93.0, 44.0, 38.0, 34.0, 22.0, 14.0, 16.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.509765625, -1.454833984375, -1.39990234375, -1.344970703125, -1.2900390625, -1.235107421875, -1.18017578125, -1.125244140625, -1.0703125, -1.015380859375, -0.96044921875, -0.905517578125, -0.8505859375, -0.795654296875, -0.74072265625, -0.685791015625, -0.630859375, -0.575927734375, -0.52099609375, -0.466064453125, -0.4111328125, -0.356201171875, -0.30126953125, -0.246337890625, -0.19140625, -0.136474609375, -0.08154296875, -0.026611328125, 0.0283203125, 0.083251953125, 0.13818359375, 0.193115234375, 0.248046875, 0.302978515625, 0.35791015625, 0.412841796875, 0.4677734375, 0.522705078125, 0.57763671875, 0.632568359375, 0.6875, 0.742431640625, 0.79736328125, 0.852294921875, 0.9072265625, 0.962158203125, 1.01708984375, 1.072021484375, 1.126953125, 1.181884765625, 1.23681640625, 1.291748046875, 1.3466796875, 1.401611328125, 1.45654296875, 1.511474609375, 1.56640625, 1.621337890625, 1.67626953125, 1.731201171875, 1.7861328125, 1.841064453125, 1.89599609375, 1.950927734375, 2.005859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 19.0, 105.0, 345.0, 347.0, 140.0, 32.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.855146408081055, -11.008855819702148, -10.162564277648926, -9.31627368927002, -8.469982147216797, -7.623691558837891, -6.777400970458984, -5.93110990524292, -5.0848188400268555, -4.238527774810791, -3.3922369480133057, -2.5459461212158203, -1.6996550559997559, -0.8533639907836914, -0.007073402404785156, 0.8392176628112793, 1.6855087280273438, 2.531799793243408, 3.3780906200408936, 4.224381446838379, 5.070672512054443, 5.916963577270508, 6.763254165649414, 7.6095452308654785, 8.455836296081543, 9.30212688446045, 10.148418426513672, 10.994709014892578, 11.840999603271484, 12.687291145324707, 13.533581733703613, 14.379873275756836, 15.226165771484375, 16.07245635986328, 16.918746948242188, 17.765037536621094, 18.611330032348633, 19.45762062072754, 20.303911209106445, 21.15020179748535, 21.99649429321289, 22.842784881591797, 23.689075469970703, 24.53536605834961, 25.38165855407715, 26.227949142456055, 27.07423973083496, 27.920530319213867, 28.766820907592773, 29.61311149597168, 30.459402084350586, 31.305694580078125, 32.15198516845703, 32.99827575683594, 33.844566345214844, 34.69085693359375, 35.537147521972656, 36.38343811035156, 37.22972869873047, 38.076019287109375, 38.92230987548828, 39.76860046386719, 40.614891052246094, 41.461185455322266, 42.30747604370117]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 4.0, 10.0, 11.0, 7.0, 14.0, 18.0, 22.0, 24.0, 25.0, 30.0, 26.0, 38.0, 28.0, 41.0, 48.0, 49.0, 42.0, 36.0, 35.0, 39.0, 35.0, 40.0, 27.0, 36.0, 40.0, 37.0, 31.0, 34.0, 23.0, 12.0, 27.0, 16.0, 14.0, 11.0, 11.0, 5.0, 7.0, 9.0, 7.0, 2.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.717405319213867, -4.558929920196533, -4.400454044342041, -4.241978645324707, -4.083503246307373, -3.925027370452881, -3.766551971435547, -3.608076333999634, -3.4496006965637207, -3.2911250591278076, -3.1326496601104736, -2.9741740226745605, -2.8156983852386475, -2.6572227478027344, -2.4987473487854004, -2.3402717113494873, -2.1817963123321533, -2.0233206748962402, -1.8648451566696167, -1.7063696384429932, -1.54789400100708, -1.3894184827804565, -1.230942964553833, -1.07246732711792, -0.9139918088912964, -0.7555162310600281, -0.5970406532287598, -0.43856513500213623, -0.2800895571708679, -0.12161397933959961, 0.036861538887023926, 0.195337176322937, 0.35381269454956055, 0.5122882723808289, 0.6707638502120972, 0.8292393684387207, 0.987714946269989, 1.1461905241012573, 1.3046660423278809, 1.463141679763794, 1.6216171979904175, 1.780092716217041, 1.938568353652954, 2.097043991088867, 2.255519390106201, 2.4139950275421143, 2.5724706649780273, 2.7309460639953613, 2.8894217014312744, 3.0478973388671875, 3.2063727378845215, 3.3648483753204346, 3.5233240127563477, 3.6817994117736816, 3.8402750492095947, 3.998750686645508, 4.157226085662842, 4.315701484680176, 4.474177360534668, 4.632652759552002, 4.791128158569336, 4.949604034423828, 5.108079433441162, 5.266554832458496, 5.425030708312988]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 21.0, 31.0, 52.0, 63.0, 93.0, 154.0, 251.0, 370.0, 661.0, 1131.0, 2161.0, 4941.0, 15229.0, 68105.0, 409965.0, 443947.0, 74735.0, 16182.0, 5145.0, 2307.0, 1169.0, 641.0, 426.0, 250.0, 160.0, 108.0, 74.0, 30.0, 30.0, 21.0, 20.0, 10.0, 12.0, 2.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3887939453125, -6.176025390625, -5.9632568359375, -5.75048828125, -5.5377197265625, -5.324951171875, -5.1121826171875, -4.8994140625, -4.6866455078125, -4.473876953125, -4.2611083984375, -4.04833984375, -3.8355712890625, -3.622802734375, -3.4100341796875, -3.197265625, -2.9844970703125, -2.771728515625, -2.5589599609375, -2.34619140625, -2.1334228515625, -1.920654296875, -1.7078857421875, -1.4951171875, -1.2823486328125, -1.069580078125, -0.8568115234375, -0.64404296875, -0.4312744140625, -0.218505859375, -0.0057373046875, 0.20703125, 0.4197998046875, 0.632568359375, 0.8453369140625, 1.05810546875, 1.2708740234375, 1.483642578125, 1.6964111328125, 1.9091796875, 2.1219482421875, 2.334716796875, 2.5474853515625, 2.76025390625, 2.9730224609375, 3.185791015625, 3.3985595703125, 3.611328125, 3.8240966796875, 4.036865234375, 4.2496337890625, 4.46240234375, 4.6751708984375, 4.887939453125, 5.1007080078125, 5.3134765625, 5.5262451171875, 5.739013671875, 5.9517822265625, 6.16455078125, 6.3773193359375, 6.590087890625, 6.8028564453125, 7.015625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 13.0, 25.0, 61.0, 76.0, 121.0, 162.0, 131.0, 129.0, 104.0, 66.0, 40.0, 21.0, 14.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.37109375, -1.32720947265625, -1.2833251953125, -1.23944091796875, -1.195556640625, -1.15167236328125, -1.1077880859375, -1.06390380859375, -1.02001953125, -0.97613525390625, -0.9322509765625, -0.88836669921875, -0.844482421875, -0.80059814453125, -0.7567138671875, -0.71282958984375, -0.6689453125, -0.62506103515625, -0.5811767578125, -0.53729248046875, -0.493408203125, -0.44952392578125, -0.4056396484375, -0.36175537109375, -0.31787109375, -0.27398681640625, -0.2301025390625, -0.18621826171875, -0.142333984375, -0.09844970703125, -0.0545654296875, -0.01068115234375, 0.033203125, 0.07708740234375, 0.1209716796875, 0.16485595703125, 0.208740234375, 0.25262451171875, 0.2965087890625, 0.34039306640625, 0.38427734375, 0.42816162109375, 0.4720458984375, 0.51593017578125, 0.559814453125, 0.60369873046875, 0.6475830078125, 0.69146728515625, 0.7353515625, 0.77923583984375, 0.8231201171875, 0.86700439453125, 0.910888671875, 0.95477294921875, 0.9986572265625, 1.04254150390625, 1.08642578125, 1.13031005859375, 1.1741943359375, 1.21807861328125, 1.261962890625, 1.30584716796875, 1.3497314453125, 1.39361572265625, 1.4375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 8.0, 7.0, 8.0, 12.0, 30.0, 39.0, 43.0, 83.0, 120.0, 195.0, 393.0, 649.0, 1136.0, 2526.0, 6490.0, 23549.0, 113214.0, 514090.0, 304733.0, 59462.0, 13431.0, 4345.0, 1773.0, 821.0, 530.0, 305.0, 180.0, 119.0, 86.0, 44.0, 40.0, 23.0, 22.0, 15.0, 9.0, 6.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.0625, -8.82891845703125, -8.5953369140625, -8.36175537109375, -8.128173828125, -7.89459228515625, -7.6610107421875, -7.42742919921875, -7.19384765625, -6.96026611328125, -6.7266845703125, -6.49310302734375, -6.259521484375, -6.02593994140625, -5.7923583984375, -5.55877685546875, -5.3251953125, -5.09161376953125, -4.8580322265625, -4.62445068359375, -4.390869140625, -4.15728759765625, -3.9237060546875, -3.69012451171875, -3.45654296875, -3.22296142578125, -2.9893798828125, -2.75579833984375, -2.522216796875, -2.28863525390625, -2.0550537109375, -1.82147216796875, -1.587890625, -1.35430908203125, -1.1207275390625, -0.88714599609375, -0.653564453125, -0.41998291015625, -0.1864013671875, 0.04718017578125, 0.28076171875, 0.51434326171875, 0.7479248046875, 0.98150634765625, 1.215087890625, 1.44866943359375, 1.6822509765625, 1.91583251953125, 2.1494140625, 2.38299560546875, 2.6165771484375, 2.85015869140625, 3.083740234375, 3.31732177734375, 3.5509033203125, 3.78448486328125, 4.01806640625, 4.25164794921875, 4.4852294921875, 4.71881103515625, 4.952392578125, 5.18597412109375, 5.4195556640625, 5.65313720703125, 5.88671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 13.0, 24.0, 19.0, 20.0, 32.0, 42.0, 22.0, 32.0, 37.0, 38.0, 46.0, 66.0, 63.0, 40.0, 63.0, 51.0, 50.0, 39.0, 43.0, 31.0, 32.0, 26.0, 32.0, 14.0, 17.0, 16.0, 9.0, 17.0, 8.0, 11.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 5.0], "bins": [-5.55859375, -5.420257568359375, -5.28192138671875, -5.143585205078125, -5.0052490234375, -4.866912841796875, -4.72857666015625, -4.590240478515625, -4.451904296875, -4.313568115234375, -4.17523193359375, -4.036895751953125, -3.8985595703125, -3.760223388671875, -3.62188720703125, -3.483551025390625, -3.34521484375, -3.206878662109375, -3.06854248046875, -2.930206298828125, -2.7918701171875, -2.653533935546875, -2.51519775390625, -2.376861572265625, -2.238525390625, -2.100189208984375, -1.96185302734375, -1.823516845703125, -1.6851806640625, -1.546844482421875, -1.40850830078125, -1.270172119140625, -1.1318359375, -0.993499755859375, -0.85516357421875, -0.716827392578125, -0.5784912109375, -0.440155029296875, -0.30181884765625, -0.163482666015625, -0.025146484375, 0.113189697265625, 0.25152587890625, 0.389862060546875, 0.5281982421875, 0.666534423828125, 0.80487060546875, 0.943206787109375, 1.08154296875, 1.219879150390625, 1.35821533203125, 1.496551513671875, 1.6348876953125, 1.773223876953125, 1.91156005859375, 2.049896240234375, 2.188232421875, 2.326568603515625, 2.46490478515625, 2.603240966796875, 2.7415771484375, 2.879913330078125, 3.01824951171875, 3.156585693359375, 3.294921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 8.0, 8.0, 8.0, 10.0, 21.0, 21.0, 36.0, 57.0, 69.0, 125.0, 198.0, 385.0, 695.0, 1389.0, 2993.0, 7247.0, 20762.0, 71213.0, 331404.0, 466183.0, 101203.0, 27950.0, 9343.0, 3703.0, 1700.0, 768.0, 425.0, 234.0, 140.0, 86.0, 51.0, 34.0, 20.0, 21.0, 13.0, 14.0, 11.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.62420654296875, -3.4906005859375, -3.35699462890625, -3.223388671875, -3.08978271484375, -2.9561767578125, -2.82257080078125, -2.68896484375, -2.55535888671875, -2.4217529296875, -2.28814697265625, -2.154541015625, -2.02093505859375, -1.8873291015625, -1.75372314453125, -1.6201171875, -1.48651123046875, -1.3529052734375, -1.21929931640625, -1.085693359375, -0.95208740234375, -0.8184814453125, -0.68487548828125, -0.55126953125, -0.41766357421875, -0.2840576171875, -0.15045166015625, -0.016845703125, 0.11676025390625, 0.2503662109375, 0.38397216796875, 0.517578125, 0.65118408203125, 0.7847900390625, 0.91839599609375, 1.052001953125, 1.18560791015625, 1.3192138671875, 1.45281982421875, 1.58642578125, 1.72003173828125, 1.8536376953125, 1.98724365234375, 2.120849609375, 2.25445556640625, 2.3880615234375, 2.52166748046875, 2.6552734375, 2.78887939453125, 2.9224853515625, 3.05609130859375, 3.189697265625, 3.32330322265625, 3.4569091796875, 3.59051513671875, 3.72412109375, 3.85772705078125, 3.9913330078125, 4.12493896484375, 4.258544921875, 4.39215087890625, 4.5257568359375, 4.65936279296875, 4.79296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 11.0, 13.0, 7.0, 14.0, 16.0, 27.0, 27.0, 48.0, 59.0, 107.0, 139.0, 153.0, 113.0, 50.0, 34.0, 47.0, 24.0, 19.0, 16.0, 8.0, 10.0, 9.0, 7.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005202293395996094, -0.0004986226558685303, -0.00047701597213745117, -0.00045540928840637207, -0.00043380260467529297, -0.00041219592094421387, -0.00039058923721313477, -0.00036898255348205566, -0.00034737586975097656, -0.00032576918601989746, -0.00030416250228881836, -0.00028255581855773926, -0.00026094913482666016, -0.00023934245109558105, -0.00021773576736450195, -0.00019612908363342285, -0.00017452239990234375, -0.00015291571617126465, -0.00013130903244018555, -0.00010970234870910645, -8.809566497802734e-05, -6.648898124694824e-05, -4.488229751586914e-05, -2.327561378479004e-05, -1.6689300537109375e-06, 1.9937753677368164e-05, 4.1544437408447266e-05, 6.315112113952637e-05, 8.475780487060547e-05, 0.00010636448860168457, 0.00012797117233276367, 0.00014957785606384277, 0.00017118453979492188, 0.00019279122352600098, 0.00021439790725708008, 0.00023600459098815918, 0.0002576112747192383, 0.0002792179584503174, 0.0003008246421813965, 0.0003224313259124756, 0.0003440380096435547, 0.0003656446933746338, 0.0003872513771057129, 0.000408858060836792, 0.0004304647445678711, 0.0004520714282989502, 0.0004736781120300293, 0.0004952847957611084, 0.0005168914794921875, 0.0005384981632232666, 0.0005601048469543457, 0.0005817115306854248, 0.0006033182144165039, 0.000624924898147583, 0.0006465315818786621, 0.0006681382656097412, 0.0006897449493408203, 0.0007113516330718994, 0.0007329583168029785, 0.0007545650005340576, 0.0007761716842651367, 0.0007977783679962158, 0.0008193850517272949, 0.000840991735458374, 0.0008625984191894531]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 11.0, 11.0, 12.0, 20.0, 47.0, 74.0, 107.0, 239.0, 556.0, 1461.0, 4722.0, 30747.0, 598746.0, 383375.0, 22244.0, 3927.0, 1238.0, 495.0, 223.0, 109.0, 66.0, 42.0, 33.0, 16.0, 14.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.34375, -10.047607421875, -9.75146484375, -9.455322265625, -9.1591796875, -8.863037109375, -8.56689453125, -8.270751953125, -7.974609375, -7.678466796875, -7.38232421875, -7.086181640625, -6.7900390625, -6.493896484375, -6.19775390625, -5.901611328125, -5.60546875, -5.309326171875, -5.01318359375, -4.717041015625, -4.4208984375, -4.124755859375, -3.82861328125, -3.532470703125, -3.236328125, -2.940185546875, -2.64404296875, -2.347900390625, -2.0517578125, -1.755615234375, -1.45947265625, -1.163330078125, -0.8671875, -0.571044921875, -0.27490234375, 0.021240234375, 0.3173828125, 0.613525390625, 0.90966796875, 1.205810546875, 1.501953125, 1.798095703125, 2.09423828125, 2.390380859375, 2.6865234375, 2.982666015625, 3.27880859375, 3.574951171875, 3.87109375, 4.167236328125, 4.46337890625, 4.759521484375, 5.0556640625, 5.351806640625, 5.64794921875, 5.944091796875, 6.240234375, 6.536376953125, 6.83251953125, 7.128662109375, 7.4248046875, 7.720947265625, 8.01708984375, 8.313232421875, 8.609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 9.0, 19.0, 29.0, 40.0, 59.0, 88.0, 123.0, 123.0, 137.0, 92.0, 63.0, 48.0, 44.0, 33.0, 15.0, 15.0, 13.0, 9.0, 4.0, 7.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.47686767578125, -4.3521728515625, -4.22747802734375, -4.102783203125, -3.97808837890625, -3.8533935546875, -3.72869873046875, -3.60400390625, -3.47930908203125, -3.3546142578125, -3.22991943359375, -3.105224609375, -2.98052978515625, -2.8558349609375, -2.73114013671875, -2.6064453125, -2.48175048828125, -2.3570556640625, -2.23236083984375, -2.107666015625, -1.98297119140625, -1.8582763671875, -1.73358154296875, -1.60888671875, -1.48419189453125, -1.3594970703125, -1.23480224609375, -1.110107421875, -0.98541259765625, -0.8607177734375, -0.73602294921875, -0.611328125, -0.48663330078125, -0.3619384765625, -0.23724365234375, -0.112548828125, 0.01214599609375, 0.1368408203125, 0.26153564453125, 0.38623046875, 0.51092529296875, 0.6356201171875, 0.76031494140625, 0.885009765625, 1.00970458984375, 1.1343994140625, 1.25909423828125, 1.3837890625, 1.50848388671875, 1.6331787109375, 1.75787353515625, 1.882568359375, 2.00726318359375, 2.1319580078125, 2.25665283203125, 2.38134765625, 2.50604248046875, 2.6307373046875, 2.75543212890625, 2.880126953125, 3.00482177734375, 3.1295166015625, 3.25421142578125, 3.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 23.0, 64.0, 249.0, 397.0, 195.0, 49.0, 12.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.4267349243164, -64.8946762084961, -61.36262130737305, -57.830562591552734, -54.29850769042969, -50.766448974609375, -47.23439025878906, -43.70233154296875, -40.1702766418457, -36.63821792602539, -33.106163024902344, -29.57410430908203, -26.04204750061035, -22.509990692138672, -18.97793197631836, -15.44587516784668, -11.913818359375, -8.38176155090332, -4.849703788757324, -1.3176460266113281, 2.2144107818603516, 5.746467590332031, 9.278526306152344, 12.810583114624023, 16.342639923095703, 19.874696731567383, 23.406753540039062, 26.938812255859375, 30.470869064331055, 34.002925872802734, 37.53498458862305, 41.067039489746094, 44.59910583496094, 48.13116455078125, 51.6632194519043, 55.19527816772461, 58.727333068847656, 62.25939178466797, 65.79145050048828, 69.3235092163086, 72.85556030273438, 76.38761901855469, 79.919677734375, 83.45173645019531, 86.9837875366211, 90.5158462524414, 94.04790496826172, 97.57996368408203, 101.11202239990234, 104.64408111572266, 108.17613983154297, 111.70819091796875, 115.24024963378906, 118.77230834960938, 122.30436706542969, 125.83642578125, 129.3684844970703, 132.90054321289062, 136.43260192871094, 139.96466064453125, 143.49671936035156, 147.02877807617188, 150.56082153320312, 154.09288024902344, 157.62493896484375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 9.0, 15.0, 11.0, 23.0, 22.0, 21.0, 33.0, 26.0, 40.0, 42.0, 39.0, 46.0, 35.0, 55.0, 59.0, 51.0, 52.0, 32.0, 39.0, 49.0, 38.0, 50.0, 40.0, 24.0, 28.0, 19.0, 22.0, 13.0, 20.0, 12.0, 11.0, 10.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.921775817871094, -37.93449783325195, -36.94721984863281, -35.95994186401367, -34.97266387939453, -33.98538589477539, -32.99810791015625, -32.010826110839844, -31.023550033569336, -30.036272048950195, -29.048994064331055, -28.061716079711914, -27.07443618774414, -26.087158203125, -25.09988021850586, -24.11260223388672, -23.125324249267578, -22.138046264648438, -21.150768280029297, -20.163490295410156, -19.176212310791016, -18.188934326171875, -17.2016544342041, -16.21437644958496, -15.22709846496582, -14.23982048034668, -13.252542495727539, -12.265263557434082, -11.277985572814941, -10.2907075881958, -9.303428649902344, -8.316150665283203, -7.3288726806640625, -6.341594696044922, -5.354316234588623, -4.367037773132324, -3.3797597885131836, -2.392481803894043, -1.4052033424377441, -0.4179248809814453, 0.5693531036376953, 1.556631326675415, 2.5439095497131348, 3.5311877727508545, 4.518465995788574, 5.505743980407715, 6.493022441864014, 7.4803009033203125, 8.467578887939453, 9.454856872558594, 10.442134857177734, 11.429413795471191, 12.416691780090332, 13.403969764709473, 14.39124870300293, 15.37852668762207, 16.36580467224121, 17.35308265686035, 18.340360641479492, 19.327638626098633, 20.314918518066406, 21.302196502685547, 22.289474487304688, 23.276752471923828, 24.26403045654297]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 12.0, 3.0, 10.0, 9.0, 20.0, 34.0, 58.0, 107.0, 214.0, 425.0, 868.0, 2402.0, 9318.0, 71125.0, 3832436.0, 252975.0, 18120.0, 3785.0, 1253.0, 502.0, 268.0, 129.0, 80.0, 36.0, 33.0, 19.0, 7.0, 8.0, 4.0, 7.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.5390625, -10.216796875, -9.89453125, -9.572265625, -9.25, -8.927734375, -8.60546875, -8.283203125, -7.9609375, -7.638671875, -7.31640625, -6.994140625, -6.671875, -6.349609375, -6.02734375, -5.705078125, -5.3828125, -5.060546875, -4.73828125, -4.416015625, -4.09375, -3.771484375, -3.44921875, -3.126953125, -2.8046875, -2.482421875, -2.16015625, -1.837890625, -1.515625, -1.193359375, -0.87109375, -0.548828125, -0.2265625, 0.095703125, 0.41796875, 0.740234375, 1.0625, 1.384765625, 1.70703125, 2.029296875, 2.3515625, 2.673828125, 2.99609375, 3.318359375, 3.640625, 3.962890625, 4.28515625, 4.607421875, 4.9296875, 5.251953125, 5.57421875, 5.896484375, 6.21875, 6.541015625, 6.86328125, 7.185546875, 7.5078125, 7.830078125, 8.15234375, 8.474609375, 8.796875, 9.119140625, 9.44140625, 9.763671875, 10.0859375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 10.0, 14.0, 21.0, 49.0, 53.0, 66.0, 86.0, 112.0, 112.0, 110.0, 96.0, 77.0, 64.0, 42.0, 32.0, 20.0, 7.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4326171875, -1.385894775390625, -1.33917236328125, -1.292449951171875, -1.2457275390625, -1.199005126953125, -1.15228271484375, -1.105560302734375, -1.058837890625, -1.012115478515625, -0.96539306640625, -0.918670654296875, -0.8719482421875, -0.825225830078125, -0.77850341796875, -0.731781005859375, -0.68505859375, -0.638336181640625, -0.59161376953125, -0.544891357421875, -0.4981689453125, -0.451446533203125, -0.40472412109375, -0.358001708984375, -0.311279296875, -0.264556884765625, -0.21783447265625, -0.171112060546875, -0.1243896484375, -0.077667236328125, -0.03094482421875, 0.015777587890625, 0.0625, 0.109222412109375, 0.15594482421875, 0.202667236328125, 0.2493896484375, 0.296112060546875, 0.34283447265625, 0.389556884765625, 0.436279296875, 0.483001708984375, 0.52972412109375, 0.576446533203125, 0.6231689453125, 0.669891357421875, 0.71661376953125, 0.763336181640625, 0.81005859375, 0.856781005859375, 0.90350341796875, 0.950225830078125, 0.9969482421875, 1.043670654296875, 1.09039306640625, 1.137115478515625, 1.183837890625, 1.230560302734375, 1.27728271484375, 1.324005126953125, 1.3707275390625, 1.417449951171875, 1.46417236328125, 1.510894775390625, 1.5576171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 12.0, 14.0, 27.0, 37.0, 52.0, 99.0, 190.0, 382.0, 805.0, 1818.0, 4545.0, 12592.0, 39945.0, 175513.0, 2727820.0, 1063548.0, 120218.0, 29847.0, 9731.0, 3696.0, 1663.0, 830.0, 401.0, 207.0, 122.0, 72.0, 38.0, 27.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.815704345703125, -3.64898681640625, -3.482269287109375, -3.3155517578125, -3.148834228515625, -2.98211669921875, -2.815399169921875, -2.648681640625, -2.481964111328125, -2.31524658203125, -2.148529052734375, -1.9818115234375, -1.815093994140625, -1.64837646484375, -1.481658935546875, -1.31494140625, -1.148223876953125, -0.98150634765625, -0.814788818359375, -0.6480712890625, -0.481353759765625, -0.31463623046875, -0.147918701171875, 0.018798828125, 0.185516357421875, 0.35223388671875, 0.518951416015625, 0.6856689453125, 0.852386474609375, 1.01910400390625, 1.185821533203125, 1.3525390625, 1.519256591796875, 1.68597412109375, 1.852691650390625, 2.0194091796875, 2.186126708984375, 2.35284423828125, 2.519561767578125, 2.686279296875, 2.852996826171875, 3.01971435546875, 3.186431884765625, 3.3531494140625, 3.519866943359375, 3.68658447265625, 3.853302001953125, 4.02001953125, 4.186737060546875, 4.35345458984375, 4.520172119140625, 4.6868896484375, 4.853607177734375, 5.02032470703125, 5.187042236328125, 5.353759765625, 5.520477294921875, 5.68719482421875, 5.853912353515625, 6.0206298828125, 6.187347412109375, 6.35406494140625, 6.520782470703125, 6.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 15.0, 17.0, 15.0, 26.0, 27.0, 37.0, 34.0, 68.0, 124.0, 171.0, 245.0, 618.0, 1406.0, 494.0, 246.0, 170.0, 86.0, 65.0, 44.0, 37.0, 26.0, 16.0, 17.0, 16.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.02813720703125, -0.9859619140625, -0.94378662109375, -0.901611328125, -0.85943603515625, -0.8172607421875, -0.77508544921875, -0.73291015625, -0.69073486328125, -0.6485595703125, -0.60638427734375, -0.564208984375, -0.52203369140625, -0.4798583984375, -0.43768310546875, -0.3955078125, -0.35333251953125, -0.3111572265625, -0.26898193359375, -0.226806640625, -0.18463134765625, -0.1424560546875, -0.10028076171875, -0.05810546875, -0.01593017578125, 0.0262451171875, 0.06842041015625, 0.110595703125, 0.15277099609375, 0.1949462890625, 0.23712158203125, 0.279296875, 0.32147216796875, 0.3636474609375, 0.40582275390625, 0.447998046875, 0.49017333984375, 0.5323486328125, 0.57452392578125, 0.61669921875, 0.65887451171875, 0.7010498046875, 0.74322509765625, 0.785400390625, 0.82757568359375, 0.8697509765625, 0.91192626953125, 0.9541015625, 0.99627685546875, 1.0384521484375, 1.08062744140625, 1.122802734375, 1.16497802734375, 1.2071533203125, 1.24932861328125, 1.29150390625, 1.33367919921875, 1.3758544921875, 1.41802978515625, 1.460205078125, 1.50238037109375, 1.5445556640625, 1.58673095703125, 1.62890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 38.0, 56.0, 129.0, 158.0, 202.0, 186.0, 130.0, 52.0, 29.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.782783508300781, -6.3131513595581055, -5.8435187339782715, -5.373886585235596, -4.904253959655762, -4.434621810913086, -3.96498966217041, -3.4953572750091553, -3.0257248878479004, -2.5560925006866455, -2.0864601135253906, -1.6168279647827148, -1.14719557762146, -0.6775631904602051, -0.2079310417175293, 0.2617013454437256, 0.7313337326049805, 1.2009661197662354, 1.6705983877182007, 2.140230655670166, 2.609863042831421, 3.079495429992676, 3.5491275787353516, 4.018759727478027, 4.488392353057861, 4.958024501800537, 5.427657127380371, 5.897289276123047, 6.366921424865723, 6.836554050445557, 7.306186199188232, 7.775818824768066, 8.245450973510742, 8.715083122253418, 9.184715270996094, 9.654348373413086, 10.123980522155762, 10.593612670898438, 11.063244819641113, 11.532876968383789, 12.002510070800781, 12.472142219543457, 12.941774368286133, 13.411407470703125, 13.8810396194458, 14.350671768188477, 14.820303916931152, 15.289936065673828, 15.759568214416504, 16.22920036315918, 16.698833465576172, 17.16846466064453, 17.638097763061523, 18.107730865478516, 18.577362060546875, 19.046995162963867, 19.516626358032227, 19.98625946044922, 20.455890655517578, 20.92552375793457, 21.39515495300293, 21.864788055419922, 22.33441925048828, 22.804052352905273, 23.273685455322266]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 10.0, 13.0, 10.0, 12.0, 17.0, 20.0, 16.0, 18.0, 21.0, 27.0, 28.0, 36.0, 38.0, 38.0, 36.0, 50.0, 33.0, 41.0, 52.0, 25.0, 39.0, 40.0, 37.0, 29.0, 38.0, 28.0, 26.0, 23.0, 28.0, 34.0, 16.0, 17.0, 16.0, 15.0, 8.0, 9.0, 6.0, 6.0, 9.0, 7.0, 9.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.587404251098633, -4.446531772613525, -4.30565881729126, -4.164786338806152, -4.023913383483887, -3.8830409049987793, -3.742168426513672, -3.6012957096099854, -3.460422992706299, -3.3195502758026123, -3.178677558898926, -3.0378050804138184, -2.896932363510132, -2.7560596466064453, -2.615187168121338, -2.4743144512176514, -2.333441734313965, -2.1925690174102783, -2.051696300506592, -1.9108238220214844, -1.7699511051177979, -1.6290783882141113, -1.4882057905197144, -1.3473331928253174, -1.2064604759216309, -1.0655877590179443, -0.9247151613235474, -0.7838425040245056, -0.6429698467254639, -0.5020971894264221, -0.36122453212738037, -0.22035187482833862, -0.07947874069213867, 0.061393916606903076, 0.20226657390594482, 0.3431392312049866, 0.4840118885040283, 0.6248845458030701, 0.7657572031021118, 0.9066298604011536, 1.0475025177001953, 1.1883752346038818, 1.3292478322982788, 1.4701204299926758, 1.6109931468963623, 1.7518658638000488, 1.8927384614944458, 2.0336110591888428, 2.1744837760925293, 2.315356492996216, 2.4562292098999023, 2.5971016883850098, 2.7379744052886963, 2.878847122192383, 3.0197196006774902, 3.1605923175811768, 3.3014650344848633, 3.44233775138855, 3.5832104682922363, 3.7240829467773438, 3.8649556636810303, 4.005828380584717, 4.146700859069824, 4.28757381439209, 4.428446292877197]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 0.0, 7.0, 5.0, 4.0, 6.0, 9.0, 13.0, 16.0, 22.0, 27.0, 39.0, 44.0, 71.0, 98.0, 145.0, 185.0, 270.0, 447.0, 676.0, 1188.0, 2166.0, 4299.0, 9657.0, 23719.0, 63461.0, 174577.0, 372555.0, 244901.0, 91066.0, 33224.0, 13249.0, 5708.0, 2744.0, 1528.0, 762.0, 514.0, 343.0, 241.0, 147.0, 114.0, 92.0, 53.0, 61.0, 32.0, 17.0, 19.0, 7.0, 10.0, 10.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.8515625, -3.72601318359375, -3.6004638671875, -3.47491455078125, -3.349365234375, -3.22381591796875, -3.0982666015625, -2.97271728515625, -2.84716796875, -2.72161865234375, -2.5960693359375, -2.47052001953125, -2.344970703125, -2.21942138671875, -2.0938720703125, -1.96832275390625, -1.8427734375, -1.71722412109375, -1.5916748046875, -1.46612548828125, -1.340576171875, -1.21502685546875, -1.0894775390625, -0.96392822265625, -0.83837890625, -0.71282958984375, -0.5872802734375, -0.46173095703125, -0.336181640625, -0.21063232421875, -0.0850830078125, 0.04046630859375, 0.166015625, 0.29156494140625, 0.4171142578125, 0.54266357421875, 0.668212890625, 0.79376220703125, 0.9193115234375, 1.04486083984375, 1.17041015625, 1.29595947265625, 1.4215087890625, 1.54705810546875, 1.672607421875, 1.79815673828125, 1.9237060546875, 2.04925537109375, 2.1748046875, 2.30035400390625, 2.4259033203125, 2.55145263671875, 2.677001953125, 2.80255126953125, 2.9281005859375, 3.05364990234375, 3.17919921875, 3.30474853515625, 3.4302978515625, 3.55584716796875, 3.681396484375, 3.80694580078125, 3.9324951171875, 4.05804443359375, 4.18359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 8.0, 11.0, 26.0, 41.0, 56.0, 85.0, 97.0, 95.0, 126.0, 104.0, 103.0, 79.0, 69.0, 31.0, 22.0, 13.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.398101806640625, -1.34893798828125, -1.299774169921875, -1.2506103515625, -1.201446533203125, -1.15228271484375, -1.103118896484375, -1.053955078125, -1.004791259765625, -0.95562744140625, -0.906463623046875, -0.8572998046875, -0.808135986328125, -0.75897216796875, -0.709808349609375, -0.66064453125, -0.611480712890625, -0.56231689453125, -0.513153076171875, -0.4639892578125, -0.414825439453125, -0.36566162109375, -0.316497802734375, -0.267333984375, -0.218170166015625, -0.16900634765625, -0.119842529296875, -0.0706787109375, -0.021514892578125, 0.02764892578125, 0.076812744140625, 0.1259765625, 0.175140380859375, 0.22430419921875, 0.273468017578125, 0.3226318359375, 0.371795654296875, 0.42095947265625, 0.470123291015625, 0.519287109375, 0.568450927734375, 0.61761474609375, 0.666778564453125, 0.7159423828125, 0.765106201171875, 0.81427001953125, 0.863433837890625, 0.91259765625, 0.961761474609375, 1.01092529296875, 1.060089111328125, 1.1092529296875, 1.158416748046875, 1.20758056640625, 1.256744384765625, 1.305908203125, 1.355072021484375, 1.40423583984375, 1.453399658203125, 1.5025634765625, 1.551727294921875, 1.60089111328125, 1.650054931640625, 1.69921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 12.0, 16.0, 23.0, 39.0, 48.0, 56.0, 96.0, 119.0, 167.0, 341.0, 524.0, 807.0, 1408.0, 2865.0, 6778.0, 19428.0, 63447.0, 210098.0, 433060.0, 212419.0, 64069.0, 19351.0, 6728.0, 2947.0, 1427.0, 832.0, 485.0, 328.0, 190.0, 137.0, 94.0, 66.0, 44.0, 30.0, 19.0, 19.0, 14.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.77117919921875, -4.6243896484375, -4.47760009765625, -4.330810546875, -4.18402099609375, -4.0372314453125, -3.89044189453125, -3.74365234375, -3.59686279296875, -3.4500732421875, -3.30328369140625, -3.156494140625, -3.00970458984375, -2.8629150390625, -2.71612548828125, -2.5693359375, -2.42254638671875, -2.2757568359375, -2.12896728515625, -1.982177734375, -1.83538818359375, -1.6885986328125, -1.54180908203125, -1.39501953125, -1.24822998046875, -1.1014404296875, -0.95465087890625, -0.807861328125, -0.66107177734375, -0.5142822265625, -0.36749267578125, -0.220703125, -0.07391357421875, 0.0728759765625, 0.21966552734375, 0.366455078125, 0.51324462890625, 0.6600341796875, 0.80682373046875, 0.95361328125, 1.10040283203125, 1.2471923828125, 1.39398193359375, 1.540771484375, 1.68756103515625, 1.8343505859375, 1.98114013671875, 2.1279296875, 2.27471923828125, 2.4215087890625, 2.56829833984375, 2.715087890625, 2.86187744140625, 3.0086669921875, 3.15545654296875, 3.30224609375, 3.44903564453125, 3.5958251953125, 3.74261474609375, 3.889404296875, 4.03619384765625, 4.1829833984375, 4.32977294921875, 4.4765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 11.0, 10.0, 17.0, 8.0, 8.0, 15.0, 23.0, 29.0, 34.0, 44.0, 46.0, 47.0, 46.0, 46.0, 47.0, 51.0, 76.0, 45.0, 52.0, 33.0, 37.0, 49.0, 32.0, 29.0, 23.0, 24.0, 21.0, 17.0, 13.0, 11.0, 14.0, 12.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.33087158203125, -4.1812744140625, -4.03167724609375, -3.882080078125, -3.73248291015625, -3.5828857421875, -3.43328857421875, -3.28369140625, -3.13409423828125, -2.9844970703125, -2.83489990234375, -2.685302734375, -2.53570556640625, -2.3861083984375, -2.23651123046875, -2.0869140625, -1.93731689453125, -1.7877197265625, -1.63812255859375, -1.488525390625, -1.33892822265625, -1.1893310546875, -1.03973388671875, -0.89013671875, -0.74053955078125, -0.5909423828125, -0.44134521484375, -0.291748046875, -0.14215087890625, 0.0074462890625, 0.15704345703125, 0.306640625, 0.45623779296875, 0.6058349609375, 0.75543212890625, 0.905029296875, 1.05462646484375, 1.2042236328125, 1.35382080078125, 1.50341796875, 1.65301513671875, 1.8026123046875, 1.95220947265625, 2.101806640625, 2.25140380859375, 2.4010009765625, 2.55059814453125, 2.7001953125, 2.84979248046875, 2.9993896484375, 3.14898681640625, 3.298583984375, 3.44818115234375, 3.5977783203125, 3.74737548828125, 3.89697265625, 4.04656982421875, 4.1961669921875, 4.34576416015625, 4.495361328125, 4.64495849609375, 4.7945556640625, 4.94415283203125, 5.09375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 8.0, 9.0, 13.0, 18.0, 27.0, 32.0, 51.0, 88.0, 148.0, 252.0, 448.0, 1002.0, 2130.0, 5126.0, 13384.0, 42179.0, 164168.0, 495154.0, 236949.0, 58092.0, 17648.0, 6411.0, 2684.0, 1204.0, 557.0, 320.0, 169.0, 114.0, 57.0, 41.0, 29.0, 19.0, 16.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.8607177734375, -2.770263671875, -2.6798095703125, -2.58935546875, -2.4989013671875, -2.408447265625, -2.3179931640625, -2.2275390625, -2.1370849609375, -2.046630859375, -1.9561767578125, -1.86572265625, -1.7752685546875, -1.684814453125, -1.5943603515625, -1.50390625, -1.4134521484375, -1.322998046875, -1.2325439453125, -1.14208984375, -1.0516357421875, -0.961181640625, -0.8707275390625, -0.7802734375, -0.6898193359375, -0.599365234375, -0.5089111328125, -0.41845703125, -0.3280029296875, -0.237548828125, -0.1470947265625, -0.056640625, 0.0338134765625, 0.124267578125, 0.2147216796875, 0.30517578125, 0.3956298828125, 0.486083984375, 0.5765380859375, 0.6669921875, 0.7574462890625, 0.847900390625, 0.9383544921875, 1.02880859375, 1.1192626953125, 1.209716796875, 1.3001708984375, 1.390625, 1.4810791015625, 1.571533203125, 1.6619873046875, 1.75244140625, 1.8428955078125, 1.933349609375, 2.0238037109375, 2.1142578125, 2.2047119140625, 2.295166015625, 2.3856201171875, 2.47607421875, 2.5665283203125, 2.656982421875, 2.7474365234375, 2.837890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 13.0, 13.0, 16.0, 27.0, 23.0, 55.0, 49.0, 109.0, 169.0, 168.0, 121.0, 81.0, 54.0, 27.0, 18.0, 11.0, 15.0, 13.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005216598510742188, -0.00049571692943573, -0.0004697740077972412, -0.00044383108615875244, -0.00041788816452026367, -0.0003919452428817749, -0.00036600232124328613, -0.00034005939960479736, -0.0003141164779663086, -0.0002881735563278198, -0.00026223063468933105, -0.00023628771305084229, -0.00021034479141235352, -0.00018440186977386475, -0.00015845894813537598, -0.0001325160264968872, -0.00010657310485839844, -8.063018321990967e-05, -5.46872615814209e-05, -2.874433994293213e-05, -2.8014183044433594e-06, 2.314150333404541e-05, 4.908442497253418e-05, 7.502734661102295e-05, 0.00010097026824951172, 0.0001269131898880005, 0.00015285611152648926, 0.00017879903316497803, 0.0002047419548034668, 0.00023068487644195557, 0.00025662779808044434, 0.0002825707197189331, 0.0003085136413574219, 0.00033445656299591064, 0.0003603994846343994, 0.0003863424062728882, 0.00041228532791137695, 0.0004382282495498657, 0.0004641711711883545, 0.0004901140928268433, 0.000516057014465332, 0.0005419999361038208, 0.0005679428577423096, 0.0005938857793807983, 0.0006198287010192871, 0.0006457716226577759, 0.0006717145442962646, 0.0006976574659347534, 0.0007236003875732422, 0.000749543309211731, 0.0007754862308502197, 0.0008014291524887085, 0.0008273720741271973, 0.000853314995765686, 0.0008792579174041748, 0.0009052008390426636, 0.0009311437606811523, 0.0009570866823196411, 0.0009830296039581299, 0.0010089725255966187, 0.0010349154472351074, 0.0010608583688735962, 0.001086801290512085, 0.0011127442121505737, 0.0011386871337890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 9.0, 19.0, 30.0, 57.0, 104.0, 201.0, 465.0, 1240.0, 4619.0, 29383.0, 403852.0, 560374.0, 40009.0, 5716.0, 1485.0, 515.0, 220.0, 118.0, 73.0, 26.0, 16.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.01727294921875, -3.8431396484375, -3.66900634765625, -3.494873046875, -3.32073974609375, -3.1466064453125, -2.97247314453125, -2.79833984375, -2.62420654296875, -2.4500732421875, -2.27593994140625, -2.101806640625, -1.92767333984375, -1.7535400390625, -1.57940673828125, -1.4052734375, -1.23114013671875, -1.0570068359375, -0.88287353515625, -0.708740234375, -0.53460693359375, -0.3604736328125, -0.18634033203125, -0.01220703125, 0.16192626953125, 0.3360595703125, 0.51019287109375, 0.684326171875, 0.85845947265625, 1.0325927734375, 1.20672607421875, 1.380859375, 1.55499267578125, 1.7291259765625, 1.90325927734375, 2.077392578125, 2.25152587890625, 2.4256591796875, 2.59979248046875, 2.77392578125, 2.94805908203125, 3.1221923828125, 3.29632568359375, 3.470458984375, 3.64459228515625, 3.8187255859375, 3.99285888671875, 4.1669921875, 4.34112548828125, 4.5152587890625, 4.68939208984375, 4.863525390625, 5.03765869140625, 5.2117919921875, 5.38592529296875, 5.56005859375, 5.73419189453125, 5.9083251953125, 6.08245849609375, 6.256591796875, 6.43072509765625, 6.6048583984375, 6.77899169921875, 6.953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 10.0, 8.0, 7.0, 16.0, 20.0, 41.0, 58.0, 100.0, 130.0, 166.0, 141.0, 123.0, 62.0, 55.0, 32.0, 23.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.744476318359375, -2.62371826171875, -2.502960205078125, -2.3822021484375, -2.261444091796875, -2.14068603515625, -2.019927978515625, -1.899169921875, -1.778411865234375, -1.65765380859375, -1.536895751953125, -1.4161376953125, -1.295379638671875, -1.17462158203125, -1.053863525390625, -0.93310546875, -0.812347412109375, -0.69158935546875, -0.570831298828125, -0.4500732421875, -0.329315185546875, -0.20855712890625, -0.087799072265625, 0.032958984375, 0.153717041015625, 0.27447509765625, 0.395233154296875, 0.5159912109375, 0.636749267578125, 0.75750732421875, 0.878265380859375, 0.9990234375, 1.119781494140625, 1.24053955078125, 1.361297607421875, 1.4820556640625, 1.602813720703125, 1.72357177734375, 1.844329833984375, 1.965087890625, 2.085845947265625, 2.20660400390625, 2.327362060546875, 2.4481201171875, 2.568878173828125, 2.68963623046875, 2.810394287109375, 2.93115234375, 3.051910400390625, 3.17266845703125, 3.293426513671875, 3.4141845703125, 3.534942626953125, 3.65570068359375, 3.776458740234375, 3.897216796875, 4.017974853515625, 4.13873291015625, 4.259490966796875, 4.3802490234375, 4.501007080078125, 4.62176513671875, 4.742523193359375, 4.86328125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 8.0, 12.0, 14.0, 9.0, 22.0, 32.0, 57.0, 73.0, 105.0, 131.0, 110.0, 96.0, 92.0, 79.0, 58.0, 41.0, 26.0, 11.0, 8.0, 4.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.80368423461914, -21.86678123474121, -20.92987823486328, -19.99297332763672, -19.05607032775879, -18.11916732788086, -17.18226432800293, -16.245361328125, -15.308457374572754, -14.371554374694824, -13.434650421142578, -12.497747421264648, -11.560844421386719, -10.623940467834473, -9.687037467956543, -8.750133514404297, -7.813230514526367, -6.876327037811279, -5.939423561096191, -5.002520561218262, -4.065617084503174, -3.128713607788086, -2.1918106079101562, -1.2549071311950684, -0.31800365447998047, 0.6188997030258179, 1.5558030605316162, 2.492706298828125, 3.429609775543213, 4.366513252258301, 5.3034162521362305, 6.240319728851318, 7.177223205566406, 8.114126205444336, 9.051030158996582, 9.987933158874512, 10.924837112426758, 11.861740112304688, 12.798643112182617, 13.735546112060547, 14.672450065612793, 15.609353065490723, 16.54625701904297, 17.4831600189209, 18.420063018798828, 19.35696792602539, 20.293869018554688, 21.23077392578125, 22.16767692565918, 23.10457992553711, 24.04148292541504, 24.97838592529297, 25.91529083251953, 26.85219383239746, 27.78909683227539, 28.72599983215332, 29.66290283203125, 30.59980583190918, 31.53670883178711, 32.47361373901367, 33.41051483154297, 34.34741973876953, 35.284324645996094, 36.22122573852539, 37.15813064575195]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 8.0, 4.0, 10.0, 12.0, 11.0, 22.0, 17.0, 12.0, 21.0, 25.0, 26.0, 25.0, 29.0, 32.0, 52.0, 47.0, 41.0, 48.0, 51.0, 39.0, 41.0, 45.0, 47.0, 34.0, 33.0, 46.0, 32.0, 27.0, 28.0, 26.0, 23.0, 19.0, 8.0, 10.0, 7.0, 4.0, 3.0, 4.0, 5.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-25.314834594726562, -24.57830810546875, -23.841781616210938, -23.105255126953125, -22.368730545043945, -21.632204055786133, -20.89567756652832, -20.159151077270508, -19.422626495361328, -18.686100006103516, -17.949573516845703, -17.21304702758789, -16.47652244567871, -15.739995956420898, -15.003469467163086, -14.266942977905273, -13.530416488647461, -12.793889999389648, -12.057364463806152, -11.32083797454834, -10.584312438964844, -9.847785949707031, -9.111259460449219, -8.374732971191406, -7.63820743560791, -6.901681423187256, -6.165155410766602, -5.428628921508789, -4.692102909088135, -3.9555768966674805, -3.219050407409668, -2.4825243949890137, -1.7459983825683594, -1.0094722509384155, -0.2729461193084717, 0.4635801315307617, 1.200106143951416, 1.9366321563720703, 2.673158645629883, 3.409684658050537, 4.146210670471191, 4.882736682891846, 5.6192626953125, 6.3557891845703125, 7.092315196990967, 7.828841209411621, 8.565367698669434, 9.30189323425293, 10.038419723510742, 10.774946212768555, 11.51147174835205, 12.247998237609863, 12.98452377319336, 13.721050262451172, 14.457576751708984, 15.194103240966797, 15.930628776550293, 16.66715431213379, 17.4036808013916, 18.140207290649414, 18.876733779907227, 19.613258361816406, 20.34978485107422, 21.08631134033203, 21.822837829589844]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 13.0, 8.0, 14.0, 20.0, 28.0, 53.0, 79.0, 126.0, 227.0, 459.0, 1019.0, 2403.0, 6889.0, 29207.0, 299973.0, 3743975.0, 88307.0, 14459.0, 4044.0, 1505.0, 680.0, 339.0, 188.0, 111.0, 54.0, 32.0, 27.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.35430908203125, -7.1031494140625, -6.85198974609375, -6.600830078125, -6.34967041015625, -6.0985107421875, -5.84735107421875, -5.59619140625, -5.34503173828125, -5.0938720703125, -4.84271240234375, -4.591552734375, -4.34039306640625, -4.0892333984375, -3.83807373046875, -3.5869140625, -3.33575439453125, -3.0845947265625, -2.83343505859375, -2.582275390625, -2.33111572265625, -2.0799560546875, -1.82879638671875, -1.57763671875, -1.32647705078125, -1.0753173828125, -0.82415771484375, -0.572998046875, -0.32183837890625, -0.0706787109375, 0.18048095703125, 0.431640625, 0.68280029296875, 0.9339599609375, 1.18511962890625, 1.436279296875, 1.68743896484375, 1.9385986328125, 2.18975830078125, 2.44091796875, 2.69207763671875, 2.9432373046875, 3.19439697265625, 3.445556640625, 3.69671630859375, 3.9478759765625, 4.19903564453125, 4.4501953125, 4.70135498046875, 4.9525146484375, 5.20367431640625, 5.454833984375, 5.70599365234375, 5.9571533203125, 6.20831298828125, 6.45947265625, 6.71063232421875, 6.9617919921875, 7.21295166015625, 7.464111328125, 7.71527099609375, 7.9664306640625, 8.21759033203125, 8.46875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 9.0, 17.0, 15.0, 25.0, 44.0, 46.0, 71.0, 89.0, 92.0, 99.0, 104.0, 83.0, 80.0, 69.0, 41.0, 35.0, 32.0, 16.0, 9.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.3122100830078125, -1.265045166015625, -1.2178802490234375, -1.17071533203125, -1.1235504150390625, -1.076385498046875, -1.0292205810546875, -0.9820556640625, -0.9348907470703125, -0.887725830078125, -0.8405609130859375, -0.79339599609375, -0.7462310791015625, -0.699066162109375, -0.6519012451171875, -0.604736328125, -0.5575714111328125, -0.510406494140625, -0.4632415771484375, -0.41607666015625, -0.3689117431640625, -0.321746826171875, -0.2745819091796875, -0.2274169921875, -0.1802520751953125, -0.133087158203125, -0.0859222412109375, -0.03875732421875, 0.0084075927734375, 0.055572509765625, 0.1027374267578125, 0.14990234375, 0.1970672607421875, 0.244232177734375, 0.2913970947265625, 0.33856201171875, 0.3857269287109375, 0.432891845703125, 0.4800567626953125, 0.5272216796875, 0.5743865966796875, 0.621551513671875, 0.6687164306640625, 0.71588134765625, 0.7630462646484375, 0.810211181640625, 0.8573760986328125, 0.904541015625, 0.9517059326171875, 0.998870849609375, 1.0460357666015625, 1.09320068359375, 1.1403656005859375, 1.187530517578125, 1.2346954345703125, 1.2818603515625, 1.3290252685546875, 1.376190185546875, 1.4233551025390625, 1.47052001953125, 1.5176849365234375, 1.564849853515625, 1.6120147705078125, 1.6591796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 12.0, 11.0, 27.0, 31.0, 35.0, 77.0, 112.0, 170.0, 295.0, 481.0, 852.0, 1575.0, 3006.0, 6740.0, 17120.0, 52642.0, 243078.0, 3173605.0, 562587.0, 88732.0, 25204.0, 9344.0, 4110.0, 1964.0, 1038.0, 562.0, 335.0, 202.0, 116.0, 79.0, 38.0, 35.0, 15.0, 11.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.8984375, -4.74859619140625, -4.5987548828125, -4.44891357421875, -4.299072265625, -4.14923095703125, -3.9993896484375, -3.84954833984375, -3.69970703125, -3.54986572265625, -3.4000244140625, -3.25018310546875, -3.100341796875, -2.95050048828125, -2.8006591796875, -2.65081787109375, -2.5009765625, -2.35113525390625, -2.2012939453125, -2.05145263671875, -1.901611328125, -1.75177001953125, -1.6019287109375, -1.45208740234375, -1.30224609375, -1.15240478515625, -1.0025634765625, -0.85272216796875, -0.702880859375, -0.55303955078125, -0.4031982421875, -0.25335693359375, -0.103515625, 0.04632568359375, 0.1961669921875, 0.34600830078125, 0.495849609375, 0.64569091796875, 0.7955322265625, 0.94537353515625, 1.09521484375, 1.24505615234375, 1.3948974609375, 1.54473876953125, 1.694580078125, 1.84442138671875, 1.9942626953125, 2.14410400390625, 2.2939453125, 2.44378662109375, 2.5936279296875, 2.74346923828125, 2.893310546875, 3.04315185546875, 3.1929931640625, 3.34283447265625, 3.49267578125, 3.64251708984375, 3.7923583984375, 3.94219970703125, 4.092041015625, 4.24188232421875, 4.3917236328125, 4.54156494140625, 4.69140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 8.0, 12.0, 13.0, 17.0, 24.0, 24.0, 31.0, 41.0, 72.0, 98.0, 179.0, 350.0, 869.0, 1272.0, 401.0, 203.0, 123.0, 84.0, 61.0, 47.0, 17.0, 17.0, 15.0, 11.0, 12.0, 7.0, 5.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2412109375, -1.20001220703125, -1.1588134765625, -1.11761474609375, -1.076416015625, -1.03521728515625, -0.9940185546875, -0.95281982421875, -0.91162109375, -0.87042236328125, -0.8292236328125, -0.78802490234375, -0.746826171875, -0.70562744140625, -0.6644287109375, -0.62322998046875, -0.58203125, -0.54083251953125, -0.4996337890625, -0.45843505859375, -0.417236328125, -0.37603759765625, -0.3348388671875, -0.29364013671875, -0.25244140625, -0.21124267578125, -0.1700439453125, -0.12884521484375, -0.087646484375, -0.04644775390625, -0.0052490234375, 0.03594970703125, 0.0771484375, 0.11834716796875, 0.1595458984375, 0.20074462890625, 0.241943359375, 0.28314208984375, 0.3243408203125, 0.36553955078125, 0.40673828125, 0.44793701171875, 0.4891357421875, 0.53033447265625, 0.571533203125, 0.61273193359375, 0.6539306640625, 0.69512939453125, 0.736328125, 0.77752685546875, 0.8187255859375, 0.85992431640625, 0.901123046875, 0.94232177734375, 0.9835205078125, 1.02471923828125, 1.06591796875, 1.10711669921875, 1.1483154296875, 1.18951416015625, 1.230712890625, 1.27191162109375, 1.3131103515625, 1.35430908203125, 1.3955078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 23.0, 45.0, 68.0, 133.0, 184.0, 196.0, 139.0, 94.0, 62.0, 22.0, 15.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.871591567993164, -6.447042465209961, -6.022493362426758, -5.597944259643555, -5.173395156860352, -4.748846054077148, -4.3242974281311035, -3.8997483253479004, -3.4751992225646973, -3.050650119781494, -2.626101016998291, -2.201552152633667, -1.7770030498504639, -1.3524539470672607, -0.9279050827026367, -0.5033559799194336, -0.07880687713623047, 0.3457421660423279, 0.7702912092208862, 1.1948401927947998, 1.619389295578003, 2.043938398361206, 2.46848726272583, 2.893036365509033, 3.3175854682922363, 3.7421345710754395, 4.166683673858643, 4.5912322998046875, 5.015781402587891, 5.440330505371094, 5.864879608154297, 6.2894287109375, 6.713977813720703, 7.138526916503906, 7.563076019287109, 7.9876251220703125, 8.412174224853516, 8.836723327636719, 9.261272430419922, 9.685821533203125, 10.110370635986328, 10.534919738769531, 10.959468841552734, 11.384017944335938, 11.80856704711914, 12.233116149902344, 12.657665252685547, 13.08221435546875, 13.506762504577637, 13.93131160736084, 14.355860710144043, 14.780409812927246, 15.20495891571045, 15.629508018493652, 16.05405616760254, 16.478605270385742, 16.903154373168945, 17.32770347595215, 17.75225257873535, 18.176801681518555, 18.601350784301758, 19.02589988708496, 19.450448989868164, 19.874998092651367, 20.29954719543457]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 6.0, 13.0, 22.0, 9.0, 19.0, 26.0, 35.0, 29.0, 24.0, 31.0, 36.0, 43.0, 37.0, 34.0, 39.0, 38.0, 49.0, 46.0, 50.0, 34.0, 59.0, 33.0, 35.0, 33.0, 29.0, 22.0, 12.0, 27.0, 13.0, 16.0, 22.0, 11.0, 18.0, 9.0, 8.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 3.0], "bins": [-6.211277008056641, -6.048167705535889, -5.885058403015137, -5.721949100494385, -5.558839797973633, -5.395730495452881, -5.232621192932129, -5.069511890411377, -4.906402587890625, -4.743293285369873, -4.580183982849121, -4.417074680328369, -4.253965377807617, -4.090856075286865, -3.9277467727661133, -3.7646374702453613, -3.6015284061431885, -3.4384191036224365, -3.2753098011016846, -3.1122004985809326, -2.9490911960601807, -2.7859818935394287, -2.622872829437256, -2.459763526916504, -2.296654224395752, -2.133544921875, -1.970435619354248, -1.807326316833496, -1.6442170143127441, -1.4811077117919922, -1.3179985284805298, -1.1548892259597778, -0.9917798042297363, -0.8286705017089844, -0.6655611991882324, -0.5024519562721252, -0.3393426537513733, -0.17623335123062134, -0.01312410831451416, 0.1499851942062378, 0.31309449672698975, 0.4762037992477417, 0.6393131017684937, 0.8024223446846008, 0.9655316472053528, 1.12864089012146, 1.291750192642212, 1.4548594951629639, 1.6179687976837158, 1.7810781002044678, 1.9441874027252197, 2.1072967052459717, 2.2704060077667236, 2.4335153102874756, 2.5966243743896484, 2.7597336769104004, 2.9228429794311523, 3.0859522819519043, 3.2490615844726562, 3.412170886993408, 3.57528018951416, 3.738389492034912, 3.901498794555664, 4.064608097076416, 4.227717399597168]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 11.0, 11.0, 15.0, 12.0, 26.0, 32.0, 40.0, 75.0, 97.0, 146.0, 280.0, 498.0, 853.0, 1733.0, 3530.0, 7815.0, 18807.0, 52087.0, 151414.0, 374557.0, 280288.0, 97913.0, 33950.0, 12991.0, 5631.0, 2631.0, 1327.0, 697.0, 409.0, 215.0, 147.0, 93.0, 60.0, 46.0, 28.0, 24.0, 16.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-5.015625, -4.875518798828125, -4.73541259765625, -4.595306396484375, -4.4552001953125, -4.315093994140625, -4.17498779296875, -4.034881591796875, -3.894775390625, -3.754669189453125, -3.61456298828125, -3.474456787109375, -3.3343505859375, -3.194244384765625, -3.05413818359375, -2.914031982421875, -2.77392578125, -2.633819580078125, -2.49371337890625, -2.353607177734375, -2.2135009765625, -2.073394775390625, -1.93328857421875, -1.793182373046875, -1.653076171875, -1.512969970703125, -1.37286376953125, -1.232757568359375, -1.0926513671875, -0.952545166015625, -0.81243896484375, -0.672332763671875, -0.5322265625, -0.392120361328125, -0.25201416015625, -0.111907958984375, 0.0281982421875, 0.168304443359375, 0.30841064453125, 0.448516845703125, 0.588623046875, 0.728729248046875, 0.86883544921875, 1.008941650390625, 1.1490478515625, 1.289154052734375, 1.42926025390625, 1.569366455078125, 1.70947265625, 1.849578857421875, 1.98968505859375, 2.129791259765625, 2.2698974609375, 2.410003662109375, 2.55010986328125, 2.690216064453125, 2.830322265625, 2.970428466796875, 3.11053466796875, 3.250640869140625, 3.3907470703125, 3.530853271484375, 3.67095947265625, 3.811065673828125, 3.951171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 13.0, 12.0, 29.0, 27.0, 42.0, 61.0, 81.0, 87.0, 107.0, 81.0, 92.0, 80.0, 68.0, 51.0, 45.0, 38.0, 23.0, 17.0, 10.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.283111572265625, -1.23614501953125, -1.189178466796875, -1.1422119140625, -1.095245361328125, -1.04827880859375, -1.001312255859375, -0.954345703125, -0.907379150390625, -0.86041259765625, -0.813446044921875, -0.7664794921875, -0.719512939453125, -0.67254638671875, -0.625579833984375, -0.57861328125, -0.531646728515625, -0.48468017578125, -0.437713623046875, -0.3907470703125, -0.343780517578125, -0.29681396484375, -0.249847412109375, -0.202880859375, -0.155914306640625, -0.10894775390625, -0.061981201171875, -0.0150146484375, 0.031951904296875, 0.07891845703125, 0.125885009765625, 0.1728515625, 0.219818115234375, 0.26678466796875, 0.313751220703125, 0.3607177734375, 0.407684326171875, 0.45465087890625, 0.501617431640625, 0.548583984375, 0.595550537109375, 0.64251708984375, 0.689483642578125, 0.7364501953125, 0.783416748046875, 0.83038330078125, 0.877349853515625, 0.92431640625, 0.971282958984375, 1.01824951171875, 1.065216064453125, 1.1121826171875, 1.159149169921875, 1.20611572265625, 1.253082275390625, 1.300048828125, 1.347015380859375, 1.39398193359375, 1.440948486328125, 1.4879150390625, 1.534881591796875, 1.58184814453125, 1.628814697265625, 1.67578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 14.0, 24.0, 32.0, 41.0, 62.0, 85.0, 115.0, 210.0, 371.0, 573.0, 1092.0, 2055.0, 5315.0, 18579.0, 82120.0, 361119.0, 435324.0, 106197.0, 23597.0, 6425.0, 2322.0, 1181.0, 602.0, 412.0, 244.0, 140.0, 87.0, 63.0, 44.0, 22.0, 24.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.0234375, -5.85174560546875, -5.6800537109375, -5.50836181640625, -5.336669921875, -5.16497802734375, -4.9932861328125, -4.82159423828125, -4.64990234375, -4.47821044921875, -4.3065185546875, -4.13482666015625, -3.963134765625, -3.79144287109375, -3.6197509765625, -3.44805908203125, -3.2763671875, -3.10467529296875, -2.9329833984375, -2.76129150390625, -2.589599609375, -2.41790771484375, -2.2462158203125, -2.07452392578125, -1.90283203125, -1.73114013671875, -1.5594482421875, -1.38775634765625, -1.216064453125, -1.04437255859375, -0.8726806640625, -0.70098876953125, -0.529296875, -0.35760498046875, -0.1859130859375, -0.01422119140625, 0.157470703125, 0.32916259765625, 0.5008544921875, 0.67254638671875, 0.84423828125, 1.01593017578125, 1.1876220703125, 1.35931396484375, 1.531005859375, 1.70269775390625, 1.8743896484375, 2.04608154296875, 2.2177734375, 2.38946533203125, 2.5611572265625, 2.73284912109375, 2.904541015625, 3.07623291015625, 3.2479248046875, 3.41961669921875, 3.59130859375, 3.76300048828125, 3.9346923828125, 4.10638427734375, 4.278076171875, 4.44976806640625, 4.6214599609375, 4.79315185546875, 4.96484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 10.0, 18.0, 12.0, 15.0, 21.0, 20.0, 20.0, 25.0, 27.0, 27.0, 38.0, 42.0, 48.0, 51.0, 57.0, 42.0, 49.0, 47.0, 44.0, 44.0, 36.0, 34.0, 34.0, 38.0, 35.0, 27.0, 20.0, 19.0, 18.0, 19.0, 10.0, 10.0, 8.0, 8.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.7265625, -4.596282958984375, -4.46600341796875, -4.335723876953125, -4.2054443359375, -4.075164794921875, -3.94488525390625, -3.814605712890625, -3.684326171875, -3.554046630859375, -3.42376708984375, -3.293487548828125, -3.1632080078125, -3.032928466796875, -2.90264892578125, -2.772369384765625, -2.64208984375, -2.511810302734375, -2.38153076171875, -2.251251220703125, -2.1209716796875, -1.990692138671875, -1.86041259765625, -1.730133056640625, -1.599853515625, -1.469573974609375, -1.33929443359375, -1.209014892578125, -1.0787353515625, -0.948455810546875, -0.81817626953125, -0.687896728515625, -0.5576171875, -0.427337646484375, -0.29705810546875, -0.166778564453125, -0.0364990234375, 0.093780517578125, 0.22406005859375, 0.354339599609375, 0.484619140625, 0.614898681640625, 0.74517822265625, 0.875457763671875, 1.0057373046875, 1.136016845703125, 1.26629638671875, 1.396575927734375, 1.52685546875, 1.657135009765625, 1.78741455078125, 1.917694091796875, 2.0479736328125, 2.178253173828125, 2.30853271484375, 2.438812255859375, 2.569091796875, 2.699371337890625, 2.82965087890625, 2.959930419921875, 3.0902099609375, 3.220489501953125, 3.35076904296875, 3.481048583984375, 3.611328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 2.0, 8.0, 7.0, 17.0, 29.0, 38.0, 68.0, 133.0, 221.0, 393.0, 678.0, 1264.0, 2719.0, 6271.0, 15603.0, 43588.0, 148563.0, 434922.0, 274680.0, 76619.0, 25198.0, 9653.0, 4004.0, 1857.0, 914.0, 447.0, 263.0, 149.0, 71.0, 60.0, 37.0, 28.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.966796875, -2.88818359375, -2.8095703125, -2.73095703125, -2.65234375, -2.57373046875, -2.4951171875, -2.41650390625, -2.337890625, -2.25927734375, -2.1806640625, -2.10205078125, -2.0234375, -1.94482421875, -1.8662109375, -1.78759765625, -1.708984375, -1.63037109375, -1.5517578125, -1.47314453125, -1.39453125, -1.31591796875, -1.2373046875, -1.15869140625, -1.080078125, -1.00146484375, -0.9228515625, -0.84423828125, -0.765625, -0.68701171875, -0.6083984375, -0.52978515625, -0.451171875, -0.37255859375, -0.2939453125, -0.21533203125, -0.13671875, -0.05810546875, 0.0205078125, 0.09912109375, 0.177734375, 0.25634765625, 0.3349609375, 0.41357421875, 0.4921875, 0.57080078125, 0.6494140625, 0.72802734375, 0.806640625, 0.88525390625, 0.9638671875, 1.04248046875, 1.12109375, 1.19970703125, 1.2783203125, 1.35693359375, 1.435546875, 1.51416015625, 1.5927734375, 1.67138671875, 1.75, 1.82861328125, 1.9072265625, 1.98583984375, 2.064453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 6.0, 5.0, 6.0, 16.0, 24.0, 10.0, 20.0, 29.0, 24.0, 29.0, 39.0, 75.0, 79.0, 96.0, 127.0, 75.0, 54.0, 52.0, 38.0, 34.0, 20.0, 25.0, 21.0, 9.0, 7.0, 9.0, 8.0, 1.0, 5.0, 5.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.000469207763671875, -0.00045462697744369507, -0.00044004619121551514, -0.0004254654049873352, -0.0004108846187591553, -0.00039630383253097534, -0.0003817230463027954, -0.0003671422600746155, -0.00035256147384643555, -0.0003379806876182556, -0.0003233999013900757, -0.00030881911516189575, -0.0002942383289337158, -0.0002796575427055359, -0.00026507675647735596, -0.000250495970249176, -0.0002359151840209961, -0.00022133439779281616, -0.00020675361156463623, -0.0001921728253364563, -0.00017759203910827637, -0.00016301125288009644, -0.0001484304666519165, -0.00013384968042373657, -0.00011926889419555664, -0.00010468810796737671, -9.010732173919678e-05, -7.552653551101685e-05, -6.0945749282836914e-05, -4.636496305465698e-05, -3.178417682647705e-05, -1.720339059829712e-05, -2.6226043701171875e-06, 1.1958181858062744e-05, 2.6538968086242676e-05, 4.111975431442261e-05, 5.570054054260254e-05, 7.028132677078247e-05, 8.48621129989624e-05, 9.944289922714233e-05, 0.00011402368545532227, 0.0001286044716835022, 0.00014318525791168213, 0.00015776604413986206, 0.000172346830368042, 0.00018692761659622192, 0.00020150840282440186, 0.0002160891890525818, 0.00023066997528076172, 0.00024525076150894165, 0.0002598315477371216, 0.0002744123339653015, 0.00028899312019348145, 0.0003035739064216614, 0.0003181546926498413, 0.00033273547887802124, 0.00034731626510620117, 0.0003618970513343811, 0.00037647783756256104, 0.00039105862379074097, 0.0004056394100189209, 0.00042022019624710083, 0.00043480098247528076, 0.0004493817687034607, 0.0004639625549316406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 8.0, 8.0, 12.0, 16.0, 32.0, 50.0, 65.0, 106.0, 163.0, 313.0, 560.0, 1002.0, 2397.0, 6012.0, 19611.0, 83532.0, 437272.0, 395465.0, 74077.0, 17835.0, 5711.0, 2078.0, 967.0, 513.0, 240.0, 166.0, 101.0, 72.0, 45.0, 29.0, 21.0, 11.0, 12.0, 15.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.4140625, -3.31048583984375, -3.2069091796875, -3.10333251953125, -2.999755859375, -2.89617919921875, -2.7926025390625, -2.68902587890625, -2.58544921875, -2.48187255859375, -2.3782958984375, -2.27471923828125, -2.171142578125, -2.06756591796875, -1.9639892578125, -1.86041259765625, -1.7568359375, -1.65325927734375, -1.5496826171875, -1.44610595703125, -1.342529296875, -1.23895263671875, -1.1353759765625, -1.03179931640625, -0.92822265625, -0.82464599609375, -0.7210693359375, -0.61749267578125, -0.513916015625, -0.41033935546875, -0.3067626953125, -0.20318603515625, -0.099609375, 0.00396728515625, 0.1075439453125, 0.21112060546875, 0.314697265625, 0.41827392578125, 0.5218505859375, 0.62542724609375, 0.72900390625, 0.83258056640625, 0.9361572265625, 1.03973388671875, 1.143310546875, 1.24688720703125, 1.3504638671875, 1.45404052734375, 1.5576171875, 1.66119384765625, 1.7647705078125, 1.86834716796875, 1.971923828125, 2.07550048828125, 2.1790771484375, 2.28265380859375, 2.38623046875, 2.48980712890625, 2.5933837890625, 2.69696044921875, 2.800537109375, 2.90411376953125, 3.0076904296875, 3.11126708984375, 3.21484375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 16.0, 20.0, 25.0, 34.0, 33.0, 42.0, 56.0, 76.0, 98.0, 85.0, 91.0, 91.0, 69.0, 51.0, 42.0, 35.0, 29.0, 26.0, 16.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.306365966796875, -2.23382568359375, -2.161285400390625, -2.0887451171875, -2.016204833984375, -1.94366455078125, -1.871124267578125, -1.798583984375, -1.726043701171875, -1.65350341796875, -1.580963134765625, -1.5084228515625, -1.435882568359375, -1.36334228515625, -1.290802001953125, -1.21826171875, -1.145721435546875, -1.07318115234375, -1.000640869140625, -0.9281005859375, -0.855560302734375, -0.78302001953125, -0.710479736328125, -0.637939453125, -0.565399169921875, -0.49285888671875, -0.420318603515625, -0.3477783203125, -0.275238037109375, -0.20269775390625, -0.130157470703125, -0.0576171875, 0.014923095703125, 0.08746337890625, 0.160003662109375, 0.2325439453125, 0.305084228515625, 0.37762451171875, 0.450164794921875, 0.522705078125, 0.595245361328125, 0.66778564453125, 0.740325927734375, 0.8128662109375, 0.885406494140625, 0.95794677734375, 1.030487060546875, 1.10302734375, 1.175567626953125, 1.24810791015625, 1.320648193359375, 1.3931884765625, 1.465728759765625, 1.53826904296875, 1.610809326171875, 1.683349609375, 1.755889892578125, 1.82843017578125, 1.900970458984375, 1.9735107421875, 2.046051025390625, 2.11859130859375, 2.191131591796875, 2.263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 19.0, 52.0, 124.0, 233.0, 247.0, 184.0, 95.0, 29.0, 13.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.62129211425781, -80.56230926513672, -78.50332641601562, -76.44434356689453, -74.38536071777344, -72.32637786865234, -70.26739501953125, -68.20841979980469, -66.14942932128906, -64.09044647216797, -62.031463623046875, -59.97248077392578, -57.91349792480469, -55.854515075683594, -53.795536041259766, -51.73655319213867, -49.677574157714844, -47.61859130859375, -45.559608459472656, -43.50062561035156, -41.44164276123047, -39.382659912109375, -37.32368087768555, -35.26469802856445, -33.20571517944336, -31.146732330322266, -29.087749481201172, -27.02876853942871, -24.969785690307617, -22.910802841186523, -20.851821899414062, -18.79283905029297, -16.733848571777344, -14.67486572265625, -12.615883827209473, -10.556901931762695, -8.497919082641602, -6.438936233520508, -4.3799543380737305, -2.320972442626953, -0.2619895935058594, 1.7969927787780762, 3.8559751510620117, 5.914957523345947, 7.973939895629883, 10.032922744750977, 12.091904640197754, 14.150886535644531, 16.209869384765625, 18.26885223388672, 20.327835083007812, 22.386816024780273, 24.445798873901367, 26.50478172302246, 28.563762664794922, 30.622745513916016, 32.68172836303711, 34.7407112121582, 36.7996940612793, 38.85867691040039, 40.91765594482422, 42.97663879394531, 45.035621643066406, 47.0946044921875, 49.153587341308594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 8.0, 22.0, 18.0, 25.0, 38.0, 44.0, 41.0, 47.0, 61.0, 51.0, 68.0, 69.0, 78.0, 64.0, 60.0, 53.0, 35.0, 36.0, 39.0, 27.0, 16.0, 22.0, 11.0, 20.0, 13.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.555089950561523, -24.59972381591797, -23.64435577392578, -22.688989639282227, -21.733623504638672, -20.778255462646484, -19.82288932800293, -18.867523193359375, -17.912155151367188, -16.956789016723633, -16.001420974731445, -15.04605484008789, -14.090688705444336, -13.135321617126465, -12.179954528808594, -11.224588394165039, -10.269222259521484, -9.313855171203613, -8.358489036560059, -7.4031219482421875, -6.447755336761475, -5.492388725280762, -4.537021636962891, -3.5816550254821777, -2.626288414001465, -1.6709216833114624, -0.71555495262146, 0.23981189727783203, 1.195178508758545, 2.150545120239258, 3.105912208557129, 4.061278820037842, 5.016643524169922, 5.972010135650635, 6.927376747131348, 7.882743835449219, 8.838109970092773, 9.793477058410645, 10.748844146728516, 11.70421028137207, 12.659577369689941, 13.614944458007812, 14.570310592651367, 15.525677680969238, 16.48104476928711, 17.436410903930664, 18.39177703857422, 19.347145080566406, 20.30251121520996, 21.257877349853516, 22.213245391845703, 23.168611526489258, 24.123977661132812, 25.079345703125, 26.034711837768555, 26.99007797241211, 27.945446014404297, 28.90081214904785, 29.85618019104004, 30.811546325683594, 31.76691246032715, 32.7222785949707, 33.67764663696289, 34.63301467895508, 35.58837890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 20.0, 25.0, 37.0, 64.0, 117.0, 178.0, 323.0, 687.0, 1477.0, 3564.0, 9991.0, 34349.0, 192105.0, 3405040.0, 464825.0, 58104.0, 14576.0, 4952.0, 1929.0, 881.0, 423.0, 256.0, 134.0, 73.0, 39.0, 31.0, 11.0, 9.0, 11.0, 9.0, 7.0, 2.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.5361328125, -5.349609375, -5.1630859375, -4.9765625, -4.7900390625, -4.603515625, -4.4169921875, -4.23046875, -4.0439453125, -3.857421875, -3.6708984375, -3.484375, -3.2978515625, -3.111328125, -2.9248046875, -2.73828125, -2.5517578125, -2.365234375, -2.1787109375, -1.9921875, -1.8056640625, -1.619140625, -1.4326171875, -1.24609375, -1.0595703125, -0.873046875, -0.6865234375, -0.5, -0.3134765625, -0.126953125, 0.0595703125, 0.24609375, 0.4326171875, 0.619140625, 0.8056640625, 0.9921875, 1.1787109375, 1.365234375, 1.5517578125, 1.73828125, 1.9248046875, 2.111328125, 2.2978515625, 2.484375, 2.6708984375, 2.857421875, 3.0439453125, 3.23046875, 3.4169921875, 3.603515625, 3.7900390625, 3.9765625, 4.1630859375, 4.349609375, 4.5361328125, 4.72265625, 4.9091796875, 5.095703125, 5.2822265625, 5.46875, 5.6552734375, 5.841796875, 6.0283203125, 6.21484375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 8.0, 10.0, 21.0, 28.0, 44.0, 55.0, 54.0, 80.0, 81.0, 107.0, 83.0, 82.0, 74.0, 81.0, 54.0, 28.0, 31.0, 28.0, 16.0, 9.0, 9.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.3318634033203125, -1.282867431640625, -1.2338714599609375, -1.18487548828125, -1.1358795166015625, -1.086883544921875, -1.0378875732421875, -0.9888916015625, -0.9398956298828125, -0.890899658203125, -0.8419036865234375, -0.79290771484375, -0.7439117431640625, -0.694915771484375, -0.6459197998046875, -0.596923828125, -0.5479278564453125, -0.498931884765625, -0.4499359130859375, -0.40093994140625, -0.3519439697265625, -0.302947998046875, -0.2539520263671875, -0.2049560546875, -0.1559600830078125, -0.106964111328125, -0.0579681396484375, -0.00897216796875, 0.0400238037109375, 0.089019775390625, 0.1380157470703125, 0.18701171875, 0.2360076904296875, 0.285003662109375, 0.3339996337890625, 0.38299560546875, 0.4319915771484375, 0.480987548828125, 0.5299835205078125, 0.5789794921875, 0.6279754638671875, 0.676971435546875, 0.7259674072265625, 0.77496337890625, 0.8239593505859375, 0.872955322265625, 0.9219512939453125, 0.970947265625, 1.0199432373046875, 1.068939208984375, 1.1179351806640625, 1.16693115234375, 1.2159271240234375, 1.264923095703125, 1.3139190673828125, 1.3629150390625, 1.4119110107421875, 1.460906982421875, 1.5099029541015625, 1.55889892578125, 1.6078948974609375, 1.656890869140625, 1.7058868408203125, 1.7548828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 15.0, 14.0, 17.0, 28.0, 43.0, 60.0, 109.0, 186.0, 294.0, 512.0, 1086.0, 2449.0, 5540.0, 16145.0, 58403.0, 318839.0, 3024855.0, 636303.0, 92552.0, 23206.0, 7507.0, 2974.0, 1373.0, 731.0, 378.0, 233.0, 130.0, 101.0, 70.0, 42.0, 25.0, 19.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.41241455078125, -4.2584228515625, -4.10443115234375, -3.950439453125, -3.79644775390625, -3.6424560546875, -3.48846435546875, -3.33447265625, -3.18048095703125, -3.0264892578125, -2.87249755859375, -2.718505859375, -2.56451416015625, -2.4105224609375, -2.25653076171875, -2.1025390625, -1.94854736328125, -1.7945556640625, -1.64056396484375, -1.486572265625, -1.33258056640625, -1.1785888671875, -1.02459716796875, -0.87060546875, -0.71661376953125, -0.5626220703125, -0.40863037109375, -0.254638671875, -0.10064697265625, 0.0533447265625, 0.20733642578125, 0.361328125, 0.51531982421875, 0.6693115234375, 0.82330322265625, 0.977294921875, 1.13128662109375, 1.2852783203125, 1.43927001953125, 1.59326171875, 1.74725341796875, 1.9012451171875, 2.05523681640625, 2.209228515625, 2.36322021484375, 2.5172119140625, 2.67120361328125, 2.8251953125, 2.97918701171875, 3.1331787109375, 3.28717041015625, 3.441162109375, 3.59515380859375, 3.7491455078125, 3.90313720703125, 4.05712890625, 4.21112060546875, 4.3651123046875, 4.51910400390625, 4.673095703125, 4.82708740234375, 4.9810791015625, 5.13507080078125, 5.2890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 11.0, 16.0, 17.0, 27.0, 36.0, 48.0, 56.0, 127.0, 145.0, 249.0, 430.0, 997.0, 778.0, 433.0, 221.0, 147.0, 89.0, 52.0, 46.0, 33.0, 32.0, 21.0, 4.0, 10.0, 4.0, 12.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.833984375, -1.7706298828125, -1.707275390625, -1.6439208984375, -1.58056640625, -1.5172119140625, -1.453857421875, -1.3905029296875, -1.3271484375, -1.2637939453125, -1.200439453125, -1.1370849609375, -1.07373046875, -1.0103759765625, -0.947021484375, -0.8836669921875, -0.8203125, -0.7569580078125, -0.693603515625, -0.6302490234375, -0.56689453125, -0.5035400390625, -0.440185546875, -0.3768310546875, -0.3134765625, -0.2501220703125, -0.186767578125, -0.1234130859375, -0.06005859375, 0.0032958984375, 0.066650390625, 0.1300048828125, 0.193359375, 0.2567138671875, 0.320068359375, 0.3834228515625, 0.44677734375, 0.5101318359375, 0.573486328125, 0.6368408203125, 0.7001953125, 0.7635498046875, 0.826904296875, 0.8902587890625, 0.95361328125, 1.0169677734375, 1.080322265625, 1.1436767578125, 1.20703125, 1.2703857421875, 1.333740234375, 1.3970947265625, 1.46044921875, 1.5238037109375, 1.587158203125, 1.6505126953125, 1.7138671875, 1.7772216796875, 1.840576171875, 1.9039306640625, 1.96728515625, 2.0306396484375, 2.093994140625, 2.1573486328125, 2.220703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 31.0, 54.0, 106.0, 161.0, 166.0, 181.0, 137.0, 85.0, 40.0, 22.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.774612426757812, -19.061376571655273, -18.3481388092041, -17.634902954101562, -16.921667098999023, -16.208431243896484, -15.495193481445312, -14.781957626342773, -14.068721771240234, -13.355484962463379, -12.64224910736084, -11.929012298583984, -11.215776443481445, -10.50253963470459, -9.789302825927734, -9.076066970825195, -8.36283016204834, -7.649593830108643, -6.936357498168945, -6.22312068939209, -5.509884834289551, -4.796648025512695, -4.083411693572998, -3.370175361633301, -2.6569390296936035, -1.9437026977539062, -1.2304662466049194, -0.5172297954559326, 0.19600653648376465, 0.9092428684234619, 1.6224794387817383, 2.3357157707214355, 3.048952102661133, 3.76218843460083, 4.475424766540527, 5.188661575317383, 5.901897430419922, 6.615134239196777, 7.328370571136475, 8.041606903076172, 8.754842758178711, 9.468079566955566, 10.181315422058105, 10.894552230834961, 11.6077880859375, 12.321024894714355, 13.034261703491211, 13.74749755859375, 14.460734367370605, 15.173971176147461, 15.88720703125, 16.60044288635254, 17.31368064880371, 18.02691650390625, 18.74015235900879, 19.453388214111328, 20.1666259765625, 20.87986183166504, 21.59309959411621, 22.30633544921875, 23.01957130432129, 23.732807159423828, 24.446044921875, 25.15928077697754, 25.872516632080078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 10.0, 10.0, 23.0, 18.0, 13.0, 19.0, 20.0, 28.0, 18.0, 29.0, 28.0, 31.0, 23.0, 35.0, 40.0, 42.0, 43.0, 52.0, 44.0, 37.0, 40.0, 37.0, 30.0, 33.0, 28.0, 23.0, 31.0, 22.0, 34.0, 22.0, 22.0, 13.0, 17.0, 7.0, 13.0, 7.0, 6.0, 6.0, 13.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.53273344039917, -6.3186116218566895, -6.104490280151367, -5.890368461608887, -5.6762471199035645, -5.462125301361084, -5.248003959655762, -5.033882141113281, -4.819760322570801, -4.60563850402832, -4.391517162322998, -4.177395343780518, -3.9632740020751953, -3.749152183532715, -3.5350306034088135, -3.320909023284912, -3.10678768157959, -2.8926661014556885, -2.678544521331787, -2.4644227027893066, -2.2503013610839844, -2.036179542541504, -1.8220579624176025, -1.6079363822937012, -1.3938148021697998, -1.1796932220458984, -0.9655715823173523, -0.7514499425888062, -0.5373283624649048, -0.3232067823410034, -0.1090850830078125, 0.10503649711608887, 0.31915855407714844, 0.5332801342010498, 0.747401773929596, 0.9615234136581421, 1.1756449937820435, 1.3897665739059448, 1.6038882732391357, 1.818009853363037, 2.0321314334869385, 2.24625301361084, 2.460374593734741, 2.6744961738586426, 2.888617992401123, 3.1027393341064453, 3.316861152648926, 3.530982732772827, 3.7451043128967285, 3.95922589302063, 4.173347473144531, 4.387469291687012, 4.601590633392334, 4.8157124519348145, 5.029833793640137, 5.243955612182617, 5.458077430725098, 5.672199249267578, 5.8863205909729, 6.100442409515381, 6.314563751220703, 6.528685569763184, 6.742807388305664, 6.956928730010986, 7.171050071716309]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 4.0, 8.0, 14.0, 14.0, 24.0, 38.0, 69.0, 88.0, 152.0, 258.0, 496.0, 1078.0, 2611.0, 7339.0, 22389.0, 76642.0, 333131.0, 457577.0, 102215.0, 29273.0, 9242.0, 3163.0, 1414.0, 582.0, 288.0, 162.0, 98.0, 69.0, 33.0, 23.0, 18.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.879638671875, -4.67724609375, -4.474853515625, -4.2724609375, -4.070068359375, -3.86767578125, -3.665283203125, -3.462890625, -3.260498046875, -3.05810546875, -2.855712890625, -2.6533203125, -2.450927734375, -2.24853515625, -2.046142578125, -1.84375, -1.641357421875, -1.43896484375, -1.236572265625, -1.0341796875, -0.831787109375, -0.62939453125, -0.427001953125, -0.224609375, -0.022216796875, 0.18017578125, 0.382568359375, 0.5849609375, 0.787353515625, 0.98974609375, 1.192138671875, 1.39453125, 1.596923828125, 1.79931640625, 2.001708984375, 2.2041015625, 2.406494140625, 2.60888671875, 2.811279296875, 3.013671875, 3.216064453125, 3.41845703125, 3.620849609375, 3.8232421875, 4.025634765625, 4.22802734375, 4.430419921875, 4.6328125, 4.835205078125, 5.03759765625, 5.239990234375, 5.4423828125, 5.644775390625, 5.84716796875, 6.049560546875, 6.251953125, 6.454345703125, 6.65673828125, 6.859130859375, 7.0615234375, 7.263916015625, 7.46630859375, 7.668701171875, 7.87109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 13.0, 20.0, 26.0, 27.0, 34.0, 71.0, 62.0, 73.0, 96.0, 92.0, 84.0, 67.0, 77.0, 54.0, 59.0, 32.0, 32.0, 18.0, 17.0, 15.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3420562744140625, -1.295440673828125, -1.2488250732421875, -1.20220947265625, -1.1555938720703125, -1.108978271484375, -1.0623626708984375, -1.0157470703125, -0.9691314697265625, -0.922515869140625, -0.8759002685546875, -0.82928466796875, -0.7826690673828125, -0.736053466796875, -0.6894378662109375, -0.642822265625, -0.5962066650390625, -0.549591064453125, -0.5029754638671875, -0.45635986328125, -0.4097442626953125, -0.363128662109375, -0.3165130615234375, -0.2698974609375, -0.2232818603515625, -0.176666259765625, -0.1300506591796875, -0.08343505859375, -0.0368194580078125, 0.009796142578125, 0.0564117431640625, 0.10302734375, 0.1496429443359375, 0.196258544921875, 0.2428741455078125, 0.28948974609375, 0.3361053466796875, 0.382720947265625, 0.4293365478515625, 0.4759521484375, 0.5225677490234375, 0.569183349609375, 0.6157989501953125, 0.66241455078125, 0.7090301513671875, 0.755645751953125, 0.8022613525390625, 0.848876953125, 0.8954925537109375, 0.942108154296875, 0.9887237548828125, 1.03533935546875, 1.0819549560546875, 1.128570556640625, 1.1751861572265625, 1.2218017578125, 1.2684173583984375, 1.315032958984375, 1.3616485595703125, 1.40826416015625, 1.4548797607421875, 1.501495361328125, 1.5481109619140625, 1.5947265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 11.0, 8.0, 22.0, 24.0, 29.0, 61.0, 74.0, 134.0, 204.0, 355.0, 636.0, 1179.0, 2279.0, 5053.0, 12856.0, 41059.0, 165750.0, 546919.0, 198325.0, 48263.0, 14395.0, 5471.0, 2452.0, 1258.0, 683.0, 387.0, 220.0, 148.0, 91.0, 62.0, 43.0, 36.0, 18.0, 14.0, 10.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.85784912109375, -5.6883544921875, -5.51885986328125, -5.349365234375, -5.17987060546875, -5.0103759765625, -4.84088134765625, -4.67138671875, -4.50189208984375, -4.3323974609375, -4.16290283203125, -3.993408203125, -3.82391357421875, -3.6544189453125, -3.48492431640625, -3.3154296875, -3.14593505859375, -2.9764404296875, -2.80694580078125, -2.637451171875, -2.46795654296875, -2.2984619140625, -2.12896728515625, -1.95947265625, -1.78997802734375, -1.6204833984375, -1.45098876953125, -1.281494140625, -1.11199951171875, -0.9425048828125, -0.77301025390625, -0.603515625, -0.43402099609375, -0.2645263671875, -0.09503173828125, 0.074462890625, 0.24395751953125, 0.4134521484375, 0.58294677734375, 0.75244140625, 0.92193603515625, 1.0914306640625, 1.26092529296875, 1.430419921875, 1.59991455078125, 1.7694091796875, 1.93890380859375, 2.1083984375, 2.27789306640625, 2.4473876953125, 2.61688232421875, 2.786376953125, 2.95587158203125, 3.1253662109375, 3.29486083984375, 3.46435546875, 3.63385009765625, 3.8033447265625, 3.97283935546875, 4.142333984375, 4.31182861328125, 4.4813232421875, 4.65081787109375, 4.8203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 3.0, 8.0, 5.0, 9.0, 13.0, 22.0, 19.0, 21.0, 21.0, 25.0, 35.0, 34.0, 46.0, 46.0, 44.0, 43.0, 53.0, 45.0, 56.0, 52.0, 39.0, 38.0, 47.0, 38.0, 42.0, 39.0, 28.0, 27.0, 18.0, 12.0, 15.0, 6.0, 9.0, 7.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.841796875, -4.69140625, -4.541015625, -4.390625, -4.240234375, -4.08984375, -3.939453125, -3.7890625, -3.638671875, -3.48828125, -3.337890625, -3.1875, -3.037109375, -2.88671875, -2.736328125, -2.5859375, -2.435546875, -2.28515625, -2.134765625, -1.984375, -1.833984375, -1.68359375, -1.533203125, -1.3828125, -1.232421875, -1.08203125, -0.931640625, -0.78125, -0.630859375, -0.48046875, -0.330078125, -0.1796875, -0.029296875, 0.12109375, 0.271484375, 0.421875, 0.572265625, 0.72265625, 0.873046875, 1.0234375, 1.173828125, 1.32421875, 1.474609375, 1.625, 1.775390625, 1.92578125, 2.076171875, 2.2265625, 2.376953125, 2.52734375, 2.677734375, 2.828125, 2.978515625, 3.12890625, 3.279296875, 3.4296875, 3.580078125, 3.73046875, 3.880859375, 4.03125, 4.181640625, 4.33203125, 4.482421875, 4.6328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 1.0, 5.0, 13.0, 11.0, 19.0, 23.0, 40.0, 80.0, 127.0, 247.0, 405.0, 909.0, 1899.0, 4904.0, 14783.0, 56167.0, 334733.0, 519858.0, 83534.0, 19918.0, 6321.0, 2374.0, 1021.0, 489.0, 301.0, 128.0, 73.0, 54.0, 28.0, 21.0, 17.0, 14.0, 6.0, 15.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.11328125, -4.96343994140625, -4.8135986328125, -4.66375732421875, -4.513916015625, -4.36407470703125, -4.2142333984375, -4.06439208984375, -3.91455078125, -3.76470947265625, -3.6148681640625, -3.46502685546875, -3.315185546875, -3.16534423828125, -3.0155029296875, -2.86566162109375, -2.7158203125, -2.56597900390625, -2.4161376953125, -2.26629638671875, -2.116455078125, -1.96661376953125, -1.8167724609375, -1.66693115234375, -1.51708984375, -1.36724853515625, -1.2174072265625, -1.06756591796875, -0.917724609375, -0.76788330078125, -0.6180419921875, -0.46820068359375, -0.318359375, -0.16851806640625, -0.0186767578125, 0.13116455078125, 0.281005859375, 0.43084716796875, 0.5806884765625, 0.73052978515625, 0.88037109375, 1.03021240234375, 1.1800537109375, 1.32989501953125, 1.479736328125, 1.62957763671875, 1.7794189453125, 1.92926025390625, 2.0791015625, 2.22894287109375, 2.3787841796875, 2.52862548828125, 2.678466796875, 2.82830810546875, 2.9781494140625, 3.12799072265625, 3.27783203125, 3.42767333984375, 3.5775146484375, 3.72735595703125, 3.877197265625, 4.02703857421875, 4.1768798828125, 4.32672119140625, 4.4765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 13.0, 7.0, 13.0, 27.0, 34.0, 44.0, 68.0, 97.0, 206.0, 217.0, 101.0, 51.0, 39.0, 27.0, 15.0, 14.0, 4.0, 10.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012350082397460938, -0.00119762122631073, -0.0011602342128753662, -0.0011228471994400024, -0.0010854601860046387, -0.001048073172569275, -0.0010106861591339111, -0.0009732991456985474, -0.0009359121322631836, -0.0008985251188278198, -0.0008611381053924561, -0.0008237510919570923, -0.0007863640785217285, -0.0007489770650863647, -0.000711590051651001, -0.0006742030382156372, -0.0006368160247802734, -0.0005994290113449097, -0.0005620419979095459, -0.0005246549844741821, -0.00048726797103881836, -0.0004498809576034546, -0.0004124939441680908, -0.00037510693073272705, -0.0003377199172973633, -0.0003003329038619995, -0.00026294589042663574, -0.00022555887699127197, -0.0001881718635559082, -0.00015078485012054443, -0.00011339783668518066, -7.60108232498169e-05, -3.8623809814453125e-05, -1.2367963790893555e-06, 3.6150217056274414e-05, 7.353723049163818e-05, 0.00011092424392700195, 0.00014831125736236572, 0.0001856982707977295, 0.00022308528423309326, 0.00026047229766845703, 0.0002978593111038208, 0.00033524632453918457, 0.00037263333797454834, 0.0004100203514099121, 0.0004474073648452759, 0.00048479437828063965, 0.0005221813917160034, 0.0005595684051513672, 0.000596955418586731, 0.0006343424320220947, 0.0006717294454574585, 0.0007091164588928223, 0.000746503472328186, 0.0007838904857635498, 0.0008212774991989136, 0.0008586645126342773, 0.0008960515260696411, 0.0009334385395050049, 0.0009708255529403687, 0.0010082125663757324, 0.0010455995798110962, 0.00108298659324646, 0.0011203736066818237, 0.0011577606201171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 10.0, 14.0, 23.0, 29.0, 35.0, 57.0, 75.0, 136.0, 207.0, 355.0, 517.0, 994.0, 1872.0, 3979.0, 9487.0, 26200.0, 92584.0, 414928.0, 373285.0, 82854.0, 24065.0, 8989.0, 3757.0, 1760.0, 916.0, 521.0, 305.0, 200.0, 107.0, 94.0, 55.0, 33.0, 31.0, 18.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.98126220703125, -2.8746337890625, -2.76800537109375, -2.661376953125, -2.55474853515625, -2.4481201171875, -2.34149169921875, -2.23486328125, -2.12823486328125, -2.0216064453125, -1.91497802734375, -1.808349609375, -1.70172119140625, -1.5950927734375, -1.48846435546875, -1.3818359375, -1.27520751953125, -1.1685791015625, -1.06195068359375, -0.955322265625, -0.84869384765625, -0.7420654296875, -0.63543701171875, -0.52880859375, -0.42218017578125, -0.3155517578125, -0.20892333984375, -0.102294921875, 0.00433349609375, 0.1109619140625, 0.21759033203125, 0.32421875, 0.43084716796875, 0.5374755859375, 0.64410400390625, 0.750732421875, 0.85736083984375, 0.9639892578125, 1.07061767578125, 1.17724609375, 1.28387451171875, 1.3905029296875, 1.49713134765625, 1.603759765625, 1.71038818359375, 1.8170166015625, 1.92364501953125, 2.0302734375, 2.13690185546875, 2.2435302734375, 2.35015869140625, 2.456787109375, 2.56341552734375, 2.6700439453125, 2.77667236328125, 2.88330078125, 2.98992919921875, 3.0965576171875, 3.20318603515625, 3.309814453125, 3.41644287109375, 3.5230712890625, 3.62969970703125, 3.736328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 8.0, 9.0, 22.0, 18.0, 19.0, 27.0, 30.0, 48.0, 72.0, 66.0, 88.0, 105.0, 90.0, 82.0, 64.0, 62.0, 41.0, 31.0, 20.0, 27.0, 9.0, 12.0, 9.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.96807861328125, -2.8775634765625, -2.78704833984375, -2.696533203125, -2.60601806640625, -2.5155029296875, -2.42498779296875, -2.33447265625, -2.24395751953125, -2.1534423828125, -2.06292724609375, -1.972412109375, -1.88189697265625, -1.7913818359375, -1.70086669921875, -1.6103515625, -1.51983642578125, -1.4293212890625, -1.33880615234375, -1.248291015625, -1.15777587890625, -1.0672607421875, -0.97674560546875, -0.88623046875, -0.79571533203125, -0.7052001953125, -0.61468505859375, -0.524169921875, -0.43365478515625, -0.3431396484375, -0.25262451171875, -0.162109375, -0.07159423828125, 0.0189208984375, 0.10943603515625, 0.199951171875, 0.29046630859375, 0.3809814453125, 0.47149658203125, 0.56201171875, 0.65252685546875, 0.7430419921875, 0.83355712890625, 0.924072265625, 1.01458740234375, 1.1051025390625, 1.19561767578125, 1.2861328125, 1.37664794921875, 1.4671630859375, 1.55767822265625, 1.648193359375, 1.73870849609375, 1.8292236328125, 1.91973876953125, 2.01025390625, 2.10076904296875, 2.1912841796875, 2.28179931640625, 2.372314453125, 2.46282958984375, 2.5533447265625, 2.64385986328125, 2.734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 10.0, 22.0, 29.0, 55.0, 83.0, 138.0, 179.0, 176.0, 130.0, 98.0, 51.0, 20.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.571617126464844, -56.747459411621094, -54.92329788208008, -53.09914016723633, -51.27497863769531, -49.45082092285156, -47.62666320800781, -45.8025016784668, -43.97834014892578, -42.15418243408203, -40.330020904541016, -38.505863189697266, -36.68170166015625, -34.8575439453125, -33.03338623046875, -31.209224700927734, -29.385066986083984, -27.5609073638916, -25.73674774169922, -23.91259002685547, -22.088428497314453, -20.264270782470703, -18.44011116027832, -16.615951538085938, -14.791791915893555, -12.967632293701172, -11.143472671508789, -9.319314002990723, -7.49515438079834, -5.670994758605957, -3.8468360900878906, -2.022676467895508, -0.19852066040039062, 1.625638723373413, 3.449798107147217, 5.273957252502441, 7.098116874694824, 8.922276496887207, 10.746435165405273, 12.570594787597656, 14.394754409790039, 16.218914031982422, 18.043073654174805, 19.867233276367188, 21.691390991210938, 23.515552520751953, 25.339710235595703, 27.163869857788086, 28.98802947998047, 30.81218910217285, 32.636348724365234, 34.460506439208984, 36.28466796875, 38.10882568359375, 39.9329833984375, 41.757144927978516, 43.58130645751953, 45.40546417236328, 47.2296257019043, 49.05378341674805, 50.87794494628906, 52.70210266113281, 54.52626037597656, 56.35042190551758, 58.17457962036133]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 9.0, 12.0, 5.0, 14.0, 13.0, 14.0, 25.0, 21.0, 14.0, 26.0, 35.0, 37.0, 30.0, 44.0, 39.0, 42.0, 43.0, 67.0, 49.0, 35.0, 44.0, 41.0, 37.0, 38.0, 37.0, 30.0, 37.0, 24.0, 20.0, 14.0, 20.0, 19.0, 9.0, 8.0, 6.0, 10.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-30.260047912597656, -29.383255004882812, -28.506460189819336, -27.629667282104492, -26.75287437438965, -25.876079559326172, -24.999286651611328, -24.122493743896484, -23.245698928833008, -22.368906021118164, -21.492111206054688, -20.615318298339844, -19.738525390625, -18.861730575561523, -17.98493766784668, -17.108142852783203, -16.23134994506836, -15.3545560836792, -14.477763175964355, -13.600969314575195, -12.724175453186035, -11.847381591796875, -10.970588684082031, -10.093794822692871, -9.217002868652344, -8.340209007263184, -7.463415622711182, -6.58662223815918, -5.7098283767700195, -4.833034992218018, -3.9562416076660156, -3.0794477462768555, -2.2026538848876953, -1.3258602619171143, -0.44906675815582275, 0.42772674560546875, 1.3045203685760498, 2.181313991546631, 3.058107376098633, 3.934901237487793, 4.811694622039795, 5.688488006591797, 6.565281867980957, 7.442075252532959, 8.318868637084961, 9.195662498474121, 10.072456359863281, 10.949249267578125, 11.826043128967285, 12.702836990356445, 13.579629898071289, 14.45642375946045, 15.33321762084961, 16.210010528564453, 17.086803436279297, 17.963598251342773, 18.840391159057617, 19.71718406677246, 20.593978881835938, 21.47077178955078, 22.347564697265625, 23.2243595123291, 24.101152420043945, 24.977947235107422, 25.854740142822266]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 10.0, 15.0, 14.0, 37.0, 41.0, 61.0, 96.0, 176.0, 242.0, 433.0, 674.0, 1237.0, 2234.0, 4628.0, 9985.0, 25813.0, 87067.0, 663724.0, 3171377.0, 161394.0, 38678.0, 13604.0, 5982.0, 2859.0, 1594.0, 809.0, 490.0, 351.0, 204.0, 130.0, 90.0, 67.0, 53.0, 24.0, 22.0, 10.0, 17.0, 5.0, 10.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.44140625, -4.278076171875, -4.11474609375, -3.951416015625, -3.7880859375, -3.624755859375, -3.46142578125, -3.298095703125, -3.134765625, -2.971435546875, -2.80810546875, -2.644775390625, -2.4814453125, -2.318115234375, -2.15478515625, -1.991455078125, -1.828125, -1.664794921875, -1.50146484375, -1.338134765625, -1.1748046875, -1.011474609375, -0.84814453125, -0.684814453125, -0.521484375, -0.358154296875, -0.19482421875, -0.031494140625, 0.1318359375, 0.295166015625, 0.45849609375, 0.621826171875, 0.78515625, 0.948486328125, 1.11181640625, 1.275146484375, 1.4384765625, 1.601806640625, 1.76513671875, 1.928466796875, 2.091796875, 2.255126953125, 2.41845703125, 2.581787109375, 2.7451171875, 2.908447265625, 3.07177734375, 3.235107421875, 3.3984375, 3.561767578125, 3.72509765625, 3.888427734375, 4.0517578125, 4.215087890625, 4.37841796875, 4.541748046875, 4.705078125, 4.868408203125, 5.03173828125, 5.195068359375, 5.3583984375, 5.521728515625, 5.68505859375, 5.848388671875, 6.01171875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 6.0, 6.0, 13.0, 18.0, 26.0, 40.0, 45.0, 44.0, 56.0, 72.0, 79.0, 85.0, 88.0, 66.0, 81.0, 55.0, 44.0, 51.0, 26.0, 29.0, 18.0, 16.0, 12.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4184112548828125, -1.366119384765625, -1.3138275146484375, -1.26153564453125, -1.2092437744140625, -1.156951904296875, -1.1046600341796875, -1.0523681640625, -1.0000762939453125, -0.947784423828125, -0.8954925537109375, -0.84320068359375, -0.7909088134765625, -0.738616943359375, -0.6863250732421875, -0.634033203125, -0.5817413330078125, -0.529449462890625, -0.4771575927734375, -0.42486572265625, -0.3725738525390625, -0.320281982421875, -0.2679901123046875, -0.2156982421875, -0.1634063720703125, -0.111114501953125, -0.0588226318359375, -0.00653076171875, 0.0457611083984375, 0.098052978515625, 0.1503448486328125, 0.20263671875, 0.2549285888671875, 0.307220458984375, 0.3595123291015625, 0.41180419921875, 0.4640960693359375, 0.516387939453125, 0.5686798095703125, 0.6209716796875, 0.6732635498046875, 0.725555419921875, 0.7778472900390625, 0.83013916015625, 0.8824310302734375, 0.934722900390625, 0.9870147705078125, 1.039306640625, 1.0915985107421875, 1.143890380859375, 1.1961822509765625, 1.24847412109375, 1.3007659912109375, 1.353057861328125, 1.4053497314453125, 1.4576416015625, 1.5099334716796875, 1.562225341796875, 1.6145172119140625, 1.66680908203125, 1.7191009521484375, 1.771392822265625, 1.8236846923828125, 1.8759765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 15.0, 25.0, 32.0, 42.0, 87.0, 85.0, 167.0, 276.0, 510.0, 931.0, 1662.0, 3293.0, 7641.0, 19896.0, 62158.0, 289590.0, 3163243.0, 511374.0, 88335.0, 26222.0, 9832.0, 4206.0, 1976.0, 1082.0, 589.0, 355.0, 222.0, 148.0, 77.0, 66.0, 43.0, 33.0, 20.0, 11.0, 7.0, 6.0, 4.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.9390869140625, -5.757080078125, -5.5750732421875, -5.39306640625, -5.2110595703125, -5.029052734375, -4.8470458984375, -4.6650390625, -4.4830322265625, -4.301025390625, -4.1190185546875, -3.93701171875, -3.7550048828125, -3.572998046875, -3.3909912109375, -3.208984375, -3.0269775390625, -2.844970703125, -2.6629638671875, -2.48095703125, -2.2989501953125, -2.116943359375, -1.9349365234375, -1.7529296875, -1.5709228515625, -1.388916015625, -1.2069091796875, -1.02490234375, -0.8428955078125, -0.660888671875, -0.4788818359375, -0.296875, -0.1148681640625, 0.067138671875, 0.2491455078125, 0.43115234375, 0.6131591796875, 0.795166015625, 0.9771728515625, 1.1591796875, 1.3411865234375, 1.523193359375, 1.7052001953125, 1.88720703125, 2.0692138671875, 2.251220703125, 2.4332275390625, 2.615234375, 2.7972412109375, 2.979248046875, 3.1612548828125, 3.34326171875, 3.5252685546875, 3.707275390625, 3.8892822265625, 4.0712890625, 4.2532958984375, 4.435302734375, 4.6173095703125, 4.79931640625, 4.9813232421875, 5.163330078125, 5.3453369140625, 5.52734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 5.0, 8.0, 10.0, 9.0, 15.0, 16.0, 25.0, 43.0, 48.0, 89.0, 129.0, 221.0, 496.0, 1448.0, 710.0, 313.0, 159.0, 109.0, 58.0, 45.0, 26.0, 18.0, 14.0, 13.0, 7.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.421875, -2.34295654296875, -2.2640380859375, -2.18511962890625, -2.106201171875, -2.02728271484375, -1.9483642578125, -1.86944580078125, -1.79052734375, -1.71160888671875, -1.6326904296875, -1.55377197265625, -1.474853515625, -1.39593505859375, -1.3170166015625, -1.23809814453125, -1.1591796875, -1.08026123046875, -1.0013427734375, -0.92242431640625, -0.843505859375, -0.76458740234375, -0.6856689453125, -0.60675048828125, -0.52783203125, -0.44891357421875, -0.3699951171875, -0.29107666015625, -0.212158203125, -0.13323974609375, -0.0543212890625, 0.02459716796875, 0.103515625, 0.18243408203125, 0.2613525390625, 0.34027099609375, 0.419189453125, 0.49810791015625, 0.5770263671875, 0.65594482421875, 0.73486328125, 0.81378173828125, 0.8927001953125, 0.97161865234375, 1.050537109375, 1.12945556640625, 1.2083740234375, 1.28729248046875, 1.3662109375, 1.44512939453125, 1.5240478515625, 1.60296630859375, 1.681884765625, 1.76080322265625, 1.8397216796875, 1.91864013671875, 1.99755859375, 2.07647705078125, 2.1553955078125, 2.23431396484375, 2.313232421875, 2.39215087890625, 2.4710693359375, 2.54998779296875, 2.62890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 16.0, 42.0, 53.0, 106.0, 154.0, 154.0, 157.0, 117.0, 87.0, 50.0, 27.0, 19.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.903913497924805, -15.205830574035645, -14.507747650146484, -13.809663772583008, -13.111580848693848, -12.413497924804688, -11.715414047241211, -11.01733112335205, -10.31924819946289, -9.62116527557373, -8.92308235168457, -8.224998474121094, -7.526915550231934, -6.828832626342773, -6.130749225616455, -5.432665824890137, -4.734582901000977, -4.036499977111816, -3.338416576385498, -2.640333414077759, -1.9422502517700195, -1.2441670894622803, -0.546083927154541, 0.15199947357177734, 0.8500823974609375, 1.5481655597686768, 2.246248722076416, 2.9443318843841553, 3.6424150466918945, 4.340497970581055, 5.038581371307373, 5.736664772033691, 6.434745788574219, 7.132828712463379, 7.830912113189697, 8.528995513916016, 9.227078437805176, 9.925161361694336, 10.623245239257812, 11.321328163146973, 12.019411087036133, 12.717494010925293, 13.415576934814453, 14.11366081237793, 14.81174373626709, 15.50982666015625, 16.207910537719727, 16.905994415283203, 17.604076385498047, 18.302160263061523, 19.000242233276367, 19.698326110839844, 20.396408081054688, 21.094491958618164, 21.79257583618164, 22.490657806396484, 23.18874168395996, 23.886825561523438, 24.58490753173828, 25.282991409301758, 25.981075286865234, 26.679157257080078, 27.377241134643555, 28.07532501220703, 28.773406982421875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 11.0, 14.0, 12.0, 19.0, 15.0, 21.0, 27.0, 28.0, 19.0, 26.0, 36.0, 40.0, 47.0, 44.0, 30.0, 45.0, 49.0, 46.0, 35.0, 49.0, 54.0, 42.0, 29.0, 26.0, 32.0, 27.0, 29.0, 22.0, 18.0, 19.0, 18.0, 12.0, 12.0, 9.0, 7.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.771770477294922, -9.498116493225098, -9.224462509155273, -8.950807571411133, -8.677153587341309, -8.403499603271484, -8.12984561920166, -7.856191635131836, -7.5825371742248535, -7.308883190155029, -7.035228729248047, -6.761574745178223, -6.487920761108398, -6.214266300201416, -5.940612316131592, -5.666957855224609, -5.393303871154785, -5.119649887084961, -4.8459954261779785, -4.572341442108154, -4.298686981201172, -4.025032997131348, -3.7513790130615234, -3.47772479057312, -3.204070568084717, -2.9304163455963135, -2.65676212310791, -2.383108139038086, -2.1094539165496826, -1.8357996940612793, -1.5621455907821655, -1.2884914875030518, -1.0148382186889648, -0.7411840558052063, -0.46752989292144775, -0.1938757300376892, 0.07977843284606934, 0.35343265533447266, 0.6270867586135864, 0.9007408618927002, 1.1743950843811035, 1.4480493068695068, 1.7217034101486206, 1.9953575134277344, 2.2690117359161377, 2.542665958404541, 2.8163199424743652, 3.0899741649627686, 3.363628387451172, 3.637282609939575, 3.9109368324279785, 4.184590816497803, 4.458245277404785, 4.731899261474609, 5.005553245544434, 5.279207229614258, 5.55286169052124, 5.8265156745910645, 6.100170135498047, 6.373824119567871, 6.647478103637695, 6.921132564544678, 7.194786548614502, 7.468441009521484, 7.742094993591309]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 14.0, 25.0, 34.0, 37.0, 77.0, 122.0, 199.0, 308.0, 510.0, 971.0, 1761.0, 3606.0, 7344.0, 15996.0, 36042.0, 84398.0, 211479.0, 378411.0, 177459.0, 72028.0, 30831.0, 13897.0, 6367.0, 3008.0, 1597.0, 841.0, 457.0, 272.0, 172.0, 110.0, 59.0, 31.0, 32.0, 11.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.796875, -5.64190673828125, -5.4869384765625, -5.33197021484375, -5.177001953125, -5.02203369140625, -4.8670654296875, -4.71209716796875, -4.55712890625, -4.40216064453125, -4.2471923828125, -4.09222412109375, -3.937255859375, -3.78228759765625, -3.6273193359375, -3.47235107421875, -3.3173828125, -3.16241455078125, -3.0074462890625, -2.85247802734375, -2.697509765625, -2.54254150390625, -2.3875732421875, -2.23260498046875, -2.07763671875, -1.92266845703125, -1.7677001953125, -1.61273193359375, -1.457763671875, -1.30279541015625, -1.1478271484375, -0.99285888671875, -0.837890625, -0.68292236328125, -0.5279541015625, -0.37298583984375, -0.218017578125, -0.06304931640625, 0.0919189453125, 0.24688720703125, 0.40185546875, 0.55682373046875, 0.7117919921875, 0.86676025390625, 1.021728515625, 1.17669677734375, 1.3316650390625, 1.48663330078125, 1.6416015625, 1.79656982421875, 1.9515380859375, 2.10650634765625, 2.261474609375, 2.41644287109375, 2.5714111328125, 2.72637939453125, 2.88134765625, 3.03631591796875, 3.1912841796875, 3.34625244140625, 3.501220703125, 3.65618896484375, 3.8111572265625, 3.96612548828125, 4.12109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 13.0, 8.0, 17.0, 12.0, 23.0, 36.0, 47.0, 45.0, 57.0, 61.0, 61.0, 83.0, 80.0, 84.0, 71.0, 57.0, 52.0, 36.0, 27.0, 34.0, 24.0, 20.0, 8.0, 20.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.466796875, -1.41680908203125, -1.3668212890625, -1.31683349609375, -1.266845703125, -1.21685791015625, -1.1668701171875, -1.11688232421875, -1.06689453125, -1.01690673828125, -0.9669189453125, -0.91693115234375, -0.866943359375, -0.81695556640625, -0.7669677734375, -0.71697998046875, -0.6669921875, -0.61700439453125, -0.5670166015625, -0.51702880859375, -0.467041015625, -0.41705322265625, -0.3670654296875, -0.31707763671875, -0.26708984375, -0.21710205078125, -0.1671142578125, -0.11712646484375, -0.067138671875, -0.01715087890625, 0.0328369140625, 0.08282470703125, 0.1328125, 0.18280029296875, 0.2327880859375, 0.28277587890625, 0.332763671875, 0.38275146484375, 0.4327392578125, 0.48272705078125, 0.53271484375, 0.58270263671875, 0.6326904296875, 0.68267822265625, 0.732666015625, 0.78265380859375, 0.8326416015625, 0.88262939453125, 0.9326171875, 0.98260498046875, 1.0325927734375, 1.08258056640625, 1.132568359375, 1.18255615234375, 1.2325439453125, 1.28253173828125, 1.33251953125, 1.38250732421875, 1.4324951171875, 1.48248291015625, 1.532470703125, 1.58245849609375, 1.6324462890625, 1.68243408203125, 1.732421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 10.0, 8.0, 11.0, 15.0, 17.0, 33.0, 33.0, 57.0, 53.0, 105.0, 136.0, 158.0, 293.0, 348.0, 592.0, 1109.0, 1965.0, 4643.0, 12938.0, 40986.0, 143629.0, 474247.0, 260545.0, 71692.0, 21437.0, 7013.0, 2857.0, 1396.0, 685.0, 461.0, 336.0, 212.0, 156.0, 96.0, 62.0, 59.0, 27.0, 33.0, 28.0, 16.0, 11.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9261474609375, -4.754638671875, -4.5831298828125, -4.41162109375, -4.2401123046875, -4.068603515625, -3.8970947265625, -3.7255859375, -3.5540771484375, -3.382568359375, -3.2110595703125, -3.03955078125, -2.8680419921875, -2.696533203125, -2.5250244140625, -2.353515625, -2.1820068359375, -2.010498046875, -1.8389892578125, -1.66748046875, -1.4959716796875, -1.324462890625, -1.1529541015625, -0.9814453125, -0.8099365234375, -0.638427734375, -0.4669189453125, -0.29541015625, -0.1239013671875, 0.047607421875, 0.2191162109375, 0.390625, 0.5621337890625, 0.733642578125, 0.9051513671875, 1.07666015625, 1.2481689453125, 1.419677734375, 1.5911865234375, 1.7626953125, 1.9342041015625, 2.105712890625, 2.2772216796875, 2.44873046875, 2.6202392578125, 2.791748046875, 2.9632568359375, 3.134765625, 3.3062744140625, 3.477783203125, 3.6492919921875, 3.82080078125, 3.9923095703125, 4.163818359375, 4.3353271484375, 4.5068359375, 4.6783447265625, 4.849853515625, 5.0213623046875, 5.19287109375, 5.3643798828125, 5.535888671875, 5.7073974609375, 5.87890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 12.0, 9.0, 16.0, 13.0, 11.0, 13.0, 25.0, 23.0, 30.0, 35.0, 32.0, 42.0, 53.0, 42.0, 43.0, 36.0, 29.0, 44.0, 57.0, 48.0, 47.0, 51.0, 36.0, 48.0, 25.0, 28.0, 24.0, 19.0, 18.0, 17.0, 15.0, 6.0, 8.0, 7.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.42578125, -4.26611328125, -4.1064453125, -3.94677734375, -3.787109375, -3.62744140625, -3.4677734375, -3.30810546875, -3.1484375, -2.98876953125, -2.8291015625, -2.66943359375, -2.509765625, -2.35009765625, -2.1904296875, -2.03076171875, -1.87109375, -1.71142578125, -1.5517578125, -1.39208984375, -1.232421875, -1.07275390625, -0.9130859375, -0.75341796875, -0.59375, -0.43408203125, -0.2744140625, -0.11474609375, 0.044921875, 0.20458984375, 0.3642578125, 0.52392578125, 0.68359375, 0.84326171875, 1.0029296875, 1.16259765625, 1.322265625, 1.48193359375, 1.6416015625, 1.80126953125, 1.9609375, 2.12060546875, 2.2802734375, 2.43994140625, 2.599609375, 2.75927734375, 2.9189453125, 3.07861328125, 3.23828125, 3.39794921875, 3.5576171875, 3.71728515625, 3.876953125, 4.03662109375, 4.1962890625, 4.35595703125, 4.515625, 4.67529296875, 4.8349609375, 4.99462890625, 5.154296875, 5.31396484375, 5.4736328125, 5.63330078125, 5.79296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 9.0, 14.0, 21.0, 36.0, 74.0, 125.0, 250.0, 550.0, 1270.0, 3617.0, 11903.0, 48535.0, 297692.0, 565717.0, 90129.0, 19578.0, 5737.0, 1832.0, 805.0, 299.0, 161.0, 85.0, 43.0, 29.0, 13.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.19329833984375, -6.0311279296875, -5.86895751953125, -5.706787109375, -5.54461669921875, -5.3824462890625, -5.22027587890625, -5.05810546875, -4.89593505859375, -4.7337646484375, -4.57159423828125, -4.409423828125, -4.24725341796875, -4.0850830078125, -3.92291259765625, -3.7607421875, -3.59857177734375, -3.4364013671875, -3.27423095703125, -3.112060546875, -2.94989013671875, -2.7877197265625, -2.62554931640625, -2.46337890625, -2.30120849609375, -2.1390380859375, -1.97686767578125, -1.814697265625, -1.65252685546875, -1.4903564453125, -1.32818603515625, -1.166015625, -1.00384521484375, -0.8416748046875, -0.67950439453125, -0.517333984375, -0.35516357421875, -0.1929931640625, -0.03082275390625, 0.13134765625, 0.29351806640625, 0.4556884765625, 0.61785888671875, 0.780029296875, 0.94219970703125, 1.1043701171875, 1.26654052734375, 1.4287109375, 1.59088134765625, 1.7530517578125, 1.91522216796875, 2.077392578125, 2.23956298828125, 2.4017333984375, 2.56390380859375, 2.72607421875, 2.88824462890625, 3.0504150390625, 3.21258544921875, 3.374755859375, 3.53692626953125, 3.6990966796875, 3.86126708984375, 4.0234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 10.0, 10.0, 19.0, 23.0, 21.0, 27.0, 40.0, 64.0, 77.0, 160.0, 155.0, 120.0, 63.0, 48.0, 44.0, 22.0, 19.0, 17.0, 8.0, 16.0, 9.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008945465087890625, -0.000863984227180481, -0.0008334219455718994, -0.0008028596639633179, -0.0007722973823547363, -0.0007417351007461548, -0.0007111728191375732, -0.0006806105375289917, -0.0006500482559204102, -0.0006194859743118286, -0.0005889236927032471, -0.0005583614110946655, -0.000527799129486084, -0.0004972368478775024, -0.0004666745662689209, -0.00043611228466033936, -0.0004055500030517578, -0.00037498772144317627, -0.0003444254398345947, -0.0003138631582260132, -0.00028330087661743164, -0.0002527385950088501, -0.00022217631340026855, -0.000191614031791687, -0.00016105175018310547, -0.00013048946857452393, -9.992718696594238e-05, -6.936490535736084e-05, -3.88026237487793e-05, -8.240342140197754e-06, 2.232193946838379e-05, 5.288422107696533e-05, 8.344650268554688e-05, 0.00011400878429412842, 0.00014457106590270996, 0.0001751333475112915, 0.00020569562911987305, 0.0002362579107284546, 0.00026682019233703613, 0.0002973824739456177, 0.0003279447555541992, 0.00035850703716278076, 0.0003890693187713623, 0.00041963160037994385, 0.0004501938819885254, 0.00048075616359710693, 0.0005113184452056885, 0.00054188072681427, 0.0005724430084228516, 0.0006030052900314331, 0.0006335675716400146, 0.0006641298532485962, 0.0006946921348571777, 0.0007252544164657593, 0.0007558166980743408, 0.0007863789796829224, 0.0008169412612915039, 0.0008475035429000854, 0.000878065824508667, 0.0009086281061172485, 0.0009391903877258301, 0.0009697526693344116, 0.0010003149509429932, 0.0010308772325515747, 0.0010614395141601562]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 15.0, 14.0, 23.0, 46.0, 49.0, 80.0, 141.0, 274.0, 567.0, 1114.0, 2957.0, 9492.0, 39287.0, 282344.0, 605958.0, 81536.0, 16635.0, 4689.0, 1764.0, 708.0, 346.0, 201.0, 139.0, 68.0, 29.0, 26.0, 13.0, 9.0, 11.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.14605712890625, -4.9757080078125, -4.80535888671875, -4.635009765625, -4.46466064453125, -4.2943115234375, -4.12396240234375, -3.95361328125, -3.78326416015625, -3.6129150390625, -3.44256591796875, -3.272216796875, -3.10186767578125, -2.9315185546875, -2.76116943359375, -2.5908203125, -2.42047119140625, -2.2501220703125, -2.07977294921875, -1.909423828125, -1.73907470703125, -1.5687255859375, -1.39837646484375, -1.22802734375, -1.05767822265625, -0.8873291015625, -0.71697998046875, -0.546630859375, -0.37628173828125, -0.2059326171875, -0.03558349609375, 0.134765625, 0.30511474609375, 0.4754638671875, 0.64581298828125, 0.816162109375, 0.98651123046875, 1.1568603515625, 1.32720947265625, 1.49755859375, 1.66790771484375, 1.8382568359375, 2.00860595703125, 2.178955078125, 2.34930419921875, 2.5196533203125, 2.69000244140625, 2.8603515625, 3.03070068359375, 3.2010498046875, 3.37139892578125, 3.541748046875, 3.71209716796875, 3.8824462890625, 4.05279541015625, 4.22314453125, 4.39349365234375, 4.5638427734375, 4.73419189453125, 4.904541015625, 5.07489013671875, 5.2452392578125, 5.41558837890625, 5.5859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 7.0, 13.0, 6.0, 8.0, 14.0, 10.0, 18.0, 19.0, 35.0, 37.0, 47.0, 71.0, 77.0, 108.0, 109.0, 72.0, 80.0, 60.0, 48.0, 24.0, 25.0, 24.0, 14.0, 18.0, 6.0, 10.0, 8.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.85546875, -2.76385498046875, -2.6722412109375, -2.58062744140625, -2.489013671875, -2.39739990234375, -2.3057861328125, -2.21417236328125, -2.12255859375, -2.03094482421875, -1.9393310546875, -1.84771728515625, -1.756103515625, -1.66448974609375, -1.5728759765625, -1.48126220703125, -1.3896484375, -1.29803466796875, -1.2064208984375, -1.11480712890625, -1.023193359375, -0.93157958984375, -0.8399658203125, -0.74835205078125, -0.65673828125, -0.56512451171875, -0.4735107421875, -0.38189697265625, -0.290283203125, -0.19866943359375, -0.1070556640625, -0.01544189453125, 0.076171875, 0.16778564453125, 0.2593994140625, 0.35101318359375, 0.442626953125, 0.53424072265625, 0.6258544921875, 0.71746826171875, 0.80908203125, 0.90069580078125, 0.9923095703125, 1.08392333984375, 1.175537109375, 1.26715087890625, 1.3587646484375, 1.45037841796875, 1.5419921875, 1.63360595703125, 1.7252197265625, 1.81683349609375, 1.908447265625, 2.00006103515625, 2.0916748046875, 2.18328857421875, 2.27490234375, 2.36651611328125, 2.4581298828125, 2.54974365234375, 2.641357421875, 2.73297119140625, 2.8245849609375, 2.91619873046875, 3.0078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 19.0, 37.0, 94.0, 197.0, 240.0, 221.0, 109.0, 53.0, 18.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-131.51681518554688, -128.91770935058594, -126.318603515625, -123.71949768066406, -121.12039184570312, -118.52128601074219, -115.92218017578125, -113.32307434082031, -110.72396850585938, -108.12486267089844, -105.5257568359375, -102.92665100097656, -100.32754516601562, -97.72843933105469, -95.12933349609375, -92.53022766113281, -89.9311294555664, -87.33202362060547, -84.73291778564453, -82.1338119506836, -79.53470611572266, -76.93560028076172, -74.33649444580078, -71.73739624023438, -69.13829040527344, -66.5391845703125, -63.94007873535156, -61.340972900390625, -58.74186706542969, -56.14276123046875, -53.54365921020508, -50.94455337524414, -48.34545135498047, -45.74634552001953, -43.147239685058594, -40.548133850097656, -37.94902801513672, -35.34992218017578, -32.75082015991211, -30.151714324951172, -27.552608489990234, -24.953502655029297, -22.35439682006836, -19.755292892456055, -17.156187057495117, -14.55708122253418, -11.957976341247559, -9.358871459960938, -6.759765625, -4.160660266876221, -1.5615549087524414, 1.037550449371338, 3.636655807495117, 6.235761642456055, 8.834866523742676, 11.433971405029297, 14.033077239990234, 16.632183074951172, 19.23128890991211, 21.830392837524414, 24.42949867248535, 27.02860450744629, 29.627708435058594, 32.22681427001953, 34.82592010498047]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 2.0, 7.0, 10.0, 7.0, 12.0, 14.0, 16.0, 17.0, 15.0, 19.0, 24.0, 22.0, 28.0, 29.0, 37.0, 32.0, 42.0, 54.0, 48.0, 40.0, 50.0, 50.0, 45.0, 46.0, 38.0, 42.0, 42.0, 28.0, 37.0, 35.0, 21.0, 14.0, 14.0, 10.0, 9.0, 13.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.914569854736328, -28.060869216918945, -27.207168579101562, -26.35346794128418, -25.499767303466797, -24.646068572998047, -23.792367935180664, -22.93866729736328, -22.0849666595459, -21.231266021728516, -20.377565383911133, -19.52386474609375, -18.670166015625, -17.816463470458984, -16.962764739990234, -16.10906410217285, -15.255363464355469, -14.401662826538086, -13.547962188720703, -12.694262504577637, -11.840561866760254, -10.986861228942871, -10.133161544799805, -9.279460906982422, -8.425760269165039, -7.572059631347656, -6.718359470367432, -5.864659309387207, -5.010958671569824, -4.157258033752441, -3.303557872772217, -2.449857711791992, -1.5961551666259766, -0.7424547672271729, 0.11124563217163086, 0.9649460315704346, 1.8186464309692383, 2.672347068786621, 3.5260472297668457, 4.37974739074707, 5.233448028564453, 6.087148666381836, 6.9408488273620605, 7.794548988342285, 8.648249626159668, 9.50195026397705, 10.355649948120117, 11.2093505859375, 12.063051223754883, 12.916751861572266, 13.770452499389648, 14.624152183532715, 15.477852821350098, 16.331554412841797, 17.185253143310547, 18.03895378112793, 18.892654418945312, 19.746355056762695, 20.600055694580078, 21.45375633239746, 22.307456970214844, 23.161155700683594, 24.014856338500977, 24.86855697631836, 25.722257614135742]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 11.0, 7.0, 12.0, 19.0, 25.0, 68.0, 104.0, 150.0, 329.0, 669.0, 1324.0, 2976.0, 7758.0, 24580.0, 110924.0, 2752665.0, 1172825.0, 87997.0, 20302.0, 6577.0, 2504.0, 1156.0, 546.0, 292.0, 170.0, 84.0, 52.0, 45.0, 32.0, 23.0, 14.0, 9.0, 4.0, 5.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.36566162109375, -5.1414794921875, -4.91729736328125, -4.693115234375, -4.46893310546875, -4.2447509765625, -4.02056884765625, -3.79638671875, -3.57220458984375, -3.3480224609375, -3.12384033203125, -2.899658203125, -2.67547607421875, -2.4512939453125, -2.22711181640625, -2.0029296875, -1.77874755859375, -1.5545654296875, -1.33038330078125, -1.106201171875, -0.88201904296875, -0.6578369140625, -0.43365478515625, -0.20947265625, 0.01470947265625, 0.2388916015625, 0.46307373046875, 0.687255859375, 0.91143798828125, 1.1356201171875, 1.35980224609375, 1.583984375, 1.80816650390625, 2.0323486328125, 2.25653076171875, 2.480712890625, 2.70489501953125, 2.9290771484375, 3.15325927734375, 3.37744140625, 3.60162353515625, 3.8258056640625, 4.04998779296875, 4.274169921875, 4.49835205078125, 4.7225341796875, 4.94671630859375, 5.1708984375, 5.39508056640625, 5.6192626953125, 5.84344482421875, 6.067626953125, 6.29180908203125, 6.5159912109375, 6.74017333984375, 6.96435546875, 7.18853759765625, 7.4127197265625, 7.63690185546875, 7.861083984375, 8.08526611328125, 8.3094482421875, 8.53363037109375, 8.7578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 10.0, 15.0, 12.0, 17.0, 26.0, 31.0, 34.0, 30.0, 52.0, 62.0, 51.0, 58.0, 69.0, 73.0, 67.0, 59.0, 58.0, 33.0, 49.0, 39.0, 21.0, 25.0, 21.0, 18.0, 14.0, 13.0, 11.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.259765625, -1.213592529296875, -1.16741943359375, -1.121246337890625, -1.0750732421875, -1.028900146484375, -0.98272705078125, -0.936553955078125, -0.890380859375, -0.844207763671875, -0.79803466796875, -0.751861572265625, -0.7056884765625, -0.659515380859375, -0.61334228515625, -0.567169189453125, -0.52099609375, -0.474822998046875, -0.42864990234375, -0.382476806640625, -0.3363037109375, -0.290130615234375, -0.24395751953125, -0.197784423828125, -0.151611328125, -0.105438232421875, -0.05926513671875, -0.013092041015625, 0.0330810546875, 0.079254150390625, 0.12542724609375, 0.171600341796875, 0.2177734375, 0.263946533203125, 0.31011962890625, 0.356292724609375, 0.4024658203125, 0.448638916015625, 0.49481201171875, 0.540985107421875, 0.587158203125, 0.633331298828125, 0.67950439453125, 0.725677490234375, 0.7718505859375, 0.818023681640625, 0.86419677734375, 0.910369873046875, 0.95654296875, 1.002716064453125, 1.04888916015625, 1.095062255859375, 1.1412353515625, 1.187408447265625, 1.23358154296875, 1.279754638671875, 1.325927734375, 1.372100830078125, 1.41827392578125, 1.464447021484375, 1.5106201171875, 1.556793212890625, 1.60296630859375, 1.649139404296875, 1.6953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 9.0, 12.0, 21.0, 48.0, 69.0, 103.0, 152.0, 314.0, 563.0, 951.0, 1700.0, 3356.0, 7467.0, 18107.0, 54488.0, 216172.0, 2250536.0, 1390202.0, 174500.0, 46679.0, 15701.0, 6443.0, 2973.0, 1547.0, 866.0, 516.0, 285.0, 202.0, 123.0, 72.0, 43.0, 25.0, 11.0, 12.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.59124755859375, -4.4207763671875, -4.25030517578125, -4.079833984375, -3.90936279296875, -3.7388916015625, -3.56842041015625, -3.39794921875, -3.22747802734375, -3.0570068359375, -2.88653564453125, -2.716064453125, -2.54559326171875, -2.3751220703125, -2.20465087890625, -2.0341796875, -1.86370849609375, -1.6932373046875, -1.52276611328125, -1.352294921875, -1.18182373046875, -1.0113525390625, -0.84088134765625, -0.67041015625, -0.49993896484375, -0.3294677734375, -0.15899658203125, 0.011474609375, 0.18194580078125, 0.3524169921875, 0.52288818359375, 0.693359375, 0.86383056640625, 1.0343017578125, 1.20477294921875, 1.375244140625, 1.54571533203125, 1.7161865234375, 1.88665771484375, 2.05712890625, 2.22760009765625, 2.3980712890625, 2.56854248046875, 2.739013671875, 2.90948486328125, 3.0799560546875, 3.25042724609375, 3.4208984375, 3.59136962890625, 3.7618408203125, 3.93231201171875, 4.102783203125, 4.27325439453125, 4.4437255859375, 4.61419677734375, 4.78466796875, 4.95513916015625, 5.1256103515625, 5.29608154296875, 5.466552734375, 5.63702392578125, 5.8074951171875, 5.97796630859375, 6.1484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 7.0, 3.0, 5.0, 5.0, 16.0, 7.0, 17.0, 19.0, 24.0, 32.0, 54.0, 55.0, 90.0, 85.0, 140.0, 224.0, 286.0, 585.0, 961.0, 473.0, 281.0, 186.0, 137.0, 95.0, 60.0, 46.0, 46.0, 26.0, 16.0, 20.0, 12.0, 12.0, 7.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.984375, -1.91900634765625, -1.8536376953125, -1.78826904296875, -1.722900390625, -1.65753173828125, -1.5921630859375, -1.52679443359375, -1.46142578125, -1.39605712890625, -1.3306884765625, -1.26531982421875, -1.199951171875, -1.13458251953125, -1.0692138671875, -1.00384521484375, -0.9384765625, -0.87310791015625, -0.8077392578125, -0.74237060546875, -0.677001953125, -0.61163330078125, -0.5462646484375, -0.48089599609375, -0.41552734375, -0.35015869140625, -0.2847900390625, -0.21942138671875, -0.154052734375, -0.08868408203125, -0.0233154296875, 0.04205322265625, 0.107421875, 0.17279052734375, 0.2381591796875, 0.30352783203125, 0.368896484375, 0.43426513671875, 0.4996337890625, 0.56500244140625, 0.63037109375, 0.69573974609375, 0.7611083984375, 0.82647705078125, 0.891845703125, 0.95721435546875, 1.0225830078125, 1.08795166015625, 1.1533203125, 1.21868896484375, 1.2840576171875, 1.34942626953125, 1.414794921875, 1.48016357421875, 1.5455322265625, 1.61090087890625, 1.67626953125, 1.74163818359375, 1.8070068359375, 1.87237548828125, 1.937744140625, 2.00311279296875, 2.0684814453125, 2.13385009765625, 2.19921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 27.0, 40.0, 106.0, 183.0, 261.0, 189.0, 121.0, 46.0, 14.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-58.00514602661133, -56.78849411010742, -55.571842193603516, -54.35519027709961, -53.1385383605957, -51.9218864440918, -50.70523452758789, -49.48857879638672, -48.27192687988281, -47.055274963378906, -45.838623046875, -44.621971130371094, -43.40531921386719, -42.18866729736328, -40.972015380859375, -39.75536346435547, -38.53871154785156, -37.322059631347656, -36.10540771484375, -34.888755798339844, -33.67210388183594, -32.45545196533203, -31.238798141479492, -30.022146224975586, -28.80549430847168, -27.588842391967773, -26.372190475463867, -25.15553855895996, -23.938884735107422, -22.722232818603516, -21.50558090209961, -20.288928985595703, -19.072280883789062, -17.855628967285156, -16.63897705078125, -15.422324180603027, -14.205672264099121, -12.989020347595215, -11.772367477416992, -10.555715560913086, -9.33906364440918, -8.122411727905273, -6.905759334564209, -5.6891069412231445, -4.472455024719238, -3.255803108215332, -2.0391507148742676, -0.8224983215332031, 0.3941535949707031, 1.6108057498931885, 2.827457904815674, 4.044110298156738, 5.2607622146606445, 6.477414131164551, 7.694066524505615, 8.91071891784668, 10.127370834350586, 11.344022750854492, 12.560674667358398, 13.777327537536621, 14.993979454040527, 16.21063232421875, 17.427284240722656, 18.643936157226562, 19.86058807373047]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 11.0, 15.0, 21.0, 15.0, 18.0, 15.0, 34.0, 25.0, 33.0, 35.0, 36.0, 40.0, 40.0, 50.0, 48.0, 49.0, 48.0, 43.0, 33.0, 37.0, 40.0, 31.0, 32.0, 30.0, 37.0, 24.0, 21.0, 20.0, 16.0, 17.0, 13.0, 12.0, 8.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.16110610961914, -10.830178260803223, -10.499251365661621, -10.168323516845703, -9.837395668029785, -9.506467819213867, -9.175540924072266, -8.844613075256348, -8.51368522644043, -8.182757377624512, -7.851830005645752, -7.520902633666992, -7.189974784851074, -6.8590474128723145, -6.528120040893555, -6.197192192077637, -5.866265296936035, -5.535337924957275, -5.204410076141357, -4.873482704162598, -4.54255485534668, -4.21162748336792, -3.88070011138916, -3.5497725009918213, -3.2188448905944824, -2.8879172801971436, -2.5569896697998047, -2.226062297821045, -1.895134687423706, -1.5642070770263672, -1.2332795858383179, -0.9023520946502686, -0.5714235305786133, -0.2404959797859192, 0.0904315710067749, 0.421359121799469, 0.7522866725921631, 1.083214282989502, 1.4141417741775513, 1.7450692653656006, 2.0759968757629395, 2.4069244861602783, 2.737852096557617, 3.068779468536377, 3.399707078933716, 3.7306346893310547, 4.0615620613098145, 4.392489433288574, 4.723417282104492, 5.054344654083252, 5.38527250289917, 5.71619987487793, 6.047127723693848, 6.378055095672607, 6.708982467651367, 7.039910316467285, 7.370837688446045, 7.701765060424805, 8.032692909240723, 8.36362075805664, 8.694547653198242, 9.02547550201416, 9.356403350830078, 9.68733024597168, 10.018258094787598]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 4.0, 20.0, 25.0, 47.0, 65.0, 88.0, 142.0, 202.0, 295.0, 538.0, 835.0, 1336.0, 2201.0, 3897.0, 6877.0, 12229.0, 22679.0, 44067.0, 94006.0, 434907.0, 273388.0, 71640.0, 36171.0, 18662.0, 10110.0, 5706.0, 3336.0, 2019.0, 1171.0, 660.0, 441.0, 291.0, 176.0, 111.0, 66.0, 42.0, 41.0, 26.0, 6.0, 9.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.33203125, -4.1868896484375, -4.041748046875, -3.8966064453125, -3.75146484375, -3.6063232421875, -3.461181640625, -3.3160400390625, -3.1708984375, -3.0257568359375, -2.880615234375, -2.7354736328125, -2.59033203125, -2.4451904296875, -2.300048828125, -2.1549072265625, -2.009765625, -1.8646240234375, -1.719482421875, -1.5743408203125, -1.42919921875, -1.2840576171875, -1.138916015625, -0.9937744140625, -0.8486328125, -0.7034912109375, -0.558349609375, -0.4132080078125, -0.26806640625, -0.1229248046875, 0.022216796875, 0.1673583984375, 0.3125, 0.4576416015625, 0.602783203125, 0.7479248046875, 0.89306640625, 1.0382080078125, 1.183349609375, 1.3284912109375, 1.4736328125, 1.6187744140625, 1.763916015625, 1.9090576171875, 2.05419921875, 2.1993408203125, 2.344482421875, 2.4896240234375, 2.634765625, 2.7799072265625, 2.925048828125, 3.0701904296875, 3.21533203125, 3.3604736328125, 3.505615234375, 3.6507568359375, 3.7958984375, 3.9410400390625, 4.086181640625, 4.2313232421875, 4.37646484375, 4.5216064453125, 4.666748046875, 4.8118896484375, 4.95703125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 11.0, 5.0, 14.0, 17.0, 20.0, 28.0, 37.0, 36.0, 26.0, 38.0, 47.0, 49.0, 57.0, 48.0, 76.0, 55.0, 53.0, 56.0, 48.0, 53.0, 36.0, 24.0, 33.0, 24.0, 25.0, 17.0, 18.0, 10.0, 9.0, 6.0, 2.0, 6.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.2933807373046875, -1.249847412109375, -1.2063140869140625, -1.16278076171875, -1.1192474365234375, -1.075714111328125, -1.0321807861328125, -0.9886474609375, -0.9451141357421875, -0.901580810546875, -0.8580474853515625, -0.81451416015625, -0.7709808349609375, -0.727447509765625, -0.6839141845703125, -0.640380859375, -0.5968475341796875, -0.553314208984375, -0.5097808837890625, -0.46624755859375, -0.4227142333984375, -0.379180908203125, -0.3356475830078125, -0.2921142578125, -0.2485809326171875, -0.205047607421875, -0.1615142822265625, -0.11798095703125, -0.0744476318359375, -0.030914306640625, 0.0126190185546875, 0.05615234375, 0.0996856689453125, 0.143218994140625, 0.1867523193359375, 0.23028564453125, 0.2738189697265625, 0.317352294921875, 0.3608856201171875, 0.4044189453125, 0.4479522705078125, 0.491485595703125, 0.5350189208984375, 0.57855224609375, 0.6220855712890625, 0.665618896484375, 0.7091522216796875, 0.752685546875, 0.7962188720703125, 0.839752197265625, 0.8832855224609375, 0.92681884765625, 0.9703521728515625, 1.013885498046875, 1.0574188232421875, 1.1009521484375, 1.1444854736328125, 1.188018798828125, 1.2315521240234375, 1.27508544921875, 1.3186187744140625, 1.362152099609375, 1.4056854248046875, 1.44921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 10.0, 18.0, 22.0, 31.0, 43.0, 58.0, 83.0, 114.0, 148.0, 236.0, 360.0, 628.0, 1104.0, 2270.0, 5277.0, 16134.0, 62089.0, 489748.0, 390035.0, 55715.0, 14584.0, 4940.0, 2131.0, 1041.0, 590.0, 349.0, 237.0, 160.0, 121.0, 65.0, 45.0, 43.0, 39.0, 20.0, 20.0, 9.0, 9.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.83984375, -7.60198974609375, -7.3641357421875, -7.12628173828125, -6.888427734375, -6.65057373046875, -6.4127197265625, -6.17486572265625, -5.93701171875, -5.69915771484375, -5.4613037109375, -5.22344970703125, -4.985595703125, -4.74774169921875, -4.5098876953125, -4.27203369140625, -4.0341796875, -3.79632568359375, -3.5584716796875, -3.32061767578125, -3.082763671875, -2.84490966796875, -2.6070556640625, -2.36920166015625, -2.13134765625, -1.89349365234375, -1.6556396484375, -1.41778564453125, -1.179931640625, -0.94207763671875, -0.7042236328125, -0.46636962890625, -0.228515625, 0.00933837890625, 0.2471923828125, 0.48504638671875, 0.722900390625, 0.96075439453125, 1.1986083984375, 1.43646240234375, 1.67431640625, 1.91217041015625, 2.1500244140625, 2.38787841796875, 2.625732421875, 2.86358642578125, 3.1014404296875, 3.33929443359375, 3.5771484375, 3.81500244140625, 4.0528564453125, 4.29071044921875, 4.528564453125, 4.76641845703125, 5.0042724609375, 5.24212646484375, 5.47998046875, 5.71783447265625, 5.9556884765625, 6.19354248046875, 6.431396484375, 6.66925048828125, 6.9071044921875, 7.14495849609375, 7.3828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 10.0, 9.0, 12.0, 25.0, 30.0, 25.0, 34.0, 48.0, 43.0, 45.0, 61.0, 49.0, 51.0, 62.0, 53.0, 60.0, 62.0, 42.0, 43.0, 41.0, 29.0, 28.0, 25.0, 22.0, 19.0, 16.0, 6.0, 9.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.578125, -7.376708984375, -7.17529296875, -6.973876953125, -6.7724609375, -6.571044921875, -6.36962890625, -6.168212890625, -5.966796875, -5.765380859375, -5.56396484375, -5.362548828125, -5.1611328125, -4.959716796875, -4.75830078125, -4.556884765625, -4.35546875, -4.154052734375, -3.95263671875, -3.751220703125, -3.5498046875, -3.348388671875, -3.14697265625, -2.945556640625, -2.744140625, -2.542724609375, -2.34130859375, -2.139892578125, -1.9384765625, -1.737060546875, -1.53564453125, -1.334228515625, -1.1328125, -0.931396484375, -0.72998046875, -0.528564453125, -0.3271484375, -0.125732421875, 0.07568359375, 0.277099609375, 0.478515625, 0.679931640625, 0.88134765625, 1.082763671875, 1.2841796875, 1.485595703125, 1.68701171875, 1.888427734375, 2.08984375, 2.291259765625, 2.49267578125, 2.694091796875, 2.8955078125, 3.096923828125, 3.29833984375, 3.499755859375, 3.701171875, 3.902587890625, 4.10400390625, 4.305419921875, 4.5068359375, 4.708251953125, 4.90966796875, 5.111083984375, 5.3125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 10.0, 21.0, 53.0, 99.0, 225.0, 690.0, 2824.0, 20814.0, 292982.0, 693325.0, 31968.0, 4204.0, 880.0, 257.0, 94.0, 54.0, 22.0, 10.0, 9.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.4788818359375, -9.223388671875, -8.9678955078125, -8.71240234375, -8.4569091796875, -8.201416015625, -7.9459228515625, -7.6904296875, -7.4349365234375, -7.179443359375, -6.9239501953125, -6.66845703125, -6.4129638671875, -6.157470703125, -5.9019775390625, -5.646484375, -5.3909912109375, -5.135498046875, -4.8800048828125, -4.62451171875, -4.3690185546875, -4.113525390625, -3.8580322265625, -3.6025390625, -3.3470458984375, -3.091552734375, -2.8360595703125, -2.58056640625, -2.3250732421875, -2.069580078125, -1.8140869140625, -1.55859375, -1.3031005859375, -1.047607421875, -0.7921142578125, -0.53662109375, -0.2811279296875, -0.025634765625, 0.2298583984375, 0.4853515625, 0.7408447265625, 0.996337890625, 1.2518310546875, 1.50732421875, 1.7628173828125, 2.018310546875, 2.2738037109375, 2.529296875, 2.7847900390625, 3.040283203125, 3.2957763671875, 3.55126953125, 3.8067626953125, 4.062255859375, 4.3177490234375, 4.5732421875, 4.8287353515625, 5.084228515625, 5.3397216796875, 5.59521484375, 5.8507080078125, 6.106201171875, 6.3616943359375, 6.6171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 16.0, 13.0, 17.0, 17.0, 30.0, 39.0, 57.0, 127.0, 232.0, 163.0, 58.0, 40.0, 28.0, 22.0, 26.0, 11.0, 16.0, 7.0, 9.0, 5.0, 3.0, 7.0, 1.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.0010013580322265625, -0.0009723901748657227, -0.0009434223175048828, -0.000914454460144043, -0.0008854866027832031, -0.0008565187454223633, -0.0008275508880615234, -0.0007985830307006836, -0.0007696151733398438, -0.0007406473159790039, -0.0007116794586181641, -0.0006827116012573242, -0.0006537437438964844, -0.0006247758865356445, -0.0005958080291748047, -0.0005668401718139648, -0.000537872314453125, -0.0005089044570922852, -0.0004799365997314453, -0.00045096874237060547, -0.0004220008850097656, -0.0003930330276489258, -0.00036406517028808594, -0.0003350973129272461, -0.00030612945556640625, -0.0002771615982055664, -0.00024819374084472656, -0.00021922588348388672, -0.00019025802612304688, -0.00016129016876220703, -0.0001323223114013672, -0.00010335445404052734, -7.43865966796875e-05, -4.5418739318847656e-05, -1.6450881958007812e-05, 1.2516975402832031e-05, 4.1484832763671875e-05, 7.045269012451172e-05, 9.942054748535156e-05, 0.0001283884048461914, 0.00015735626220703125, 0.0001863241195678711, 0.00021529197692871094, 0.0002442598342895508, 0.0002732276916503906, 0.00030219554901123047, 0.0003311634063720703, 0.00036013126373291016, 0.00038909912109375, 0.00041806697845458984, 0.0004470348358154297, 0.00047600269317626953, 0.0005049705505371094, 0.0005339384078979492, 0.0005629062652587891, 0.0005918741226196289, 0.0006208419799804688, 0.0006498098373413086, 0.0006787776947021484, 0.0007077455520629883, 0.0007367134094238281, 0.000765681266784668, 0.0007946491241455078, 0.0008236169815063477, 0.0008525848388671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 3.0, 16.0, 16.0, 6.0, 24.0, 16.0, 35.0, 44.0, 60.0, 92.0, 152.0, 222.0, 343.0, 629.0, 1311.0, 3310.0, 10156.0, 36668.0, 172462.0, 695300.0, 92612.0, 23323.0, 6921.0, 2353.0, 1027.0, 539.0, 312.0, 167.0, 123.0, 89.0, 52.0, 46.0, 31.0, 25.0, 20.0, 5.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4635009765625, -4.325439453125, -4.1873779296875, -4.04931640625, -3.9112548828125, -3.773193359375, -3.6351318359375, -3.4970703125, -3.3590087890625, -3.220947265625, -3.0828857421875, -2.94482421875, -2.8067626953125, -2.668701171875, -2.5306396484375, -2.392578125, -2.2545166015625, -2.116455078125, -1.9783935546875, -1.84033203125, -1.7022705078125, -1.564208984375, -1.4261474609375, -1.2880859375, -1.1500244140625, -1.011962890625, -0.8739013671875, -0.73583984375, -0.5977783203125, -0.459716796875, -0.3216552734375, -0.18359375, -0.0455322265625, 0.092529296875, 0.2305908203125, 0.36865234375, 0.5067138671875, 0.644775390625, 0.7828369140625, 0.9208984375, 1.0589599609375, 1.197021484375, 1.3350830078125, 1.47314453125, 1.6112060546875, 1.749267578125, 1.8873291015625, 2.025390625, 2.1634521484375, 2.301513671875, 2.4395751953125, 2.57763671875, 2.7156982421875, 2.853759765625, 2.9918212890625, 3.1298828125, 3.2679443359375, 3.406005859375, 3.5440673828125, 3.68212890625, 3.8201904296875, 3.958251953125, 4.0963134765625, 4.234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 7.0, 5.0, 10.0, 7.0, 10.0, 15.0, 16.0, 27.0, 65.0, 93.0, 194.0, 203.0, 131.0, 60.0, 34.0, 22.0, 29.0, 19.0, 11.0, 7.0, 8.0, 7.0, 6.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.6912841796875, -3.550537109375, -3.4097900390625, -3.26904296875, -3.1282958984375, -2.987548828125, -2.8468017578125, -2.7060546875, -2.5653076171875, -2.424560546875, -2.2838134765625, -2.14306640625, -2.0023193359375, -1.861572265625, -1.7208251953125, -1.580078125, -1.4393310546875, -1.298583984375, -1.1578369140625, -1.01708984375, -0.8763427734375, -0.735595703125, -0.5948486328125, -0.4541015625, -0.3133544921875, -0.172607421875, -0.0318603515625, 0.10888671875, 0.2496337890625, 0.390380859375, 0.5311279296875, 0.671875, 0.8126220703125, 0.953369140625, 1.0941162109375, 1.23486328125, 1.3756103515625, 1.516357421875, 1.6571044921875, 1.7978515625, 1.9385986328125, 2.079345703125, 2.2200927734375, 2.36083984375, 2.5015869140625, 2.642333984375, 2.7830810546875, 2.923828125, 3.0645751953125, 3.205322265625, 3.3460693359375, 3.48681640625, 3.6275634765625, 3.768310546875, 3.9090576171875, 4.0498046875, 4.1905517578125, 4.331298828125, 4.4720458984375, 4.61279296875, 4.7535400390625, 4.894287109375, 5.0350341796875, 5.17578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 22.0, 41.0, 79.0, 130.0, 159.0, 187.0, 162.0, 115.0, 46.0, 40.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.07857131958008, -45.9244384765625, -43.77030944824219, -41.61617660522461, -39.46204376220703, -37.30791473388672, -35.15378189086914, -32.99964904785156, -30.845518112182617, -28.691387176513672, -26.537254333496094, -24.38312339782715, -22.228992462158203, -20.074859619140625, -17.92072868347168, -15.766596794128418, -13.612464904785156, -11.458333015441895, -9.304201126098633, -7.1500701904296875, -4.995938301086426, -2.841806411743164, -0.6876754760742188, 1.466456413269043, 3.6205883026123047, 5.774720191955566, 7.92885160446167, 10.082983016967773, 12.237114906311035, 14.391246795654297, 16.545377731323242, 18.699508666992188, 20.8536376953125, 23.007768630981445, 25.161901473999023, 27.31603240966797, 29.470165252685547, 31.624296188354492, 33.77842712402344, 35.932559967041016, 38.086692810058594, 40.24082565307617, 42.394954681396484, 44.54908752441406, 46.70322036743164, 48.85735321044922, 51.01148223876953, 53.16561508178711, 55.31974411010742, 57.473876953125, 59.62800598144531, 61.78213882446289, 63.93627166748047, 66.09040069580078, 68.24453735351562, 70.39866638183594, 72.55279541015625, 74.70692443847656, 76.8610610961914, 79.01519012451172, 81.16931915283203, 83.32345581054688, 85.47758483886719, 87.6317138671875, 89.78585052490234]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 12.0, 9.0, 11.0, 12.0, 20.0, 16.0, 17.0, 31.0, 21.0, 18.0, 25.0, 23.0, 24.0, 29.0, 30.0, 39.0, 30.0, 39.0, 34.0, 42.0, 27.0, 34.0, 37.0, 32.0, 37.0, 29.0, 36.0, 29.0, 32.0, 27.0, 30.0, 29.0, 26.0, 11.0, 13.0, 11.0, 16.0, 10.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-25.554346084594727, -24.79286003112793, -24.031373977661133, -23.269886016845703, -22.508399963378906, -21.74691390991211, -20.985427856445312, -20.223941802978516, -19.46245574951172, -18.700969696044922, -17.939483642578125, -17.177997589111328, -16.4165096282959, -15.655023574829102, -14.893537521362305, -14.132051467895508, -13.370563507080078, -12.609077453613281, -11.847590446472168, -11.086104393005371, -10.324617385864258, -9.563131332397461, -8.801645278930664, -8.040159225463867, -7.278672218322754, -6.517185688018799, -5.755699157714844, -4.994213104248047, -4.232726573944092, -3.4712400436401367, -2.70975399017334, -1.9482674598693848, -1.1867828369140625, -0.425296425819397, 0.33618998527526855, 1.0976762771606445, 1.8591628074645996, 2.6206493377685547, 3.3821353912353516, 4.143621921539307, 4.905108451843262, 5.666594982147217, 6.428081512451172, 7.189567565917969, 7.951054096221924, 8.712540626525879, 9.474026679992676, 10.235513687133789, 10.996999740600586, 11.758485794067383, 12.519972801208496, 13.281458854675293, 14.042945861816406, 14.804431915283203, 15.56591796875, 16.327404022216797, 17.088890075683594, 17.85037612915039, 18.611862182617188, 19.373348236083984, 20.134836196899414, 20.89632225036621, 21.657808303833008, 22.419294357299805, 23.180782318115234]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 9.0, 9.0, 10.0, 9.0, 13.0, 19.0, 23.0, 41.0, 70.0, 89.0, 120.0, 209.0, 418.0, 1017.0, 2389.0, 6743.0, 25553.0, 180190.0, 3743521.0, 196504.0, 26271.0, 6753.0, 2232.0, 959.0, 435.0, 232.0, 142.0, 79.0, 61.0, 39.0, 29.0, 27.0, 22.0, 12.0, 5.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.35516357421875, -7.0423583984375, -6.72955322265625, -6.416748046875, -6.10394287109375, -5.7911376953125, -5.47833251953125, -5.16552734375, -4.85272216796875, -4.5399169921875, -4.22711181640625, -3.914306640625, -3.60150146484375, -3.2886962890625, -2.97589111328125, -2.6630859375, -2.35028076171875, -2.0374755859375, -1.72467041015625, -1.411865234375, -1.09906005859375, -0.7862548828125, -0.47344970703125, -0.16064453125, 0.15216064453125, 0.4649658203125, 0.77777099609375, 1.090576171875, 1.40338134765625, 1.7161865234375, 2.02899169921875, 2.341796875, 2.65460205078125, 2.9674072265625, 3.28021240234375, 3.593017578125, 3.90582275390625, 4.2186279296875, 4.53143310546875, 4.84423828125, 5.15704345703125, 5.4698486328125, 5.78265380859375, 6.095458984375, 6.40826416015625, 6.7210693359375, 7.03387451171875, 7.3466796875, 7.65948486328125, 7.9722900390625, 8.28509521484375, 8.597900390625, 8.91070556640625, 9.2235107421875, 9.53631591796875, 9.84912109375, 10.16192626953125, 10.4747314453125, 10.78753662109375, 11.100341796875, 11.41314697265625, 11.7259521484375, 12.03875732421875, 12.3515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 7.0, 10.0, 14.0, 15.0, 22.0, 18.0, 28.0, 39.0, 40.0, 36.0, 60.0, 48.0, 50.0, 51.0, 43.0, 51.0, 62.0, 54.0, 63.0, 50.0, 49.0, 17.0, 26.0, 34.0, 27.0, 14.0, 16.0, 12.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.5589752197265625, -1.508575439453125, -1.4581756591796875, -1.40777587890625, -1.3573760986328125, -1.306976318359375, -1.2565765380859375, -1.2061767578125, -1.1557769775390625, -1.105377197265625, -1.0549774169921875, -1.00457763671875, -0.9541778564453125, -0.903778076171875, -0.8533782958984375, -0.802978515625, -0.7525787353515625, -0.702178955078125, -0.6517791748046875, -0.60137939453125, -0.5509796142578125, -0.500579833984375, -0.4501800537109375, -0.3997802734375, -0.3493804931640625, -0.298980712890625, -0.2485809326171875, -0.19818115234375, -0.1477813720703125, -0.097381591796875, -0.0469818115234375, 0.00341796875, 0.0538177490234375, 0.104217529296875, 0.1546173095703125, 0.20501708984375, 0.2554168701171875, 0.305816650390625, 0.3562164306640625, 0.4066162109375, 0.4570159912109375, 0.507415771484375, 0.5578155517578125, 0.60821533203125, 0.6586151123046875, 0.709014892578125, 0.7594146728515625, 0.809814453125, 0.8602142333984375, 0.910614013671875, 0.9610137939453125, 1.01141357421875, 1.0618133544921875, 1.112213134765625, 1.1626129150390625, 1.2130126953125, 1.2634124755859375, 1.313812255859375, 1.3642120361328125, 1.41461181640625, 1.4650115966796875, 1.515411376953125, 1.5658111572265625, 1.6162109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 10.0, 4.0, 7.0, 9.0, 25.0, 27.0, 55.0, 74.0, 131.0, 189.0, 342.0, 522.0, 935.0, 1776.0, 3676.0, 8037.0, 20882.0, 71231.0, 454432.0, 3271436.0, 276763.0, 53406.0, 16799.0, 6741.0, 3117.0, 1587.0, 855.0, 474.0, 292.0, 185.0, 78.0, 70.0, 33.0, 24.0, 17.0, 19.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5859375, -7.3653564453125, -7.144775390625, -6.9241943359375, -6.70361328125, -6.4830322265625, -6.262451171875, -6.0418701171875, -5.8212890625, -5.6007080078125, -5.380126953125, -5.1595458984375, -4.93896484375, -4.7183837890625, -4.497802734375, -4.2772216796875, -4.056640625, -3.8360595703125, -3.615478515625, -3.3948974609375, -3.17431640625, -2.9537353515625, -2.733154296875, -2.5125732421875, -2.2919921875, -2.0714111328125, -1.850830078125, -1.6302490234375, -1.40966796875, -1.1890869140625, -0.968505859375, -0.7479248046875, -0.52734375, -0.3067626953125, -0.086181640625, 0.1343994140625, 0.35498046875, 0.5755615234375, 0.796142578125, 1.0167236328125, 1.2373046875, 1.4578857421875, 1.678466796875, 1.8990478515625, 2.11962890625, 2.3402099609375, 2.560791015625, 2.7813720703125, 3.001953125, 3.2225341796875, 3.443115234375, 3.6636962890625, 3.88427734375, 4.1048583984375, 4.325439453125, 4.5460205078125, 4.7666015625, 4.9871826171875, 5.207763671875, 5.4283447265625, 5.64892578125, 5.8695068359375, 6.090087890625, 6.3106689453125, 6.53125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 2.0, 8.0, 7.0, 11.0, 12.0, 20.0, 24.0, 50.0, 70.0, 93.0, 186.0, 358.0, 1136.0, 1180.0, 346.0, 187.0, 109.0, 81.0, 47.0, 40.0, 25.0, 23.0, 12.0, 10.0, 10.0, 7.0, 2.0, 0.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.50146484375, -2.4013671875, -2.30126953125, -2.201171875, -2.10107421875, -2.0009765625, -1.90087890625, -1.80078125, -1.70068359375, -1.6005859375, -1.50048828125, -1.400390625, -1.30029296875, -1.2001953125, -1.10009765625, -1.0, -0.89990234375, -0.7998046875, -0.69970703125, -0.599609375, -0.49951171875, -0.3994140625, -0.29931640625, -0.19921875, -0.09912109375, 0.0009765625, 0.10107421875, 0.201171875, 0.30126953125, 0.4013671875, 0.50146484375, 0.6015625, 0.70166015625, 0.8017578125, 0.90185546875, 1.001953125, 1.10205078125, 1.2021484375, 1.30224609375, 1.40234375, 1.50244140625, 1.6025390625, 1.70263671875, 1.802734375, 1.90283203125, 2.0029296875, 2.10302734375, 2.203125, 2.30322265625, 2.4033203125, 2.50341796875, 2.603515625, 2.70361328125, 2.8037109375, 2.90380859375, 3.00390625, 3.10400390625, 3.2041015625, 3.30419921875, 3.404296875, 3.50439453125, 3.6044921875, 3.70458984375, 3.8046875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 16.0, 28.0, 45.0, 76.0, 103.0, 121.0, 142.0, 118.0, 133.0, 75.0, 63.0, 20.0, 24.0, 7.0, 9.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.569719314575195, -12.874899864196777, -12.18008041381836, -11.485260963439941, -10.790441513061523, -10.095622062683105, -9.400802612304688, -8.705982208251953, -8.011163711547852, -7.316344261169434, -6.621524810791016, -5.926705360412598, -5.23188591003418, -4.537066459655762, -3.8422465324401855, -3.1474270820617676, -2.4526071548461914, -1.7577877044677734, -1.062968134880066, -0.3681485652923584, 0.32667088508605957, 1.0214903354644775, 1.7163100242614746, 2.4111294746398926, 3.1059489250183105, 3.8007683753967285, 4.4955878257751465, 5.190407752990723, 5.885227203369141, 6.580046653747559, 7.274866104125977, 7.9696855545043945, 8.664505004882812, 9.35932445526123, 10.054143905639648, 10.748963356018066, 11.443782806396484, 12.138602256774902, 12.83342170715332, 13.528242111206055, 14.223060607910156, 14.917880058288574, 15.612699508666992, 16.307519912719727, 17.002338409423828, 17.697158813476562, 18.391977310180664, 19.0867977142334, 19.7816162109375, 20.476436614990234, 21.171255111694336, 21.86607551574707, 22.560894012451172, 23.255714416503906, 23.950532913208008, 24.645353317260742, 25.340173721313477, 26.03499412536621, 26.729812622070312, 27.424633026123047, 28.11945152282715, 28.814271926879883, 29.509090423583984, 30.20391082763672, 30.89872932434082]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 9.0, 14.0, 8.0, 24.0, 14.0, 21.0, 23.0, 26.0, 23.0, 25.0, 39.0, 40.0, 47.0, 36.0, 43.0, 37.0, 38.0, 46.0, 39.0, 36.0, 33.0, 38.0, 35.0, 38.0, 33.0, 33.0, 26.0, 19.0, 23.0, 20.0, 11.0, 22.0, 11.0, 9.0, 10.0, 9.0, 11.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.839078903198242, -9.54525375366211, -9.25142765045166, -8.957601547241211, -8.663776397705078, -8.369951248168945, -8.076125144958496, -7.782299518585205, -7.488473892211914, -7.194648265838623, -6.900822639465332, -6.606997013092041, -6.31317138671875, -6.019345760345459, -5.725520133972168, -5.431694507598877, -5.137868881225586, -4.844043254852295, -4.550217628479004, -4.256392002105713, -3.962566375732422, -3.668740749359131, -3.37491512298584, -3.081089496612549, -2.787263870239258, -2.493438243865967, -2.199612617492676, -1.9057869911193848, -1.6119613647460938, -1.3181357383728027, -1.0243101119995117, -0.7304844856262207, -0.4366588592529297, -0.14283323287963867, 0.15099239349365234, 0.44481801986694336, 0.7386436462402344, 1.0324692726135254, 1.3262948989868164, 1.6201205253601074, 1.9139461517333984, 2.2077717781066895, 2.5015974044799805, 2.7954230308532715, 3.0892486572265625, 3.3830742835998535, 3.6768999099731445, 3.9707255363464355, 4.264551162719727, 4.558376789093018, 4.852202415466309, 5.1460280418396, 5.439853668212891, 5.733679294586182, 6.027504920959473, 6.321330547332764, 6.615156173706055, 6.908981800079346, 7.202807426452637, 7.496633052825928, 7.790458679199219, 8.084283828735352, 8.3781099319458, 8.67193603515625, 8.965761184692383]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 10.0, 8.0, 21.0, 24.0, 30.0, 53.0, 62.0, 115.0, 219.0, 404.0, 820.0, 1720.0, 4001.0, 9879.0, 23328.0, 59445.0, 399412.0, 442851.0, 63518.0, 24581.0, 10277.0, 4250.0, 1775.0, 829.0, 395.0, 200.0, 120.0, 63.0, 53.0, 31.0, 14.0, 18.0, 15.0, 6.0, 10.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.729736328125, -6.53759765625, -6.345458984375, -6.1533203125, -5.961181640625, -5.76904296875, -5.576904296875, -5.384765625, -5.192626953125, -5.00048828125, -4.808349609375, -4.6162109375, -4.424072265625, -4.23193359375, -4.039794921875, -3.84765625, -3.655517578125, -3.46337890625, -3.271240234375, -3.0791015625, -2.886962890625, -2.69482421875, -2.502685546875, -2.310546875, -2.118408203125, -1.92626953125, -1.734130859375, -1.5419921875, -1.349853515625, -1.15771484375, -0.965576171875, -0.7734375, -0.581298828125, -0.38916015625, -0.197021484375, -0.0048828125, 0.187255859375, 0.37939453125, 0.571533203125, 0.763671875, 0.955810546875, 1.14794921875, 1.340087890625, 1.5322265625, 1.724365234375, 1.91650390625, 2.108642578125, 2.30078125, 2.492919921875, 2.68505859375, 2.877197265625, 3.0693359375, 3.261474609375, 3.45361328125, 3.645751953125, 3.837890625, 4.030029296875, 4.22216796875, 4.414306640625, 4.6064453125, 4.798583984375, 4.99072265625, 5.182861328125, 5.375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 9.0, 8.0, 16.0, 21.0, 30.0, 24.0, 37.0, 29.0, 34.0, 49.0, 44.0, 46.0, 51.0, 44.0, 57.0, 57.0, 56.0, 56.0, 58.0, 37.0, 29.0, 35.0, 31.0, 30.0, 20.0, 16.0, 19.0, 18.0, 8.0, 7.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6572265625, -1.604705810546875, -1.55218505859375, -1.499664306640625, -1.4471435546875, -1.394622802734375, -1.34210205078125, -1.289581298828125, -1.237060546875, -1.184539794921875, -1.13201904296875, -1.079498291015625, -1.0269775390625, -0.974456787109375, -0.92193603515625, -0.869415283203125, -0.81689453125, -0.764373779296875, -0.71185302734375, -0.659332275390625, -0.6068115234375, -0.554290771484375, -0.50177001953125, -0.449249267578125, -0.396728515625, -0.344207763671875, -0.29168701171875, -0.239166259765625, -0.1866455078125, -0.134124755859375, -0.08160400390625, -0.029083251953125, 0.0234375, 0.075958251953125, 0.12847900390625, 0.180999755859375, 0.2335205078125, 0.286041259765625, 0.33856201171875, 0.391082763671875, 0.443603515625, 0.496124267578125, 0.54864501953125, 0.601165771484375, 0.6536865234375, 0.706207275390625, 0.75872802734375, 0.811248779296875, 0.86376953125, 0.916290283203125, 0.96881103515625, 1.021331787109375, 1.0738525390625, 1.126373291015625, 1.17889404296875, 1.231414794921875, 1.283935546875, 1.336456298828125, 1.38897705078125, 1.441497802734375, 1.4940185546875, 1.546539306640625, 1.59906005859375, 1.651580810546875, 1.7041015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 8.0, 6.0, 18.0, 31.0, 35.0, 59.0, 89.0, 134.0, 254.0, 456.0, 926.0, 1891.0, 4102.0, 10250.0, 25501.0, 66016.0, 720412.0, 154520.0, 37661.0, 14751.0, 6123.0, 2628.0, 1159.0, 620.0, 349.0, 186.0, 113.0, 66.0, 42.0, 29.0, 26.0, 20.0, 17.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0234375, -7.78546142578125, -7.5474853515625, -7.30950927734375, -7.071533203125, -6.83355712890625, -6.5955810546875, -6.35760498046875, -6.11962890625, -5.88165283203125, -5.6436767578125, -5.40570068359375, -5.167724609375, -4.92974853515625, -4.6917724609375, -4.45379638671875, -4.2158203125, -3.97784423828125, -3.7398681640625, -3.50189208984375, -3.263916015625, -3.02593994140625, -2.7879638671875, -2.54998779296875, -2.31201171875, -2.07403564453125, -1.8360595703125, -1.59808349609375, -1.360107421875, -1.12213134765625, -0.8841552734375, -0.64617919921875, -0.408203125, -0.17022705078125, 0.0677490234375, 0.30572509765625, 0.543701171875, 0.78167724609375, 1.0196533203125, 1.25762939453125, 1.49560546875, 1.73358154296875, 1.9715576171875, 2.20953369140625, 2.447509765625, 2.68548583984375, 2.9234619140625, 3.16143798828125, 3.3994140625, 3.63739013671875, 3.8753662109375, 4.11334228515625, 4.351318359375, 4.58929443359375, 4.8272705078125, 5.06524658203125, 5.30322265625, 5.54119873046875, 5.7791748046875, 6.01715087890625, 6.255126953125, 6.49310302734375, 6.7310791015625, 6.96905517578125, 7.20703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 12.0, 19.0, 20.0, 43.0, 43.0, 68.0, 52.0, 68.0, 67.0, 75.0, 75.0, 59.0, 76.0, 42.0, 49.0, 37.0, 32.0, 25.0, 26.0, 12.0, 11.0, 16.0, 9.0, 7.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.3203125, -10.024658203125, -9.72900390625, -9.433349609375, -9.1376953125, -8.842041015625, -8.54638671875, -8.250732421875, -7.955078125, -7.659423828125, -7.36376953125, -7.068115234375, -6.7724609375, -6.476806640625, -6.18115234375, -5.885498046875, -5.58984375, -5.294189453125, -4.99853515625, -4.702880859375, -4.4072265625, -4.111572265625, -3.81591796875, -3.520263671875, -3.224609375, -2.928955078125, -2.63330078125, -2.337646484375, -2.0419921875, -1.746337890625, -1.45068359375, -1.155029296875, -0.859375, -0.563720703125, -0.26806640625, 0.027587890625, 0.3232421875, 0.618896484375, 0.91455078125, 1.210205078125, 1.505859375, 1.801513671875, 2.09716796875, 2.392822265625, 2.6884765625, 2.984130859375, 3.27978515625, 3.575439453125, 3.87109375, 4.166748046875, 4.46240234375, 4.758056640625, 5.0537109375, 5.349365234375, 5.64501953125, 5.940673828125, 6.236328125, 6.531982421875, 6.82763671875, 7.123291015625, 7.4189453125, 7.714599609375, 8.01025390625, 8.305908203125, 8.6015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 6.0, 9.0, 15.0, 20.0, 26.0, 26.0, 38.0, 61.0, 78.0, 112.0, 168.0, 216.0, 334.0, 482.0, 713.0, 1087.0, 1731.0, 2999.0, 5205.0, 9397.0, 18159.0, 38319.0, 116443.0, 643943.0, 127054.0, 39631.0, 18934.0, 9674.0, 5306.0, 3134.0, 1788.0, 1094.0, 744.0, 519.0, 319.0, 226.0, 170.0, 92.0, 81.0, 51.0, 35.0, 26.0, 20.0, 15.0, 13.0, 6.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-3.033203125, -2.942718505859375, -2.85223388671875, -2.761749267578125, -2.6712646484375, -2.580780029296875, -2.49029541015625, -2.399810791015625, -2.309326171875, -2.218841552734375, -2.12835693359375, -2.037872314453125, -1.9473876953125, -1.856903076171875, -1.76641845703125, -1.675933837890625, -1.58544921875, -1.494964599609375, -1.40447998046875, -1.313995361328125, -1.2235107421875, -1.133026123046875, -1.04254150390625, -0.952056884765625, -0.861572265625, -0.771087646484375, -0.68060302734375, -0.590118408203125, -0.4996337890625, -0.409149169921875, -0.31866455078125, -0.228179931640625, -0.1376953125, -0.047210693359375, 0.04327392578125, 0.133758544921875, 0.2242431640625, 0.314727783203125, 0.40521240234375, 0.495697021484375, 0.586181640625, 0.676666259765625, 0.76715087890625, 0.857635498046875, 0.9481201171875, 1.038604736328125, 1.12908935546875, 1.219573974609375, 1.31005859375, 1.400543212890625, 1.49102783203125, 1.581512451171875, 1.6719970703125, 1.762481689453125, 1.85296630859375, 1.943450927734375, 2.033935546875, 2.124420166015625, 2.21490478515625, 2.305389404296875, 2.3958740234375, 2.486358642578125, 2.57684326171875, 2.667327880859375, 2.7578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 2.0, 6.0, 11.0, 3.0, 13.0, 15.0, 15.0, 16.0, 24.0, 66.0, 280.0, 345.0, 76.0, 24.0, 20.0, 14.0, 13.0, 16.0, 6.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0019063949584960938, -0.0018620938062667847, -0.0018177926540374756, -0.0017734915018081665, -0.0017291903495788574, -0.0016848891973495483, -0.0016405880451202393, -0.0015962868928909302, -0.001551985740661621, -0.001507684588432312, -0.001463383436203003, -0.0014190822839736938, -0.0013747811317443848, -0.0013304799795150757, -0.0012861788272857666, -0.0012418776750564575, -0.0011975765228271484, -0.0011532753705978394, -0.0011089742183685303, -0.0010646730661392212, -0.0010203719139099121, -0.000976070761680603, -0.0009317696094512939, -0.0008874684572219849, -0.0008431673049926758, -0.0007988661527633667, -0.0007545650005340576, -0.0007102638483047485, -0.0006659626960754395, -0.0006216615438461304, -0.0005773603916168213, -0.0005330592393875122, -0.0004887580871582031, -0.00044445693492889404, -0.00040015578269958496, -0.0003558546304702759, -0.0003115534782409668, -0.0002672523260116577, -0.00022295117378234863, -0.00017865002155303955, -0.00013434886932373047, -9.004771709442139e-05, -4.5746564865112305e-05, -1.4454126358032227e-06, 4.285573959350586e-05, 8.715689182281494e-05, 0.00013145804405212402, 0.0001757591962814331, 0.0002200603485107422, 0.00026436150074005127, 0.00030866265296936035, 0.00035296380519866943, 0.0003972649574279785, 0.0004415661096572876, 0.0004858672618865967, 0.0005301684141159058, 0.0005744695663452148, 0.0006187707185745239, 0.000663071870803833, 0.0007073730230331421, 0.0007516741752624512, 0.0007959753274917603, 0.0008402764797210693, 0.0008845776319503784, 0.0009288787841796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 10.0, 17.0, 32.0, 57.0, 65.0, 162.0, 290.0, 552.0, 1392.0, 3543.0, 10407.0, 33919.0, 228753.0, 685766.0, 58730.0, 15759.0, 5456.0, 1954.0, 851.0, 380.0, 173.0, 118.0, 57.0, 27.0, 24.0, 14.0, 9.0, 12.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.328125, -4.1689453125, -4.009765625, -3.8505859375, -3.69140625, -3.5322265625, -3.373046875, -3.2138671875, -3.0546875, -2.8955078125, -2.736328125, -2.5771484375, -2.41796875, -2.2587890625, -2.099609375, -1.9404296875, -1.78125, -1.6220703125, -1.462890625, -1.3037109375, -1.14453125, -0.9853515625, -0.826171875, -0.6669921875, -0.5078125, -0.3486328125, -0.189453125, -0.0302734375, 0.12890625, 0.2880859375, 0.447265625, 0.6064453125, 0.765625, 0.9248046875, 1.083984375, 1.2431640625, 1.40234375, 1.5615234375, 1.720703125, 1.8798828125, 2.0390625, 2.1982421875, 2.357421875, 2.5166015625, 2.67578125, 2.8349609375, 2.994140625, 3.1533203125, 3.3125, 3.4716796875, 3.630859375, 3.7900390625, 3.94921875, 4.1083984375, 4.267578125, 4.4267578125, 4.5859375, 4.7451171875, 4.904296875, 5.0634765625, 5.22265625, 5.3818359375, 5.541015625, 5.7001953125, 5.859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 5.0, 5.0, 10.0, 14.0, 3.0, 20.0, 24.0, 33.0, 46.0, 92.0, 147.0, 201.0, 160.0, 73.0, 45.0, 24.0, 16.0, 12.0, 11.0, 12.0, 9.0, 4.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.533294677734375, -3.40447998046875, -3.275665283203125, -3.1468505859375, -3.018035888671875, -2.88922119140625, -2.760406494140625, -2.631591796875, -2.502777099609375, -2.37396240234375, -2.245147705078125, -2.1163330078125, -1.987518310546875, -1.85870361328125, -1.729888916015625, -1.60107421875, -1.472259521484375, -1.34344482421875, -1.214630126953125, -1.0858154296875, -0.957000732421875, -0.82818603515625, -0.699371337890625, -0.570556640625, -0.441741943359375, -0.31292724609375, -0.184112548828125, -0.0552978515625, 0.073516845703125, 0.20233154296875, 0.331146240234375, 0.4599609375, 0.588775634765625, 0.71759033203125, 0.846405029296875, 0.9752197265625, 1.104034423828125, 1.23284912109375, 1.361663818359375, 1.490478515625, 1.619293212890625, 1.74810791015625, 1.876922607421875, 2.0057373046875, 2.134552001953125, 2.26336669921875, 2.392181396484375, 2.52099609375, 2.649810791015625, 2.77862548828125, 2.907440185546875, 3.0362548828125, 3.165069580078125, 3.29388427734375, 3.422698974609375, 3.551513671875, 3.680328369140625, 3.80914306640625, 3.937957763671875, 4.0667724609375, 4.195587158203125, 4.32440185546875, 4.453216552734375, 4.58203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 23.0, 59.0, 138.0, 262.0, 284.0, 160.0, 60.0, 12.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.45588684082031, -34.62067413330078, -30.785459518432617, -26.950246810913086, -23.115032196044922, -19.27981948852539, -15.44460678100586, -11.609392166137695, -7.774179458618164, -3.9389660358428955, -0.10375261306762695, 3.7314605712890625, 7.56667423248291, 11.401887893676758, 15.237100601196289, 19.072315216064453, 22.907527923583984, 26.742740631103516, 30.57795524597168, 34.413169860839844, 38.248382568359375, 42.083595275878906, 45.91880798339844, 49.75402069091797, 53.5892333984375, 57.42444610595703, 61.25965881347656, 65.0948715209961, 68.93008422851562, 72.76530456542969, 76.60050964355469, 80.43572998046875, 84.27094268798828, 88.10615539550781, 91.94136810302734, 95.77658081054688, 99.6117935180664, 103.44700622558594, 107.2822265625, 111.11743927001953, 114.95265197753906, 118.7878646850586, 122.62307739257812, 126.45829010009766, 130.2935028076172, 134.12872314453125, 137.96392822265625, 141.7991485595703, 145.6343536376953, 149.46957397460938, 153.30477905273438, 157.13999938964844, 160.97520446777344, 164.8104248046875, 168.6456298828125, 172.48085021972656, 176.31607055664062, 180.1512908935547, 183.9864959716797, 187.82171630859375, 191.65692138671875, 195.4921417236328, 199.3273468017578, 203.16256713867188, 206.99777221679688]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 10.0, 5.0, 10.0, 7.0, 7.0, 7.0, 19.0, 10.0, 8.0, 12.0, 12.0, 13.0, 22.0, 26.0, 30.0, 35.0, 35.0, 29.0, 29.0, 39.0, 25.0, 26.0, 35.0, 42.0, 48.0, 33.0, 33.0, 34.0, 29.0, 38.0, 53.0, 28.0, 34.0, 33.0, 12.0, 11.0, 18.0, 13.0, 16.0, 11.0, 8.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.71368408203125, -24.88907241821289, -24.064462661743164, -23.239850997924805, -22.415241241455078, -21.59062957763672, -20.766019821166992, -19.941408157348633, -19.116798400878906, -18.292186737060547, -17.46757698059082, -16.64296531677246, -15.818355560302734, -14.993743896484375, -14.169134140014648, -13.344522476196289, -12.519911766052246, -11.695301055908203, -10.87069034576416, -10.046079635620117, -9.221468925476074, -8.396858215332031, -7.57224702835083, -6.747636318206787, -5.923025608062744, -5.098414897918701, -4.273804187774658, -3.449193239212036, -2.624582529067993, -1.799971580505371, -0.9753608703613281, -0.15075016021728516, 0.6738605499267578, 1.4984712600708008, 2.3230819702148438, 3.147692918777466, 3.972303628921509, 4.796914577484131, 5.621525287628174, 6.446135997772217, 7.27074670791626, 8.095357894897461, 8.919968605041504, 9.744579315185547, 10.56919002532959, 11.393800735473633, 12.218411445617676, 13.043022155761719, 13.867632865905762, 14.692243576049805, 15.516854286193848, 16.34146499633789, 17.16607666015625, 17.990686416625977, 18.815298080444336, 19.639907836914062, 20.464519500732422, 21.28913116455078, 22.113740921020508, 22.938352584838867, 23.762962341308594, 24.587574005126953, 25.41218376159668, 26.23679542541504, 27.061405181884766]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 13.0, 10.0, 25.0, 27.0, 38.0, 64.0, 107.0, 173.0, 272.0, 544.0, 1066.0, 2214.0, 4871.0, 11897.0, 33475.0, 135461.0, 3429409.0, 475126.0, 64935.0, 20005.0, 7695.0, 3312.0, 1580.0, 784.0, 432.0, 271.0, 143.0, 104.0, 60.0, 39.0, 30.0, 21.0, 16.0, 15.0, 6.0, 11.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.8150634765625, -8.528564453125, -8.2420654296875, -7.95556640625, -7.6690673828125, -7.382568359375, -7.0960693359375, -6.8095703125, -6.5230712890625, -6.236572265625, -5.9500732421875, -5.66357421875, -5.3770751953125, -5.090576171875, -4.8040771484375, -4.517578125, -4.2310791015625, -3.944580078125, -3.6580810546875, -3.37158203125, -3.0850830078125, -2.798583984375, -2.5120849609375, -2.2255859375, -1.9390869140625, -1.652587890625, -1.3660888671875, -1.07958984375, -0.7930908203125, -0.506591796875, -0.2200927734375, 0.06640625, 0.3529052734375, 0.639404296875, 0.9259033203125, 1.21240234375, 1.4989013671875, 1.785400390625, 2.0718994140625, 2.3583984375, 2.6448974609375, 2.931396484375, 3.2178955078125, 3.50439453125, 3.7908935546875, 4.077392578125, 4.3638916015625, 4.650390625, 4.9368896484375, 5.223388671875, 5.5098876953125, 5.79638671875, 6.0828857421875, 6.369384765625, 6.6558837890625, 6.9423828125, 7.2288818359375, 7.515380859375, 7.8018798828125, 8.08837890625, 8.3748779296875, 8.661376953125, 8.9478759765625, 9.234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 11.0, 5.0, 17.0, 14.0, 15.0, 21.0, 19.0, 25.0, 40.0, 39.0, 38.0, 34.0, 47.0, 55.0, 37.0, 48.0, 50.0, 41.0, 48.0, 47.0, 42.0, 46.0, 46.0, 31.0, 28.0, 29.0, 22.0, 17.0, 12.0, 15.0, 11.0, 8.0, 8.0, 12.0, 5.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5654296875, -1.5124664306640625, -1.459503173828125, -1.4065399169921875, -1.35357666015625, -1.3006134033203125, -1.247650146484375, -1.1946868896484375, -1.1417236328125, -1.0887603759765625, -1.035797119140625, -0.9828338623046875, -0.92987060546875, -0.8769073486328125, -0.823944091796875, -0.7709808349609375, -0.718017578125, -0.6650543212890625, -0.612091064453125, -0.5591278076171875, -0.50616455078125, -0.4532012939453125, -0.400238037109375, -0.3472747802734375, -0.2943115234375, -0.2413482666015625, -0.188385009765625, -0.1354217529296875, -0.08245849609375, -0.0294952392578125, 0.023468017578125, 0.0764312744140625, 0.12939453125, 0.1823577880859375, 0.235321044921875, 0.2882843017578125, 0.34124755859375, 0.3942108154296875, 0.447174072265625, 0.5001373291015625, 0.5531005859375, 0.6060638427734375, 0.659027099609375, 0.7119903564453125, 0.76495361328125, 0.8179168701171875, 0.870880126953125, 0.9238433837890625, 0.976806640625, 1.0297698974609375, 1.082733154296875, 1.1356964111328125, 1.18865966796875, 1.2416229248046875, 1.294586181640625, 1.3475494384765625, 1.4005126953125, 1.4534759521484375, 1.506439208984375, 1.5594024658203125, 1.61236572265625, 1.6653289794921875, 1.718292236328125, 1.7712554931640625, 1.82421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 11.0, 8.0, 11.0, 13.0, 20.0, 32.0, 32.0, 37.0, 43.0, 72.0, 98.0, 142.0, 236.0, 332.0, 499.0, 724.0, 1122.0, 1777.0, 3115.0, 5851.0, 12838.0, 31363.0, 97560.0, 632371.0, 3129995.0, 189328.0, 49574.0, 18446.0, 8028.0, 4150.0, 2301.0, 1319.0, 916.0, 581.0, 402.0, 251.0, 184.0, 153.0, 100.0, 72.0, 47.0, 29.0, 31.0, 20.0, 12.0, 11.0, 9.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.803955078125, -8.52197265625, -8.239990234375, -7.9580078125, -7.676025390625, -7.39404296875, -7.112060546875, -6.830078125, -6.548095703125, -6.26611328125, -5.984130859375, -5.7021484375, -5.420166015625, -5.13818359375, -4.856201171875, -4.57421875, -4.292236328125, -4.01025390625, -3.728271484375, -3.4462890625, -3.164306640625, -2.88232421875, -2.600341796875, -2.318359375, -2.036376953125, -1.75439453125, -1.472412109375, -1.1904296875, -0.908447265625, -0.62646484375, -0.344482421875, -0.0625, 0.219482421875, 0.50146484375, 0.783447265625, 1.0654296875, 1.347412109375, 1.62939453125, 1.911376953125, 2.193359375, 2.475341796875, 2.75732421875, 3.039306640625, 3.3212890625, 3.603271484375, 3.88525390625, 4.167236328125, 4.44921875, 4.731201171875, 5.01318359375, 5.295166015625, 5.5771484375, 5.859130859375, 6.14111328125, 6.423095703125, 6.705078125, 6.987060546875, 7.26904296875, 7.551025390625, 7.8330078125, 8.114990234375, 8.39697265625, 8.678955078125, 8.9609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 10.0, 10.0, 4.0, 9.0, 23.0, 33.0, 52.0, 51.0, 101.0, 209.0, 561.0, 2047.0, 461.0, 205.0, 98.0, 61.0, 41.0, 28.0, 22.0, 13.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.0955810546875, -4.933349609375, -4.7711181640625, -4.60888671875, -4.4466552734375, -4.284423828125, -4.1221923828125, -3.9599609375, -3.7977294921875, -3.635498046875, -3.4732666015625, -3.31103515625, -3.1488037109375, -2.986572265625, -2.8243408203125, -2.662109375, -2.4998779296875, -2.337646484375, -2.1754150390625, -2.01318359375, -1.8509521484375, -1.688720703125, -1.5264892578125, -1.3642578125, -1.2020263671875, -1.039794921875, -0.8775634765625, -0.71533203125, -0.5531005859375, -0.390869140625, -0.2286376953125, -0.06640625, 0.0958251953125, 0.258056640625, 0.4202880859375, 0.58251953125, 0.7447509765625, 0.906982421875, 1.0692138671875, 1.2314453125, 1.3936767578125, 1.555908203125, 1.7181396484375, 1.88037109375, 2.0426025390625, 2.204833984375, 2.3670654296875, 2.529296875, 2.6915283203125, 2.853759765625, 3.0159912109375, 3.17822265625, 3.3404541015625, 3.502685546875, 3.6649169921875, 3.8271484375, 3.9893798828125, 4.151611328125, 4.3138427734375, 4.47607421875, 4.6383056640625, 4.800537109375, 4.9627685546875, 5.125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 11.0, 28.0, 51.0, 64.0, 129.0, 172.0, 136.0, 158.0, 103.0, 76.0, 38.0, 16.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.29506492614746, -27.174474716186523, -26.053884506225586, -24.93329429626465, -23.81270408630371, -22.692113876342773, -21.571523666381836, -20.4509334564209, -19.33034324645996, -18.209753036499023, -17.089162826538086, -15.968572616577148, -14.847982406616211, -13.727392196655273, -12.606801986694336, -11.486211776733398, -10.365621566772461, -9.245031356811523, -8.124441146850586, -7.003850936889648, -5.883260726928711, -4.762670516967773, -3.642080307006836, -2.5214900970458984, -1.400899887084961, -0.28030967712402344, 0.8402805328369141, 1.9608707427978516, 3.081460952758789, 4.202051162719727, 5.322641372680664, 6.443231582641602, 7.563819885253906, 8.684410095214844, 9.805000305175781, 10.925590515136719, 12.046180725097656, 13.166770935058594, 14.287361145019531, 15.407951354980469, 16.528541564941406, 17.649131774902344, 18.76972198486328, 19.89031219482422, 21.010902404785156, 22.131492614746094, 23.25208282470703, 24.37267303466797, 25.493263244628906, 26.613853454589844, 27.73444366455078, 28.85503387451172, 29.975624084472656, 31.096214294433594, 32.21680450439453, 33.33739471435547, 34.457984924316406, 35.578575134277344, 36.69916534423828, 37.81975555419922, 38.940345764160156, 40.060935974121094, 41.18152618408203, 42.30211639404297, 43.422706604003906]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 10.0, 2.0, 15.0, 8.0, 18.0, 17.0, 18.0, 15.0, 34.0, 28.0, 30.0, 33.0, 36.0, 30.0, 42.0, 36.0, 42.0, 43.0, 49.0, 41.0, 40.0, 34.0, 43.0, 39.0, 29.0, 23.0, 30.0, 31.0, 27.0, 22.0, 20.0, 24.0, 13.0, 8.0, 12.0, 11.0, 8.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.274073600769043, -11.870687484741211, -11.467302322387695, -11.063916206359863, -10.660530090332031, -10.257144927978516, -9.853758811950684, -9.450372695922852, -9.046987533569336, -8.643601417541504, -8.240216255187988, -7.836830139160156, -7.433444023132324, -7.03005838394165, -6.626672744750977, -6.2232866287231445, -5.8199005126953125, -5.416514873504639, -5.013128757476807, -4.609743118286133, -4.206357002258301, -3.802971363067627, -3.399585723876953, -2.9961998462677, -2.5928139686584473, -2.1894280910491943, -1.786042332649231, -1.3826565742492676, -0.9792706966400146, -0.5758848190307617, -0.1724991798400879, 0.23088669776916504, 0.6342735290527344, 1.0376594066619873, 1.4410451650619507, 1.844430923461914, 2.247816801071167, 2.65120267868042, 3.0545883178710938, 3.4579741954803467, 3.8613600730895996, 4.264745712280273, 4.6681318283081055, 5.071517467498779, 5.474903106689453, 5.878289222717285, 6.281674861907959, 6.685060501098633, 7.088446617126465, 7.491832256317139, 7.895218372344971, 8.298604011535645, 8.701990127563477, 9.105375289916992, 9.508761405944824, 9.912147521972656, 10.315532684326172, 10.718918800354004, 11.12230396270752, 11.525690078735352, 11.929076194763184, 12.332462310791016, 12.735847473144531, 13.139233589172363, 13.542619705200195]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 11.0, 26.0, 40.0, 48.0, 54.0, 133.0, 217.0, 377.0, 665.0, 1067.0, 1915.0, 3573.0, 6816.0, 12871.0, 25314.0, 49623.0, 96668.0, 213472.0, 328421.0, 152977.0, 74320.0, 38180.0, 19714.0, 10081.0, 5340.0, 2896.0, 1564.0, 914.0, 464.0, 320.0, 160.0, 105.0, 70.0, 37.0, 18.0, 15.0, 17.0, 8.0, 3.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.53125, -5.37890625, -5.2265625, -5.07421875, -4.921875, -4.76953125, -4.6171875, -4.46484375, -4.3125, -4.16015625, -4.0078125, -3.85546875, -3.703125, -3.55078125, -3.3984375, -3.24609375, -3.09375, -2.94140625, -2.7890625, -2.63671875, -2.484375, -2.33203125, -2.1796875, -2.02734375, -1.875, -1.72265625, -1.5703125, -1.41796875, -1.265625, -1.11328125, -0.9609375, -0.80859375, -0.65625, -0.50390625, -0.3515625, -0.19921875, -0.046875, 0.10546875, 0.2578125, 0.41015625, 0.5625, 0.71484375, 0.8671875, 1.01953125, 1.171875, 1.32421875, 1.4765625, 1.62890625, 1.78125, 1.93359375, 2.0859375, 2.23828125, 2.390625, 2.54296875, 2.6953125, 2.84765625, 3.0, 3.15234375, 3.3046875, 3.45703125, 3.609375, 3.76171875, 3.9140625, 4.06640625, 4.21875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 4.0, 9.0, 17.0, 15.0, 25.0, 16.0, 27.0, 25.0, 43.0, 30.0, 35.0, 52.0, 52.0, 53.0, 54.0, 49.0, 44.0, 35.0, 31.0, 51.0, 47.0, 33.0, 37.0, 38.0, 35.0, 19.0, 19.0, 16.0, 15.0, 14.0, 13.0, 8.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.52923583984375, -1.4725341796875, -1.41583251953125, -1.359130859375, -1.30242919921875, -1.2457275390625, -1.18902587890625, -1.13232421875, -1.07562255859375, -1.0189208984375, -0.96221923828125, -0.905517578125, -0.84881591796875, -0.7921142578125, -0.73541259765625, -0.6787109375, -0.62200927734375, -0.5653076171875, -0.50860595703125, -0.451904296875, -0.39520263671875, -0.3385009765625, -0.28179931640625, -0.22509765625, -0.16839599609375, -0.1116943359375, -0.05499267578125, 0.001708984375, 0.05841064453125, 0.1151123046875, 0.17181396484375, 0.228515625, 0.28521728515625, 0.3419189453125, 0.39862060546875, 0.455322265625, 0.51202392578125, 0.5687255859375, 0.62542724609375, 0.68212890625, 0.73883056640625, 0.7955322265625, 0.85223388671875, 0.908935546875, 0.96563720703125, 1.0223388671875, 1.07904052734375, 1.1357421875, 1.19244384765625, 1.2491455078125, 1.30584716796875, 1.362548828125, 1.41925048828125, 1.4759521484375, 1.53265380859375, 1.58935546875, 1.64605712890625, 1.7027587890625, 1.75946044921875, 1.816162109375, 1.87286376953125, 1.9295654296875, 1.98626708984375, 2.04296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 6.0, 8.0, 8.0, 19.0, 20.0, 33.0, 40.0, 64.0, 74.0, 107.0, 178.0, 221.0, 369.0, 572.0, 1003.0, 2389.0, 7230.0, 30316.0, 151231.0, 658565.0, 152778.0, 30916.0, 7228.0, 2338.0, 1048.0, 586.0, 349.0, 237.0, 177.0, 145.0, 77.0, 61.0, 45.0, 21.0, 21.0, 14.0, 16.0, 5.0, 11.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-11.84375, -11.50048828125, -11.1572265625, -10.81396484375, -10.470703125, -10.12744140625, -9.7841796875, -9.44091796875, -9.09765625, -8.75439453125, -8.4111328125, -8.06787109375, -7.724609375, -7.38134765625, -7.0380859375, -6.69482421875, -6.3515625, -6.00830078125, -5.6650390625, -5.32177734375, -4.978515625, -4.63525390625, -4.2919921875, -3.94873046875, -3.60546875, -3.26220703125, -2.9189453125, -2.57568359375, -2.232421875, -1.88916015625, -1.5458984375, -1.20263671875, -0.859375, -0.51611328125, -0.1728515625, 0.17041015625, 0.513671875, 0.85693359375, 1.2001953125, 1.54345703125, 1.88671875, 2.22998046875, 2.5732421875, 2.91650390625, 3.259765625, 3.60302734375, 3.9462890625, 4.28955078125, 4.6328125, 4.97607421875, 5.3193359375, 5.66259765625, 6.005859375, 6.34912109375, 6.6923828125, 7.03564453125, 7.37890625, 7.72216796875, 8.0654296875, 8.40869140625, 8.751953125, 9.09521484375, 9.4384765625, 9.78173828125, 10.125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 15.0, 26.0, 19.0, 21.0, 31.0, 42.0, 47.0, 50.0, 48.0, 44.0, 65.0, 57.0, 55.0, 45.0, 42.0, 42.0, 46.0, 52.0, 31.0, 25.0, 25.0, 25.0, 20.0, 12.0, 15.0, 3.0, 9.0, 11.0, 6.0, 4.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.1953125, -10.88427734375, -10.5732421875, -10.26220703125, -9.951171875, -9.64013671875, -9.3291015625, -9.01806640625, -8.70703125, -8.39599609375, -8.0849609375, -7.77392578125, -7.462890625, -7.15185546875, -6.8408203125, -6.52978515625, -6.21875, -5.90771484375, -5.5966796875, -5.28564453125, -4.974609375, -4.66357421875, -4.3525390625, -4.04150390625, -3.73046875, -3.41943359375, -3.1083984375, -2.79736328125, -2.486328125, -2.17529296875, -1.8642578125, -1.55322265625, -1.2421875, -0.93115234375, -0.6201171875, -0.30908203125, 0.001953125, 0.31298828125, 0.6240234375, 0.93505859375, 1.24609375, 1.55712890625, 1.8681640625, 2.17919921875, 2.490234375, 2.80126953125, 3.1123046875, 3.42333984375, 3.734375, 4.04541015625, 4.3564453125, 4.66748046875, 4.978515625, 5.28955078125, 5.6005859375, 5.91162109375, 6.22265625, 6.53369140625, 6.8447265625, 7.15576171875, 7.466796875, 7.77783203125, 8.0888671875, 8.39990234375, 8.7109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 16.0, 31.0, 56.0, 105.0, 222.0, 779.0, 4421.0, 79710.0, 897050.0, 61231.0, 3799.0, 717.0, 211.0, 73.0, 30.0, 28.0, 18.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3984375, -13.9407958984375, -13.483154296875, -13.0255126953125, -12.56787109375, -12.1102294921875, -11.652587890625, -11.1949462890625, -10.7373046875, -10.2796630859375, -9.822021484375, -9.3643798828125, -8.90673828125, -8.4490966796875, -7.991455078125, -7.5338134765625, -7.076171875, -6.6185302734375, -6.160888671875, -5.7032470703125, -5.24560546875, -4.7879638671875, -4.330322265625, -3.8726806640625, -3.4150390625, -2.9573974609375, -2.499755859375, -2.0421142578125, -1.58447265625, -1.1268310546875, -0.669189453125, -0.2115478515625, 0.24609375, 0.7037353515625, 1.161376953125, 1.6190185546875, 2.07666015625, 2.5343017578125, 2.991943359375, 3.4495849609375, 3.9072265625, 4.3648681640625, 4.822509765625, 5.2801513671875, 5.73779296875, 6.1954345703125, 6.653076171875, 7.1107177734375, 7.568359375, 8.0260009765625, 8.483642578125, 8.9412841796875, 9.39892578125, 9.8565673828125, 10.314208984375, 10.7718505859375, 11.2294921875, 11.6871337890625, 12.144775390625, 12.6024169921875, 13.06005859375, 13.5177001953125, 13.975341796875, 14.4329833984375, 14.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 9.0, 13.0, 15.0, 22.0, 37.0, 42.0, 67.0, 108.0, 285.0, 148.0, 77.0, 55.0, 47.0, 26.0, 19.0, 15.0, 9.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011196136474609375, -0.001062542200088501, -0.0010054707527160645, -0.0009483993053436279, -0.0008913278579711914, -0.0008342564105987549, -0.0007771849632263184, -0.0007201135158538818, -0.0006630420684814453, -0.0006059706211090088, -0.0005488991737365723, -0.0004918277263641357, -0.0004347562789916992, -0.0003776848316192627, -0.00032061338424682617, -0.00026354193687438965, -0.00020647048950195312, -0.0001493990421295166, -9.232759475708008e-05, -3.5256147384643555e-05, 2.181529998779297e-05, 7.888674736022949e-05, 0.00013595819473266602, 0.00019302964210510254, 0.00025010108947753906, 0.0003071725368499756, 0.0003642439842224121, 0.00042131543159484863, 0.00047838687896728516, 0.0005354583263397217, 0.0005925297737121582, 0.0006496012210845947, 0.0007066726684570312, 0.0007637441158294678, 0.0008208155632019043, 0.0008778870105743408, 0.0009349584579467773, 0.0009920299053192139, 0.0010491013526916504, 0.001106172800064087, 0.0011632442474365234, 0.00122031569480896, 0.0012773871421813965, 0.001334458589553833, 0.0013915300369262695, 0.001448601484298706, 0.0015056729316711426, 0.001562744379043579, 0.0016198158264160156, 0.0016768872737884521, 0.0017339587211608887, 0.0017910301685333252, 0.0018481016159057617, 0.0019051730632781982, 0.0019622445106506348, 0.0020193159580230713, 0.002076387405395508, 0.0021334588527679443, 0.002190530300140381, 0.0022476017475128174, 0.002304673194885254, 0.0023617446422576904, 0.002418816089630127, 0.0024758875370025635, 0.002532958984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 11.0, 26.0, 49.0, 153.0, 330.0, 1118.0, 10560.0, 890898.0, 141189.0, 3137.0, 651.0, 204.0, 110.0, 60.0, 19.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.4619140625, -22.767578125, -22.0732421875, -21.37890625, -20.6845703125, -19.990234375, -19.2958984375, -18.6015625, -17.9072265625, -17.212890625, -16.5185546875, -15.82421875, -15.1298828125, -14.435546875, -13.7412109375, -13.046875, -12.3525390625, -11.658203125, -10.9638671875, -10.26953125, -9.5751953125, -8.880859375, -8.1865234375, -7.4921875, -6.7978515625, -6.103515625, -5.4091796875, -4.71484375, -4.0205078125, -3.326171875, -2.6318359375, -1.9375, -1.2431640625, -0.548828125, 0.1455078125, 0.83984375, 1.5341796875, 2.228515625, 2.9228515625, 3.6171875, 4.3115234375, 5.005859375, 5.7001953125, 6.39453125, 7.0888671875, 7.783203125, 8.4775390625, 9.171875, 9.8662109375, 10.560546875, 11.2548828125, 11.94921875, 12.6435546875, 13.337890625, 14.0322265625, 14.7265625, 15.4208984375, 16.115234375, 16.8095703125, 17.50390625, 18.1982421875, 18.892578125, 19.5869140625, 20.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 10.0, 11.0, 9.0, 12.0, 11.0, 16.0, 29.0, 35.0, 47.0, 67.0, 122.0, 169.0, 117.0, 90.0, 66.0, 54.0, 39.0, 26.0, 19.0, 10.0, 11.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01953125, -4.80035400390625, -4.5811767578125, -4.36199951171875, -4.142822265625, -3.92364501953125, -3.7044677734375, -3.48529052734375, -3.26611328125, -3.04693603515625, -2.8277587890625, -2.60858154296875, -2.389404296875, -2.17022705078125, -1.9510498046875, -1.73187255859375, -1.5126953125, -1.29351806640625, -1.0743408203125, -0.85516357421875, -0.635986328125, -0.41680908203125, -0.1976318359375, 0.02154541015625, 0.24072265625, 0.45989990234375, 0.6790771484375, 0.89825439453125, 1.117431640625, 1.33660888671875, 1.5557861328125, 1.77496337890625, 1.994140625, 2.21331787109375, 2.4324951171875, 2.65167236328125, 2.870849609375, 3.09002685546875, 3.3092041015625, 3.52838134765625, 3.74755859375, 3.96673583984375, 4.1859130859375, 4.40509033203125, 4.624267578125, 4.84344482421875, 5.0626220703125, 5.28179931640625, 5.5009765625, 5.72015380859375, 5.9393310546875, 6.15850830078125, 6.377685546875, 6.59686279296875, 6.8160400390625, 7.03521728515625, 7.25439453125, 7.47357177734375, 7.6927490234375, 7.91192626953125, 8.131103515625, 8.35028076171875, 8.5694580078125, 8.78863525390625, 9.0078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 20.0, 48.0, 79.0, 134.0, 152.0, 179.0, 163.0, 89.0, 61.0, 27.0, 20.0, 11.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.14193725585938, -78.0390853881836, -74.93622589111328, -71.8333740234375, -68.73051452636719, -65.6276626586914, -62.524810791015625, -59.42195510864258, -56.31909942626953, -53.216243743896484, -50.11338806152344, -47.010536193847656, -43.90768051147461, -40.80482482910156, -37.70197296142578, -34.599117279052734, -31.496261596679688, -28.39340591430664, -25.290552139282227, -22.187698364257812, -19.084842681884766, -15.981987953186035, -12.879133224487305, -9.77627944946289, -6.673423767089844, -3.5705690383911133, -0.4677143096923828, 2.6351404190063477, 5.737995147705078, 8.840849876403809, 11.943704605102539, 15.046558380126953, 18.14942169189453, 21.252277374267578, 24.355131149291992, 27.457984924316406, 30.560840606689453, 33.6636962890625, 36.76654815673828, 39.86940383911133, 42.972259521484375, 46.07511520385742, 49.17797088623047, 52.28082275390625, 55.3836784362793, 58.486534118652344, 61.589385986328125, 64.69224548339844, 67.79509735107422, 70.89794921875, 74.00080871582031, 77.1036605834961, 80.20651245117188, 83.30937194824219, 86.41222381591797, 89.51507568359375, 92.61793518066406, 95.72078704833984, 98.82364654541016, 101.92649841308594, 105.02935791015625, 108.13220977783203, 111.23506164550781, 114.33792114257812, 117.4407730102539]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 4.0, 10.0, 9.0, 9.0, 11.0, 13.0, 15.0, 22.0, 19.0, 21.0, 25.0, 22.0, 37.0, 35.0, 39.0, 35.0, 39.0, 47.0, 39.0, 44.0, 44.0, 37.0, 41.0, 48.0, 43.0, 35.0, 30.0, 30.0, 20.0, 18.0, 23.0, 25.0, 17.0, 16.0, 14.0, 11.0, 14.0, 7.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.88931655883789, -39.408870697021484, -37.92842483520508, -36.44797897338867, -34.967529296875, -33.487083435058594, -32.00663757324219, -30.52619171142578, -29.045745849609375, -27.56529998779297, -26.084854125976562, -24.604406356811523, -23.123960494995117, -21.64351463317871, -20.163066864013672, -18.682621002197266, -17.20217514038086, -15.721729278564453, -14.24128246307373, -12.760835647583008, -11.280389785766602, -9.799943923950195, -8.319497108459473, -6.83905029296875, -5.358604431152344, -3.8781580924987793, -2.397711753845215, -0.9172654151916504, 0.5631809234619141, 2.0436272621154785, 3.524073600769043, 5.004520416259766, 6.4849700927734375, 7.965416431427002, 9.445862770080566, 10.926309585571289, 12.406755447387695, 13.887201309204102, 15.367648124694824, 16.848094940185547, 18.328540802001953, 19.80898666381836, 21.289432525634766, 22.769880294799805, 24.25032615661621, 25.730772018432617, 27.211219787597656, 28.691665649414062, 30.17211151123047, 31.652557373046875, 33.13300323486328, 34.61344909667969, 36.093894958496094, 37.574344635009766, 39.05479049682617, 40.53523635864258, 42.015682220458984, 43.49612808227539, 44.9765739440918, 46.4570198059082, 47.937469482421875, 49.41791534423828, 50.89836120605469, 52.378807067871094, 53.8592529296875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 8.0, 6.0, 8.0, 15.0, 13.0, 16.0, 20.0, 23.0, 43.0, 53.0, 59.0, 109.0, 142.0, 206.0, 301.0, 451.0, 661.0, 1271.0, 2105.0, 4160.0, 8457.0, 19002.0, 48402.0, 164186.0, 2439652.0, 1284121.0, 142724.0, 43689.0, 17250.0, 7802.0, 3969.0, 2026.0, 1139.0, 765.0, 418.0, 261.0, 186.0, 134.0, 101.0, 77.0, 54.0, 45.0, 30.0, 26.0, 27.0, 8.0, 20.0, 12.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-7.328125, -7.0987548828125, -6.869384765625, -6.6400146484375, -6.41064453125, -6.1812744140625, -5.951904296875, -5.7225341796875, -5.4931640625, -5.2637939453125, -5.034423828125, -4.8050537109375, -4.57568359375, -4.3463134765625, -4.116943359375, -3.8875732421875, -3.658203125, -3.4288330078125, -3.199462890625, -2.9700927734375, -2.74072265625, -2.5113525390625, -2.281982421875, -2.0526123046875, -1.8232421875, -1.5938720703125, -1.364501953125, -1.1351318359375, -0.90576171875, -0.6763916015625, -0.447021484375, -0.2176513671875, 0.01171875, 0.2410888671875, 0.470458984375, 0.6998291015625, 0.92919921875, 1.1585693359375, 1.387939453125, 1.6173095703125, 1.8466796875, 2.0760498046875, 2.305419921875, 2.5347900390625, 2.76416015625, 2.9935302734375, 3.222900390625, 3.4522705078125, 3.681640625, 3.9110107421875, 4.140380859375, 4.3697509765625, 4.59912109375, 4.8284912109375, 5.057861328125, 5.2872314453125, 5.5166015625, 5.7459716796875, 5.975341796875, 6.2047119140625, 6.43408203125, 6.6634521484375, 6.892822265625, 7.1221923828125, 7.3515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 5.0, 11.0, 11.0, 13.0, 16.0, 8.0, 12.0, 24.0, 36.0, 33.0, 28.0, 33.0, 33.0, 46.0, 41.0, 49.0, 46.0, 50.0, 34.0, 41.0, 35.0, 48.0, 44.0, 33.0, 30.0, 31.0, 32.0, 23.0, 25.0, 17.0, 21.0, 16.0, 12.0, 12.0, 5.0, 8.0, 5.0, 7.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541015625, -1.484344482421875, -1.42767333984375, -1.371002197265625, -1.3143310546875, -1.257659912109375, -1.20098876953125, -1.144317626953125, -1.087646484375, -1.030975341796875, -0.97430419921875, -0.917633056640625, -0.8609619140625, -0.804290771484375, -0.74761962890625, -0.690948486328125, -0.63427734375, -0.577606201171875, -0.52093505859375, -0.464263916015625, -0.4075927734375, -0.350921630859375, -0.29425048828125, -0.237579345703125, -0.180908203125, -0.124237060546875, -0.06756591796875, -0.010894775390625, 0.0457763671875, 0.102447509765625, 0.15911865234375, 0.215789794921875, 0.2724609375, 0.329132080078125, 0.38580322265625, 0.442474365234375, 0.4991455078125, 0.555816650390625, 0.61248779296875, 0.669158935546875, 0.725830078125, 0.782501220703125, 0.83917236328125, 0.895843505859375, 0.9525146484375, 1.009185791015625, 1.06585693359375, 1.122528076171875, 1.17919921875, 1.235870361328125, 1.29254150390625, 1.349212646484375, 1.4058837890625, 1.462554931640625, 1.51922607421875, 1.575897216796875, 1.632568359375, 1.689239501953125, 1.74591064453125, 1.802581787109375, 1.8592529296875, 1.915924072265625, 1.97259521484375, 2.029266357421875, 2.0859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 9.0, 8.0, 15.0, 23.0, 26.0, 48.0, 63.0, 97.0, 147.0, 264.0, 373.0, 622.0, 933.0, 1820.0, 3275.0, 6764.0, 15870.0, 50205.0, 236782.0, 3061244.0, 672004.0, 97217.0, 26510.0, 9809.0, 4423.0, 2289.0, 1309.0, 757.0, 456.0, 296.0, 206.0, 128.0, 86.0, 58.0, 42.0, 25.0, 24.0, 18.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1015625, -11.753173828125, -11.40478515625, -11.056396484375, -10.7080078125, -10.359619140625, -10.01123046875, -9.662841796875, -9.314453125, -8.966064453125, -8.61767578125, -8.269287109375, -7.9208984375, -7.572509765625, -7.22412109375, -6.875732421875, -6.52734375, -6.178955078125, -5.83056640625, -5.482177734375, -5.1337890625, -4.785400390625, -4.43701171875, -4.088623046875, -3.740234375, -3.391845703125, -3.04345703125, -2.695068359375, -2.3466796875, -1.998291015625, -1.64990234375, -1.301513671875, -0.953125, -0.604736328125, -0.25634765625, 0.092041015625, 0.4404296875, 0.788818359375, 1.13720703125, 1.485595703125, 1.833984375, 2.182373046875, 2.53076171875, 2.879150390625, 3.2275390625, 3.575927734375, 3.92431640625, 4.272705078125, 4.62109375, 4.969482421875, 5.31787109375, 5.666259765625, 6.0146484375, 6.363037109375, 6.71142578125, 7.059814453125, 7.408203125, 7.756591796875, 8.10498046875, 8.453369140625, 8.8017578125, 9.150146484375, 9.49853515625, 9.846923828125, 10.1953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 4.0, 5.0, 8.0, 10.0, 17.0, 20.0, 23.0, 48.0, 68.0, 75.0, 149.0, 192.0, 346.0, 834.0, 1170.0, 416.0, 213.0, 138.0, 94.0, 56.0, 50.0, 29.0, 17.0, 23.0, 15.0, 10.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-5.55078125, -5.39251708984375, -5.2342529296875, -5.07598876953125, -4.917724609375, -4.75946044921875, -4.6011962890625, -4.44293212890625, -4.28466796875, -4.12640380859375, -3.9681396484375, -3.80987548828125, -3.651611328125, -3.49334716796875, -3.3350830078125, -3.17681884765625, -3.0185546875, -2.86029052734375, -2.7020263671875, -2.54376220703125, -2.385498046875, -2.22723388671875, -2.0689697265625, -1.91070556640625, -1.75244140625, -1.59417724609375, -1.4359130859375, -1.27764892578125, -1.119384765625, -0.96112060546875, -0.8028564453125, -0.64459228515625, -0.486328125, -0.32806396484375, -0.1697998046875, -0.01153564453125, 0.146728515625, 0.30499267578125, 0.4632568359375, 0.62152099609375, 0.77978515625, 0.93804931640625, 1.0963134765625, 1.25457763671875, 1.412841796875, 1.57110595703125, 1.7293701171875, 1.88763427734375, 2.0458984375, 2.20416259765625, 2.3624267578125, 2.52069091796875, 2.678955078125, 2.83721923828125, 2.9954833984375, 3.15374755859375, 3.31201171875, 3.47027587890625, 3.6285400390625, 3.78680419921875, 3.945068359375, 4.10333251953125, 4.2615966796875, 4.41986083984375, 4.578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 22.0, 43.0, 41.0, 85.0, 97.0, 128.0, 139.0, 112.0, 115.0, 78.0, 40.0, 41.0, 21.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.89153289794922, -29.588531494140625, -28.2855281829834, -26.982526779174805, -25.67952537536621, -24.376522064208984, -23.07352066040039, -21.770519256591797, -20.467517852783203, -19.16451644897461, -17.861513137817383, -16.55851173400879, -15.255510330200195, -13.952507972717285, -12.649505615234375, -11.346504211425781, -10.043500900268555, -8.740498542785645, -7.437497138977051, -6.134494781494141, -4.831492900848389, -3.5284910202026367, -2.2254886627197266, -0.9224872589111328, 0.38051509857177734, 1.6835170984268188, 2.9865190982818604, 4.289521217346191, 5.592523097991943, 6.895524978637695, 8.198527336120605, 9.5015287399292, 10.80453109741211, 12.10753345489502, 13.410534858703613, 14.713537216186523, 16.016538619995117, 17.319541931152344, 18.622543334960938, 19.92554473876953, 21.228546142578125, 22.53154754638672, 23.834550857543945, 25.13755226135254, 26.440553665161133, 27.74355697631836, 29.046558380126953, 30.349559783935547, 31.652563095092773, 32.95556640625, 34.258567810058594, 35.56156921386719, 36.86457061767578, 38.167572021484375, 39.47057342529297, 40.77357482910156, 42.07658004760742, 43.379581451416016, 44.68258285522461, 45.98558807373047, 47.28858947753906, 48.591590881347656, 49.89459228515625, 51.197593688964844, 52.50059509277344]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 5.0, 8.0, 9.0, 14.0, 8.0, 17.0, 26.0, 21.0, 21.0, 31.0, 28.0, 30.0, 30.0, 33.0, 34.0, 41.0, 49.0, 54.0, 46.0, 34.0, 34.0, 48.0, 32.0, 33.0, 24.0, 31.0, 24.0, 30.0, 25.0, 21.0, 19.0, 12.0, 19.0, 14.0, 12.0, 15.0, 12.0, 13.0, 4.0, 6.0, 10.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.8762845993042, -15.333589553833008, -14.7908935546875, -14.248198509216309, -13.705503463745117, -13.16280746459961, -12.620112419128418, -12.077417373657227, -11.534721374511719, -10.992026329040527, -10.44933032989502, -9.906635284423828, -9.36393928527832, -8.821244239807129, -8.278549194335938, -7.735853672027588, -7.193158149719238, -6.650462627410889, -6.107767105102539, -5.565072059631348, -5.022376537322998, -4.479681015014648, -3.936985731124878, -3.3942904472351074, -2.851594924926758, -2.308899402618408, -1.7662041187286377, -1.2235087156295776, -0.6808133125305176, -0.13811779022216797, 0.40457749366760254, 0.947272777557373, 1.4899673461914062, 2.032662868499756, 2.5753581523895264, 3.118053436279297, 3.6607489585876465, 4.203444480895996, 4.7461395263671875, 5.288835048675537, 5.831530570983887, 6.374226093292236, 6.916921615600586, 7.459616661071777, 8.002311706542969, 8.545007705688477, 9.087702751159668, 9.63039779663086, 10.173093795776367, 10.715788841247559, 11.258484840393066, 11.801179885864258, 12.343875885009766, 12.886570930480957, 13.429265975952148, 13.971961975097656, 14.514657020568848, 15.057352066040039, 15.600048065185547, 16.142744064331055, 16.68543815612793, 17.228134155273438, 17.770830154418945, 18.31352424621582, 18.856220245361328]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 13.0, 14.0, 13.0, 20.0, 29.0, 38.0, 69.0, 89.0, 122.0, 210.0, 292.0, 521.0, 858.0, 1649.0, 3229.0, 6813.0, 16000.0, 39163.0, 98695.0, 237288.0, 336155.0, 181982.0, 72942.0, 29255.0, 12013.0, 5241.0, 2544.0, 1304.0, 776.0, 403.0, 257.0, 166.0, 97.0, 95.0, 45.0, 37.0, 33.0, 22.0, 13.0, 14.0, 13.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.109375, -6.8961181640625, -6.682861328125, -6.4696044921875, -6.25634765625, -6.0430908203125, -5.829833984375, -5.6165771484375, -5.4033203125, -5.1900634765625, -4.976806640625, -4.7635498046875, -4.55029296875, -4.3370361328125, -4.123779296875, -3.9105224609375, -3.697265625, -3.4840087890625, -3.270751953125, -3.0574951171875, -2.84423828125, -2.6309814453125, -2.417724609375, -2.2044677734375, -1.9912109375, -1.7779541015625, -1.564697265625, -1.3514404296875, -1.13818359375, -0.9249267578125, -0.711669921875, -0.4984130859375, -0.28515625, -0.0718994140625, 0.141357421875, 0.3546142578125, 0.56787109375, 0.7811279296875, 0.994384765625, 1.2076416015625, 1.4208984375, 1.6341552734375, 1.847412109375, 2.0606689453125, 2.27392578125, 2.4871826171875, 2.700439453125, 2.9136962890625, 3.126953125, 3.3402099609375, 3.553466796875, 3.7667236328125, 3.97998046875, 4.1932373046875, 4.406494140625, 4.6197509765625, 4.8330078125, 5.0462646484375, 5.259521484375, 5.4727783203125, 5.68603515625, 5.8992919921875, 6.112548828125, 6.3258056640625, 6.5390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 6.0, 8.0, 7.0, 4.0, 16.0, 13.0, 20.0, 17.0, 28.0, 27.0, 34.0, 30.0, 29.0, 42.0, 47.0, 46.0, 34.0, 42.0, 51.0, 42.0, 49.0, 40.0, 41.0, 45.0, 33.0, 28.0, 32.0, 21.0, 28.0, 20.0, 15.0, 10.0, 15.0, 17.0, 6.0, 13.0, 5.0, 11.0, 13.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.646026611328125, -1.58502197265625, -1.524017333984375, -1.4630126953125, -1.402008056640625, -1.34100341796875, -1.279998779296875, -1.218994140625, -1.157989501953125, -1.09698486328125, -1.035980224609375, -0.9749755859375, -0.913970947265625, -0.85296630859375, -0.791961669921875, -0.73095703125, -0.669952392578125, -0.60894775390625, -0.547943115234375, -0.4869384765625, -0.425933837890625, -0.36492919921875, -0.303924560546875, -0.242919921875, -0.181915283203125, -0.12091064453125, -0.059906005859375, 0.0010986328125, 0.062103271484375, 0.12310791015625, 0.184112548828125, 0.2451171875, 0.306121826171875, 0.36712646484375, 0.428131103515625, 0.4891357421875, 0.550140380859375, 0.61114501953125, 0.672149658203125, 0.733154296875, 0.794158935546875, 0.85516357421875, 0.916168212890625, 0.9771728515625, 1.038177490234375, 1.09918212890625, 1.160186767578125, 1.22119140625, 1.282196044921875, 1.34320068359375, 1.404205322265625, 1.4652099609375, 1.526214599609375, 1.58721923828125, 1.648223876953125, 1.709228515625, 1.770233154296875, 1.83123779296875, 1.892242431640625, 1.9532470703125, 2.014251708984375, 2.07525634765625, 2.136260986328125, 2.197265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 11.0, 28.0, 26.0, 35.0, 47.0, 71.0, 82.0, 141.0, 262.0, 389.0, 671.0, 1160.0, 2588.0, 8387.0, 39521.0, 259989.0, 588270.0, 117849.0, 19801.0, 4972.0, 1870.0, 929.0, 490.0, 315.0, 203.0, 142.0, 94.0, 49.0, 35.0, 29.0, 15.0, 15.0, 7.0, 8.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-13.1484375, -12.7535400390625, -12.358642578125, -11.9637451171875, -11.56884765625, -11.1739501953125, -10.779052734375, -10.3841552734375, -9.9892578125, -9.5943603515625, -9.199462890625, -8.8045654296875, -8.40966796875, -8.0147705078125, -7.619873046875, -7.2249755859375, -6.830078125, -6.4351806640625, -6.040283203125, -5.6453857421875, -5.25048828125, -4.8555908203125, -4.460693359375, -4.0657958984375, -3.6708984375, -3.2760009765625, -2.881103515625, -2.4862060546875, -2.09130859375, -1.6964111328125, -1.301513671875, -0.9066162109375, -0.51171875, -0.1168212890625, 0.278076171875, 0.6729736328125, 1.06787109375, 1.4627685546875, 1.857666015625, 2.2525634765625, 2.6474609375, 3.0423583984375, 3.437255859375, 3.8321533203125, 4.22705078125, 4.6219482421875, 5.016845703125, 5.4117431640625, 5.806640625, 6.2015380859375, 6.596435546875, 6.9913330078125, 7.38623046875, 7.7811279296875, 8.176025390625, 8.5709228515625, 8.9658203125, 9.3607177734375, 9.755615234375, 10.1505126953125, 10.54541015625, 10.9403076171875, 11.335205078125, 11.7301025390625, 12.125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 14.0, 7.0, 16.0, 12.0, 22.0, 20.0, 36.0, 26.0, 37.0, 36.0, 47.0, 50.0, 59.0, 64.0, 49.0, 43.0, 45.0, 42.0, 44.0, 44.0, 46.0, 32.0, 28.0, 23.0, 21.0, 18.0, 17.0, 17.0, 12.0, 14.0, 9.0, 8.0, 7.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.5546875, -12.1851806640625, -11.815673828125, -11.4461669921875, -11.07666015625, -10.7071533203125, -10.337646484375, -9.9681396484375, -9.5986328125, -9.2291259765625, -8.859619140625, -8.4901123046875, -8.12060546875, -7.7510986328125, -7.381591796875, -7.0120849609375, -6.642578125, -6.2730712890625, -5.903564453125, -5.5340576171875, -5.16455078125, -4.7950439453125, -4.425537109375, -4.0560302734375, -3.6865234375, -3.3170166015625, -2.947509765625, -2.5780029296875, -2.20849609375, -1.8389892578125, -1.469482421875, -1.0999755859375, -0.73046875, -0.3609619140625, 0.008544921875, 0.3780517578125, 0.74755859375, 1.1170654296875, 1.486572265625, 1.8560791015625, 2.2255859375, 2.5950927734375, 2.964599609375, 3.3341064453125, 3.70361328125, 4.0731201171875, 4.442626953125, 4.8121337890625, 5.181640625, 5.5511474609375, 5.920654296875, 6.2901611328125, 6.65966796875, 7.0291748046875, 7.398681640625, 7.7681884765625, 8.1376953125, 8.5072021484375, 8.876708984375, 9.2462158203125, 9.61572265625, 9.9852294921875, 10.354736328125, 10.7242431640625, 11.09375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 6.0, 12.0, 27.0, 47.0, 68.0, 115.0, 214.0, 435.0, 963.0, 2623.0, 9480.0, 46501.0, 303743.0, 555674.0, 103397.0, 18148.0, 4390.0, 1495.0, 600.0, 288.0, 132.0, 59.0, 47.0, 35.0, 14.0, 10.0, 8.0, 10.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.03790283203125, -5.7984619140625, -5.55902099609375, -5.319580078125, -5.08013916015625, -4.8406982421875, -4.60125732421875, -4.36181640625, -4.12237548828125, -3.8829345703125, -3.64349365234375, -3.404052734375, -3.16461181640625, -2.9251708984375, -2.68572998046875, -2.4462890625, -2.20684814453125, -1.9674072265625, -1.72796630859375, -1.488525390625, -1.24908447265625, -1.0096435546875, -0.77020263671875, -0.53076171875, -0.29132080078125, -0.0518798828125, 0.18756103515625, 0.427001953125, 0.66644287109375, 0.9058837890625, 1.14532470703125, 1.384765625, 1.62420654296875, 1.8636474609375, 2.10308837890625, 2.342529296875, 2.58197021484375, 2.8214111328125, 3.06085205078125, 3.30029296875, 3.53973388671875, 3.7791748046875, 4.01861572265625, 4.258056640625, 4.49749755859375, 4.7369384765625, 4.97637939453125, 5.2158203125, 5.45526123046875, 5.6947021484375, 5.93414306640625, 6.173583984375, 6.41302490234375, 6.6524658203125, 6.89190673828125, 7.13134765625, 7.37078857421875, 7.6102294921875, 7.84967041015625, 8.089111328125, 8.32855224609375, 8.5679931640625, 8.80743408203125, 9.046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 12.0, 31.0, 80.0, 190.0, 294.0, 221.0, 99.0, 32.0, 17.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005657196044921875, -0.005524396896362305, -0.005391597747802734, -0.005258798599243164, -0.005125999450683594, -0.0049932003021240234, -0.004860401153564453, -0.004727602005004883, -0.0045948028564453125, -0.004462003707885742, -0.004329204559326172, -0.0041964054107666016, -0.004063606262207031, -0.003930807113647461, -0.0037980079650878906, -0.0036652088165283203, -0.00353240966796875, -0.0033996105194091797, -0.0032668113708496094, -0.003134012222290039, -0.0030012130737304688, -0.0028684139251708984, -0.002735614776611328, -0.002602815628051758, -0.0024700164794921875, -0.002337217330932617, -0.002204418182373047, -0.0020716190338134766, -0.0019388198852539062, -0.001806020736694336, -0.0016732215881347656, -0.0015404224395751953, -0.001407623291015625, -0.0012748241424560547, -0.0011420249938964844, -0.001009225845336914, -0.0008764266967773438, -0.0007436275482177734, -0.0006108283996582031, -0.0004780292510986328, -0.0003452301025390625, -0.0002124309539794922, -7.963180541992188e-05, 5.316734313964844e-05, 0.00018596649169921875, 0.00031876564025878906, 0.0004515647888183594, 0.0005843639373779297, 0.0007171630859375, 0.0008499622344970703, 0.0009827613830566406, 0.001115560531616211, 0.0012483596801757812, 0.0013811588287353516, 0.0015139579772949219, 0.0016467571258544922, 0.0017795562744140625, 0.0019123554229736328, 0.002045154571533203, 0.0021779537200927734, 0.0023107528686523438, 0.002443552017211914, 0.0025763511657714844, 0.0027091503143310547, 0.002841949462890625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 12.0, 16.0, 11.0, 24.0, 39.0, 55.0, 119.0, 215.0, 395.0, 903.0, 2018.0, 6182.0, 25801.0, 163766.0, 602494.0, 203868.0, 31139.0, 7223.0, 2246.0, 962.0, 476.0, 236.0, 126.0, 80.0, 45.0, 24.0, 19.0, 14.0, 9.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.6650390625, -6.431640625, -6.1982421875, -5.96484375, -5.7314453125, -5.498046875, -5.2646484375, -5.03125, -4.7978515625, -4.564453125, -4.3310546875, -4.09765625, -3.8642578125, -3.630859375, -3.3974609375, -3.1640625, -2.9306640625, -2.697265625, -2.4638671875, -2.23046875, -1.9970703125, -1.763671875, -1.5302734375, -1.296875, -1.0634765625, -0.830078125, -0.5966796875, -0.36328125, -0.1298828125, 0.103515625, 0.3369140625, 0.5703125, 0.8037109375, 1.037109375, 1.2705078125, 1.50390625, 1.7373046875, 1.970703125, 2.2041015625, 2.4375, 2.6708984375, 2.904296875, 3.1376953125, 3.37109375, 3.6044921875, 3.837890625, 4.0712890625, 4.3046875, 4.5380859375, 4.771484375, 5.0048828125, 5.23828125, 5.4716796875, 5.705078125, 5.9384765625, 6.171875, 6.4052734375, 6.638671875, 6.8720703125, 7.10546875, 7.3388671875, 7.572265625, 7.8056640625, 8.0390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 12.0, 15.0, 14.0, 33.0, 44.0, 39.0, 53.0, 83.0, 76.0, 88.0, 82.0, 73.0, 91.0, 69.0, 53.0, 48.0, 32.0, 24.0, 16.0, 15.0, 12.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.677978515625, -4.49267578125, -4.307373046875, -4.1220703125, -3.936767578125, -3.75146484375, -3.566162109375, -3.380859375, -3.195556640625, -3.01025390625, -2.824951171875, -2.6396484375, -2.454345703125, -2.26904296875, -2.083740234375, -1.8984375, -1.713134765625, -1.52783203125, -1.342529296875, -1.1572265625, -0.971923828125, -0.78662109375, -0.601318359375, -0.416015625, -0.230712890625, -0.04541015625, 0.139892578125, 0.3251953125, 0.510498046875, 0.69580078125, 0.881103515625, 1.06640625, 1.251708984375, 1.43701171875, 1.622314453125, 1.8076171875, 1.992919921875, 2.17822265625, 2.363525390625, 2.548828125, 2.734130859375, 2.91943359375, 3.104736328125, 3.2900390625, 3.475341796875, 3.66064453125, 3.845947265625, 4.03125, 4.216552734375, 4.40185546875, 4.587158203125, 4.7724609375, 4.957763671875, 5.14306640625, 5.328369140625, 5.513671875, 5.698974609375, 5.88427734375, 6.069580078125, 6.2548828125, 6.440185546875, 6.62548828125, 6.810791015625, 6.99609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 19.0, 28.0, 80.0, 136.0, 185.0, 213.0, 151.0, 103.0, 49.0, 21.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.40628051757812, -138.2462615966797, -134.0862579345703, -129.92623901367188, -125.76622009277344, -121.60620880126953, -117.44619750976562, -113.28617858886719, -109.12615966796875, -104.96614837646484, -100.8061294555664, -96.6461181640625, -92.48609924316406, -88.32608795166016, -84.16607666015625, -80.00605773925781, -75.8460464477539, -71.68603515625, -67.52601623535156, -63.366004943847656, -59.20598602294922, -55.04597473144531, -50.88595962524414, -46.72594451904297, -42.5659294128418, -38.405914306640625, -34.24589920043945, -30.085886001586914, -25.925870895385742, -21.76585578918457, -17.60584259033203, -13.44582748413086, -9.285820007324219, -5.125805377960205, -0.9657907485961914, 3.194223403930664, 7.354238510131836, 11.514253616333008, 15.674266815185547, 19.83428192138672, 23.99429702758789, 28.154312133789062, 32.314327239990234, 36.474342346191406, 40.63435363769531, 44.79437255859375, 48.954383850097656, 53.11439895629883, 57.2744140625, 61.43442916870117, 65.59444427490234, 69.75445556640625, 73.91447448730469, 78.0744857788086, 82.2344970703125, 86.39451599121094, 90.55453491210938, 94.71454620361328, 98.87456512451172, 103.03457641601562, 107.19459533691406, 111.35460662841797, 115.51461791992188, 119.67463684082031, 123.83464813232422]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 3.0, 10.0, 2.0, 5.0, 6.0, 11.0, 11.0, 17.0, 18.0, 24.0, 22.0, 34.0, 26.0, 28.0, 36.0, 47.0, 46.0, 39.0, 43.0, 43.0, 45.0, 51.0, 50.0, 46.0, 37.0, 28.0, 40.0, 30.0, 34.0, 22.0, 18.0, 19.0, 17.0, 13.0, 14.0, 8.0, 11.0, 3.0, 10.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.26339340209961, -44.57250213623047, -42.88160705566406, -41.19071578979492, -39.49982452392578, -37.808929443359375, -36.118038177490234, -34.427146911621094, -32.73625183105469, -31.045358657836914, -29.35446548461914, -27.66357421875, -25.972681045532227, -24.281787872314453, -22.590896606445312, -20.90000343322754, -19.209110260009766, -17.518217086791992, -15.827324867248535, -14.136432647705078, -12.445539474487305, -10.754646301269531, -9.063754081726074, -7.372861862182617, -5.681968688964844, -3.9910759925842285, -2.3001832962036133, -0.609290599822998, 1.0816020965576172, 2.7724952697753906, 4.463387489318848, 6.154279708862305, 7.8451690673828125, 9.536062240600586, 11.226954460144043, 12.9178466796875, 14.608739852905273, 16.299633026123047, 17.990524291992188, 19.68141746520996, 21.372310638427734, 23.063203811645508, 24.75409698486328, 26.444988250732422, 28.135881423950195, 29.82677459716797, 31.51766586303711, 33.20855712890625, 34.899452209472656, 36.5903434753418, 38.2812385559082, 39.972129821777344, 41.66302490234375, 43.35391616821289, 45.04480743408203, 46.73570251464844, 48.42659378051758, 50.11748504638672, 51.808380126953125, 53.499271392822266, 55.190162658691406, 56.88105773925781, 58.57194900512695, 60.262840270996094, 61.9537353515625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 14.0, 17.0, 26.0, 29.0, 60.0, 62.0, 104.0, 146.0, 218.0, 352.0, 501.0, 879.0, 1486.0, 2812.0, 6001.0, 18151.0, 153186.0, 3946978.0, 43494.0, 10342.0, 4290.0, 2040.0, 1093.0, 696.0, 432.0, 248.0, 179.0, 137.0, 78.0, 51.0, 44.0, 31.0, 19.0, 13.0, 13.0, 10.0, 7.0, 4.0, 8.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-16.515625, -16.0472412109375, -15.578857421875, -15.1104736328125, -14.64208984375, -14.1737060546875, -13.705322265625, -13.2369384765625, -12.7685546875, -12.3001708984375, -11.831787109375, -11.3634033203125, -10.89501953125, -10.4266357421875, -9.958251953125, -9.4898681640625, -9.021484375, -8.5531005859375, -8.084716796875, -7.6163330078125, -7.14794921875, -6.6795654296875, -6.211181640625, -5.7427978515625, -5.2744140625, -4.8060302734375, -4.337646484375, -3.8692626953125, -3.40087890625, -2.9324951171875, -2.464111328125, -1.9957275390625, -1.52734375, -1.0589599609375, -0.590576171875, -0.1221923828125, 0.34619140625, 0.8145751953125, 1.282958984375, 1.7513427734375, 2.2197265625, 2.6881103515625, 3.156494140625, 3.6248779296875, 4.09326171875, 4.5616455078125, 5.030029296875, 5.4984130859375, 5.966796875, 6.4351806640625, 6.903564453125, 7.3719482421875, 7.84033203125, 8.3087158203125, 8.777099609375, 9.2454833984375, 9.7138671875, 10.1822509765625, 10.650634765625, 11.1190185546875, 11.58740234375, 12.0557861328125, 12.524169921875, 12.9925537109375, 13.4609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 6.0, 9.0, 6.0, 12.0, 16.0, 33.0, 21.0, 22.0, 23.0, 27.0, 32.0, 40.0, 51.0, 51.0, 45.0, 56.0, 42.0, 46.0, 48.0, 60.0, 38.0, 30.0, 33.0, 37.0, 43.0, 26.0, 26.0, 28.0, 18.0, 16.0, 9.0, 9.0, 7.0, 7.0, 1.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.061004638671875, -1.98529052734375, -1.909576416015625, -1.8338623046875, -1.758148193359375, -1.68243408203125, -1.606719970703125, -1.531005859375, -1.455291748046875, -1.37957763671875, -1.303863525390625, -1.2281494140625, -1.152435302734375, -1.07672119140625, -1.001007080078125, -0.92529296875, -0.849578857421875, -0.77386474609375, -0.698150634765625, -0.6224365234375, -0.546722412109375, -0.47100830078125, -0.395294189453125, -0.319580078125, -0.243865966796875, -0.16815185546875, -0.092437744140625, -0.0167236328125, 0.058990478515625, 0.13470458984375, 0.210418701171875, 0.2861328125, 0.361846923828125, 0.43756103515625, 0.513275146484375, 0.5889892578125, 0.664703369140625, 0.74041748046875, 0.816131591796875, 0.891845703125, 0.967559814453125, 1.04327392578125, 1.118988037109375, 1.1947021484375, 1.270416259765625, 1.34613037109375, 1.421844482421875, 1.49755859375, 1.573272705078125, 1.64898681640625, 1.724700927734375, 1.8004150390625, 1.876129150390625, 1.95184326171875, 2.027557373046875, 2.103271484375, 2.178985595703125, 2.25469970703125, 2.330413818359375, 2.4061279296875, 2.481842041015625, 2.55755615234375, 2.633270263671875, 2.708984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 5.0, 5.0, 6.0, 15.0, 10.0, 14.0, 33.0, 38.0, 46.0, 67.0, 129.0, 184.0, 376.0, 792.0, 2038.0, 8325.0, 168842.0, 3994515.0, 13965.0, 2761.0, 1056.0, 450.0, 232.0, 129.0, 85.0, 45.0, 28.0, 29.0, 13.0, 16.0, 7.0, 6.0, 6.0, 1.0, 3.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.126953125, -45.66015625, -44.193359375, -42.7265625, -41.259765625, -39.79296875, -38.326171875, -36.859375, -35.392578125, -33.92578125, -32.458984375, -30.9921875, -29.525390625, -28.05859375, -26.591796875, -25.125, -23.658203125, -22.19140625, -20.724609375, -19.2578125, -17.791015625, -16.32421875, -14.857421875, -13.390625, -11.923828125, -10.45703125, -8.990234375, -7.5234375, -6.056640625, -4.58984375, -3.123046875, -1.65625, -0.189453125, 1.27734375, 2.744140625, 4.2109375, 5.677734375, 7.14453125, 8.611328125, 10.078125, 11.544921875, 13.01171875, 14.478515625, 15.9453125, 17.412109375, 18.87890625, 20.345703125, 21.8125, 23.279296875, 24.74609375, 26.212890625, 27.6796875, 29.146484375, 30.61328125, 32.080078125, 33.546875, 35.013671875, 36.48046875, 37.947265625, 39.4140625, 40.880859375, 42.34765625, 43.814453125, 45.28125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 18.0, 34.0, 116.0, 3406.0, 354.0, 60.0, 33.0, 12.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.5831298828125, -9.353759765625, -9.1243896484375, -8.89501953125, -8.6656494140625, -8.436279296875, -8.2069091796875, -7.9775390625, -7.7481689453125, -7.518798828125, -7.2894287109375, -7.06005859375, -6.8306884765625, -6.601318359375, -6.3719482421875, -6.142578125, -5.9132080078125, -5.683837890625, -5.4544677734375, -5.22509765625, -4.9957275390625, -4.766357421875, -4.5369873046875, -4.3076171875, -4.0782470703125, -3.848876953125, -3.6195068359375, -3.39013671875, -3.1607666015625, -2.931396484375, -2.7020263671875, -2.47265625, -2.2432861328125, -2.013916015625, -1.7845458984375, -1.55517578125, -1.3258056640625, -1.096435546875, -0.8670654296875, -0.6376953125, -0.4083251953125, -0.178955078125, 0.0504150390625, 0.27978515625, 0.5091552734375, 0.738525390625, 0.9678955078125, 1.197265625, 1.4266357421875, 1.656005859375, 1.8853759765625, 2.11474609375, 2.3441162109375, 2.573486328125, 2.8028564453125, 3.0322265625, 3.2615966796875, 3.490966796875, 3.7203369140625, 3.94970703125, 4.1790771484375, 4.408447265625, 4.6378173828125, 4.8671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 18.0, 18.0, 22.0, 31.0, 39.0, 38.0, 58.0, 51.0, 70.0, 87.0, 77.0, 85.0, 61.0, 45.0, 60.0, 35.0, 36.0, 30.0, 19.0, 23.0, 15.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.881790161132812, -10.496482849121094, -10.111175537109375, -9.72586727142334, -9.340559959411621, -8.955252647399902, -8.569944381713867, -8.184637069702148, -7.79932975769043, -7.414022445678711, -7.028714656829834, -6.643406867980957, -6.258099555969238, -5.8727922439575195, -5.487484455108643, -5.102176666259766, -4.716869354248047, -4.331562042236328, -3.946254253387451, -3.5609467029571533, -3.1756391525268555, -2.7903316020965576, -2.4050240516662598, -2.019716501235962, -1.634408950805664, -1.2491014003753662, -0.8637938499450684, -0.4784862995147705, -0.09317874908447266, 0.2921288013458252, 0.677436351776123, 1.062743902206421, 1.4480524063110352, 1.833359956741333, 2.218667507171631, 2.6039750576019287, 2.9892826080322266, 3.3745901584625244, 3.7598977088928223, 4.145205497741699, 4.530512809753418, 4.915820121765137, 5.301127910614014, 5.686435699462891, 6.071743011474609, 6.457050323486328, 6.842358112335205, 7.227665901184082, 7.612973213195801, 7.9982805252075195, 8.383588790893555, 8.768896102905273, 9.154203414916992, 9.539510726928711, 9.92481803894043, 10.310126304626465, 10.695433616638184, 11.080740928649902, 11.466049194335938, 11.851356506347656, 12.236663818359375, 12.621971130371094, 13.007278442382812, 13.392586708068848, 13.777894020080566]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 8.0, 6.0, 11.0, 5.0, 15.0, 14.0, 12.0, 11.0, 19.0, 13.0, 22.0, 20.0, 22.0, 34.0, 40.0, 33.0, 42.0, 34.0, 30.0, 38.0, 35.0, 43.0, 31.0, 40.0, 39.0, 50.0, 43.0, 30.0, 27.0, 25.0, 35.0, 26.0, 13.0, 25.0, 16.0, 15.0, 9.0, 9.0, 7.0, 4.0, 13.0, 6.0, 3.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.925076961517334, -7.673674583435059, -7.422272205352783, -7.170869827270508, -6.919467449188232, -6.668065071105957, -6.416662216186523, -6.165260314941406, -5.913857460021973, -5.662455081939697, -5.411052703857422, -5.1596503257751465, -4.908247947692871, -4.656845569610596, -4.40544319152832, -4.154040336608887, -3.9026384353637695, -3.651236057281494, -3.3998336791992188, -3.1484313011169434, -2.897028923034668, -2.6456265449523926, -2.394223928451538, -2.1428215503692627, -1.8914191722869873, -1.640016794204712, -1.3886144161224365, -1.1372119188308716, -0.8858095407485962, -0.6344071626663208, -0.38300466537475586, -0.13160228729248047, 0.11980056762695312, 0.3712029755115509, 0.6226053833961487, 0.8740078210830688, 1.1254101991653442, 1.3768125772476196, 1.6282150745391846, 1.87961745262146, 2.1310198307037354, 2.3824222087860107, 2.633824586868286, 2.8852272033691406, 3.136629581451416, 3.3880319595336914, 3.639434337615967, 3.890836715698242, 4.142239093780518, 4.393641471862793, 4.645043849945068, 4.896446228027344, 5.147848606109619, 5.3992509841918945, 5.650653839111328, 5.902055740356445, 6.153458595275879, 6.404860973358154, 6.65626335144043, 6.907665729522705, 7.1590681076049805, 7.410470485687256, 7.661872863769531, 7.913275718688965, 8.164677619934082]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 12.0, 12.0, 17.0, 22.0, 31.0, 25.0, 45.0, 69.0, 88.0, 110.0, 157.0, 263.0, 452.0, 741.0, 1247.0, 2363.0, 4753.0, 9825.0, 20749.0, 44704.0, 96348.0, 193620.0, 273974.0, 203746.0, 103496.0, 47876.0, 22257.0, 10507.0, 5084.0, 2510.0, 1360.0, 757.0, 419.0, 272.0, 188.0, 116.0, 104.0, 56.0, 43.0, 31.0, 26.0, 17.0, 13.0, 10.0, 5.0, 13.0, 3.0, 3.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0], "bins": [-6.3046875, -6.1109619140625, -5.917236328125, -5.7235107421875, -5.52978515625, -5.3360595703125, -5.142333984375, -4.9486083984375, -4.7548828125, -4.5611572265625, -4.367431640625, -4.1737060546875, -3.97998046875, -3.7862548828125, -3.592529296875, -3.3988037109375, -3.205078125, -3.0113525390625, -2.817626953125, -2.6239013671875, -2.43017578125, -2.2364501953125, -2.042724609375, -1.8489990234375, -1.6552734375, -1.4615478515625, -1.267822265625, -1.0740966796875, -0.88037109375, -0.6866455078125, -0.492919921875, -0.2991943359375, -0.10546875, 0.0882568359375, 0.281982421875, 0.4757080078125, 0.66943359375, 0.8631591796875, 1.056884765625, 1.2506103515625, 1.4443359375, 1.6380615234375, 1.831787109375, 2.0255126953125, 2.21923828125, 2.4129638671875, 2.606689453125, 2.8004150390625, 2.994140625, 3.1878662109375, 3.381591796875, 3.5753173828125, 3.76904296875, 3.9627685546875, 4.156494140625, 4.3502197265625, 4.5439453125, 4.7376708984375, 4.931396484375, 5.1251220703125, 5.31884765625, 5.5125732421875, 5.706298828125, 5.9000244140625, 6.09375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 8.0, 11.0, 14.0, 19.0, 21.0, 18.0, 26.0, 26.0, 30.0, 42.0, 39.0, 40.0, 53.0, 47.0, 42.0, 46.0, 46.0, 40.0, 40.0, 49.0, 41.0, 34.0, 37.0, 31.0, 34.0, 27.0, 18.0, 20.0, 14.0, 20.0, 5.0, 11.0, 6.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.619140625, -2.531707763671875, -2.44427490234375, -2.356842041015625, -2.2694091796875, -2.181976318359375, -2.09454345703125, -2.007110595703125, -1.919677734375, -1.832244873046875, -1.74481201171875, -1.657379150390625, -1.5699462890625, -1.482513427734375, -1.39508056640625, -1.307647705078125, -1.22021484375, -1.132781982421875, -1.04534912109375, -0.957916259765625, -0.8704833984375, -0.783050537109375, -0.69561767578125, -0.608184814453125, -0.520751953125, -0.433319091796875, -0.34588623046875, -0.258453369140625, -0.1710205078125, -0.083587646484375, 0.00384521484375, 0.091278076171875, 0.1787109375, 0.266143798828125, 0.35357666015625, 0.441009521484375, 0.5284423828125, 0.615875244140625, 0.70330810546875, 0.790740966796875, 0.878173828125, 0.965606689453125, 1.05303955078125, 1.140472412109375, 1.2279052734375, 1.315338134765625, 1.40277099609375, 1.490203857421875, 1.57763671875, 1.665069580078125, 1.75250244140625, 1.839935302734375, 1.9273681640625, 2.014801025390625, 2.10223388671875, 2.189666748046875, 2.277099609375, 2.364532470703125, 2.45196533203125, 2.539398193359375, 2.6268310546875, 2.714263916015625, 2.80169677734375, 2.889129638671875, 2.9765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 5.0, 11.0, 15.0, 28.0, 23.0, 35.0, 49.0, 67.0, 117.0, 141.0, 248.0, 322.0, 526.0, 872.0, 1829.0, 4862.0, 18801.0, 102247.0, 559403.0, 296311.0, 46175.0, 9976.0, 3069.0, 1358.0, 725.0, 445.0, 278.0, 176.0, 129.0, 87.0, 57.0, 48.0, 27.0, 22.0, 16.0, 15.0, 5.0, 9.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.109375, -13.678955078125, -13.24853515625, -12.818115234375, -12.3876953125, -11.957275390625, -11.52685546875, -11.096435546875, -10.666015625, -10.235595703125, -9.80517578125, -9.374755859375, -8.9443359375, -8.513916015625, -8.08349609375, -7.653076171875, -7.22265625, -6.792236328125, -6.36181640625, -5.931396484375, -5.5009765625, -5.070556640625, -4.64013671875, -4.209716796875, -3.779296875, -3.348876953125, -2.91845703125, -2.488037109375, -2.0576171875, -1.627197265625, -1.19677734375, -0.766357421875, -0.3359375, 0.094482421875, 0.52490234375, 0.955322265625, 1.3857421875, 1.816162109375, 2.24658203125, 2.677001953125, 3.107421875, 3.537841796875, 3.96826171875, 4.398681640625, 4.8291015625, 5.259521484375, 5.68994140625, 6.120361328125, 6.55078125, 6.981201171875, 7.41162109375, 7.842041015625, 8.2724609375, 8.702880859375, 9.13330078125, 9.563720703125, 9.994140625, 10.424560546875, 10.85498046875, 11.285400390625, 11.7158203125, 12.146240234375, 12.57666015625, 13.007080078125, 13.4375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 10.0, 12.0, 9.0, 11.0, 15.0, 30.0, 25.0, 41.0, 29.0, 28.0, 59.0, 49.0, 59.0, 52.0, 53.0, 62.0, 56.0, 50.0, 49.0, 51.0, 39.0, 39.0, 31.0, 36.0, 30.0, 20.0, 14.0, 11.0, 5.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.015625, -22.4276123046875, -21.839599609375, -21.2515869140625, -20.66357421875, -20.0755615234375, -19.487548828125, -18.8995361328125, -18.3115234375, -17.7235107421875, -17.135498046875, -16.5474853515625, -15.95947265625, -15.3714599609375, -14.783447265625, -14.1954345703125, -13.607421875, -13.0194091796875, -12.431396484375, -11.8433837890625, -11.25537109375, -10.6673583984375, -10.079345703125, -9.4913330078125, -8.9033203125, -8.3153076171875, -7.727294921875, -7.1392822265625, -6.55126953125, -5.9632568359375, -5.375244140625, -4.7872314453125, -4.19921875, -3.6112060546875, -3.023193359375, -2.4351806640625, -1.84716796875, -1.2591552734375, -0.671142578125, -0.0831298828125, 0.5048828125, 1.0928955078125, 1.680908203125, 2.2689208984375, 2.85693359375, 3.4449462890625, 4.032958984375, 4.6209716796875, 5.208984375, 5.7969970703125, 6.385009765625, 6.9730224609375, 7.56103515625, 8.1490478515625, 8.737060546875, 9.3250732421875, 9.9130859375, 10.5010986328125, 11.089111328125, 11.6771240234375, 12.26513671875, 12.8531494140625, 13.441162109375, 14.0291748046875, 14.6171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 7.0, 6.0, 8.0, 11.0, 16.0, 32.0, 44.0, 71.0, 108.0, 200.0, 259.0, 427.0, 837.0, 1580.0, 3362.0, 7971.0, 23399.0, 91761.0, 410063.0, 385387.0, 86014.0, 22469.0, 7751.0, 3205.0, 1510.0, 804.0, 494.0, 250.0, 159.0, 114.0, 88.0, 38.0, 33.0, 21.0, 20.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.80291748046875, -5.6214599609375, -5.44000244140625, -5.258544921875, -5.07708740234375, -4.8956298828125, -4.71417236328125, -4.53271484375, -4.35125732421875, -4.1697998046875, -3.98834228515625, -3.806884765625, -3.62542724609375, -3.4439697265625, -3.26251220703125, -3.0810546875, -2.89959716796875, -2.7181396484375, -2.53668212890625, -2.355224609375, -2.17376708984375, -1.9923095703125, -1.81085205078125, -1.62939453125, -1.44793701171875, -1.2664794921875, -1.08502197265625, -0.903564453125, -0.72210693359375, -0.5406494140625, -0.35919189453125, -0.177734375, 0.00372314453125, 0.1851806640625, 0.36663818359375, 0.548095703125, 0.72955322265625, 0.9110107421875, 1.09246826171875, 1.27392578125, 1.45538330078125, 1.6368408203125, 1.81829833984375, 1.999755859375, 2.18121337890625, 2.3626708984375, 2.54412841796875, 2.7255859375, 2.90704345703125, 3.0885009765625, 3.26995849609375, 3.451416015625, 3.63287353515625, 3.8143310546875, 3.99578857421875, 4.17724609375, 4.35870361328125, 4.5401611328125, 4.72161865234375, 4.903076171875, 5.08453369140625, 5.2659912109375, 5.44744873046875, 5.62890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 11.0, 17.0, 22.0, 29.0, 46.0, 53.0, 89.0, 92.0, 101.0, 107.0, 90.0, 82.0, 55.0, 48.0, 46.0, 27.0, 23.0, 19.0, 10.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011491775512695312, -0.0011051446199417114, -0.0010611116886138916, -0.0010170787572860718, -0.000973045825958252, -0.0009290128946304321, -0.0008849799633026123, -0.0008409470319747925, -0.0007969141006469727, -0.0007528811693191528, -0.000708848237991333, -0.0006648153066635132, -0.0006207823753356934, -0.0005767494440078735, -0.0005327165126800537, -0.0004886835813522339, -0.00044465065002441406, -0.00040061771869659424, -0.0003565847873687744, -0.0003125518560409546, -0.00026851892471313477, -0.00022448599338531494, -0.00018045306205749512, -0.0001364201307296753, -9.238719940185547e-05, -4.8354268074035645e-05, -4.32133674621582e-06, 3.9711594581604004e-05, 8.374452590942383e-05, 0.00012777745723724365, 0.00017181038856506348, 0.0002158433198928833, 0.0002598762512207031, 0.00030390918254852295, 0.0003479421138763428, 0.0003919750452041626, 0.0004360079765319824, 0.00048004090785980225, 0.0005240738391876221, 0.0005681067705154419, 0.0006121397018432617, 0.0006561726331710815, 0.0007002055644989014, 0.0007442384958267212, 0.000788271427154541, 0.0008323043584823608, 0.0008763372898101807, 0.0009203702211380005, 0.0009644031524658203, 0.0010084360837936401, 0.00105246901512146, 0.0010965019464492798, 0.0011405348777770996, 0.0011845678091049194, 0.0012286007404327393, 0.001272633671760559, 0.001316666603088379, 0.0013606995344161987, 0.0014047324657440186, 0.0014487653970718384, 0.0014927983283996582, 0.001536831259727478, 0.0015808641910552979, 0.0016248971223831177, 0.0016689300537109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 17.0, 20.0, 23.0, 48.0, 80.0, 137.0, 366.0, 831.0, 2863.0, 14212.0, 205896.0, 760407.0, 54619.0, 6316.0, 1659.0, 525.0, 235.0, 115.0, 59.0, 38.0, 21.0, 17.0, 12.0, 6.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.6776123046875, -12.284912109375, -11.8922119140625, -11.49951171875, -11.1068115234375, -10.714111328125, -10.3214111328125, -9.9287109375, -9.5360107421875, -9.143310546875, -8.7506103515625, -8.35791015625, -7.9652099609375, -7.572509765625, -7.1798095703125, -6.787109375, -6.3944091796875, -6.001708984375, -5.6090087890625, -5.21630859375, -4.8236083984375, -4.430908203125, -4.0382080078125, -3.6455078125, -3.2528076171875, -2.860107421875, -2.4674072265625, -2.07470703125, -1.6820068359375, -1.289306640625, -0.8966064453125, -0.50390625, -0.1112060546875, 0.281494140625, 0.6741943359375, 1.06689453125, 1.4595947265625, 1.852294921875, 2.2449951171875, 2.6376953125, 3.0303955078125, 3.423095703125, 3.8157958984375, 4.20849609375, 4.6011962890625, 4.993896484375, 5.3865966796875, 5.779296875, 6.1719970703125, 6.564697265625, 6.9573974609375, 7.35009765625, 7.7427978515625, 8.135498046875, 8.5281982421875, 8.9208984375, 9.3135986328125, 9.706298828125, 10.0989990234375, 10.49169921875, 10.8843994140625, 11.277099609375, 11.6697998046875, 12.0625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 7.0, 7.0, 8.0, 15.0, 23.0, 22.0, 44.0, 71.0, 92.0, 96.0, 101.0, 98.0, 105.0, 95.0, 51.0, 47.0, 38.0, 31.0, 20.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26953125, -5.99798583984375, -5.7264404296875, -5.45489501953125, -5.183349609375, -4.91180419921875, -4.6402587890625, -4.36871337890625, -4.09716796875, -3.82562255859375, -3.5540771484375, -3.28253173828125, -3.010986328125, -2.73944091796875, -2.4678955078125, -2.19635009765625, -1.9248046875, -1.65325927734375, -1.3817138671875, -1.11016845703125, -0.838623046875, -0.56707763671875, -0.2955322265625, -0.02398681640625, 0.24755859375, 0.51910400390625, 0.7906494140625, 1.06219482421875, 1.333740234375, 1.60528564453125, 1.8768310546875, 2.14837646484375, 2.419921875, 2.69146728515625, 2.9630126953125, 3.23455810546875, 3.506103515625, 3.77764892578125, 4.0491943359375, 4.32073974609375, 4.59228515625, 4.86383056640625, 5.1353759765625, 5.40692138671875, 5.678466796875, 5.95001220703125, 6.2215576171875, 6.49310302734375, 6.7646484375, 7.03619384765625, 7.3077392578125, 7.57928466796875, 7.850830078125, 8.12237548828125, 8.3939208984375, 8.66546630859375, 8.93701171875, 9.20855712890625, 9.4801025390625, 9.75164794921875, 10.023193359375, 10.29473876953125, 10.5662841796875, 10.83782958984375, 11.109375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 16.0, 26.0, 51.0, 62.0, 109.0, 148.0, 144.0, 151.0, 99.0, 86.0, 51.0, 24.0, 12.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.41873931884766, -110.5461654663086, -106.67359924316406, -102.801025390625, -98.92845916748047, -95.0558853149414, -91.18331909179688, -87.31074523925781, -83.43817138671875, -79.56559753417969, -75.69303131103516, -71.8204574584961, -67.94789123535156, -64.0753173828125, -60.2027473449707, -56.330177307128906, -52.457611083984375, -48.58504104614258, -44.71247100830078, -40.83989715576172, -36.96733093261719, -33.094757080078125, -29.222187042236328, -25.34961700439453, -21.477046966552734, -17.604476928710938, -13.731905937194824, -9.859334945678711, -5.986764907836914, -2.114194869995117, 1.7583770751953125, 5.630947113037109, 9.503524780273438, 13.376094818115234, 17.24866485595703, 21.12123680114746, 24.993806838989258, 28.866376876831055, 32.738948822021484, 36.61151885986328, 40.48408889770508, 44.356658935546875, 48.22922897338867, 52.10179901123047, 55.97437286376953, 59.84693908691406, 63.719512939453125, 67.59208679199219, 71.46465301513672, 75.33722686767578, 79.20979309082031, 83.08236694335938, 86.9549331665039, 90.82750701904297, 94.7000732421875, 98.57264709472656, 102.44522094726562, 106.31779479980469, 110.19036102294922, 114.06293487548828, 117.93550109863281, 121.80807495117188, 125.68064880371094, 129.55322265625, 133.42578125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 8.0, 8.0, 13.0, 20.0, 14.0, 20.0, 13.0, 24.0, 20.0, 25.0, 38.0, 43.0, 33.0, 51.0, 38.0, 52.0, 50.0, 48.0, 50.0, 43.0, 61.0, 26.0, 45.0, 37.0, 38.0, 19.0, 34.0, 16.0, 16.0, 11.0, 15.0, 6.0, 6.0, 8.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-83.64219665527344, -81.24267578125, -78.84315490722656, -76.44363403320312, -74.04411315917969, -71.64459228515625, -69.24507141113281, -66.84555053710938, -64.44602966308594, -62.0465087890625, -59.64698791503906, -57.247467041015625, -54.84794616699219, -52.44842529296875, -50.04890823364258, -47.64938735961914, -45.24987030029297, -42.85034942626953, -40.450828552246094, -38.051307678222656, -35.65178680419922, -33.25226593017578, -30.85274887084961, -28.453227996826172, -26.053707122802734, -23.654186248779297, -21.25466537475586, -18.855146408081055, -16.455625534057617, -14.05610466003418, -11.656584739685059, -9.257064819335938, -6.857551574707031, -4.458031177520752, -2.0585107803344727, 0.34100961685180664, 2.740530014038086, 5.140050888061523, 7.5395708084106445, 9.939090728759766, 12.338611602783203, 14.73813247680664, 17.137653350830078, 19.537172317504883, 21.93669319152832, 24.336214065551758, 26.735733032226562, 29.13525390625, 31.534774780273438, 33.934295654296875, 36.33381652832031, 38.73333740234375, 41.13285827636719, 43.532379150390625, 45.9318962097168, 48.331417083740234, 50.73093795776367, 53.13045883178711, 55.52997970581055, 57.929500579833984, 60.329017639160156, 62.728538513183594, 65.12805938720703, 67.52758026123047, 69.9271011352539]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 12.0, 17.0, 18.0, 13.0, 35.0, 45.0, 57.0, 55.0, 72.0, 105.0, 179.0, 279.0, 510.0, 1002.0, 2435.0, 6873.0, 31128.0, 3934465.0, 192177.0, 16486.0, 4644.0, 1696.0, 770.0, 432.0, 221.0, 139.0, 96.0, 70.0, 56.0, 43.0, 27.0, 24.0, 26.0, 21.0, 8.0, 10.0, 11.0, 7.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.776611328125, -15.20947265625, -14.642333984375, -14.0751953125, -13.508056640625, -12.94091796875, -12.373779296875, -11.806640625, -11.239501953125, -10.67236328125, -10.105224609375, -9.5380859375, -8.970947265625, -8.40380859375, -7.836669921875, -7.26953125, -6.702392578125, -6.13525390625, -5.568115234375, -5.0009765625, -4.433837890625, -3.86669921875, -3.299560546875, -2.732421875, -2.165283203125, -1.59814453125, -1.031005859375, -0.4638671875, 0.103271484375, 0.67041015625, 1.237548828125, 1.8046875, 2.371826171875, 2.93896484375, 3.506103515625, 4.0732421875, 4.640380859375, 5.20751953125, 5.774658203125, 6.341796875, 6.908935546875, 7.47607421875, 8.043212890625, 8.6103515625, 9.177490234375, 9.74462890625, 10.311767578125, 10.87890625, 11.446044921875, 12.01318359375, 12.580322265625, 13.1474609375, 13.714599609375, 14.28173828125, 14.848876953125, 15.416015625, 15.983154296875, 16.55029296875, 17.117431640625, 17.6845703125, 18.251708984375, 18.81884765625, 19.385986328125, 19.953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 3.0, 4.0, 11.0, 9.0, 8.0, 20.0, 30.0, 27.0, 27.0, 30.0, 24.0, 31.0, 43.0, 47.0, 45.0, 56.0, 46.0, 52.0, 50.0, 48.0, 49.0, 51.0, 40.0, 38.0, 39.0, 27.0, 18.0, 18.0, 23.0, 18.0, 8.0, 10.0, 7.0, 2.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.68536376953125, -2.5914306640625, -2.49749755859375, -2.403564453125, -2.30963134765625, -2.2156982421875, -2.12176513671875, -2.02783203125, -1.93389892578125, -1.8399658203125, -1.74603271484375, -1.652099609375, -1.55816650390625, -1.4642333984375, -1.37030029296875, -1.2763671875, -1.18243408203125, -1.0885009765625, -0.99456787109375, -0.900634765625, -0.80670166015625, -0.7127685546875, -0.61883544921875, -0.52490234375, -0.43096923828125, -0.3370361328125, -0.24310302734375, -0.149169921875, -0.05523681640625, 0.0386962890625, 0.13262939453125, 0.2265625, 0.32049560546875, 0.4144287109375, 0.50836181640625, 0.602294921875, 0.69622802734375, 0.7901611328125, 0.88409423828125, 0.97802734375, 1.07196044921875, 1.1658935546875, 1.25982666015625, 1.353759765625, 1.44769287109375, 1.5416259765625, 1.63555908203125, 1.7294921875, 1.82342529296875, 1.9173583984375, 2.01129150390625, 2.105224609375, 2.19915771484375, 2.2930908203125, 2.38702392578125, 2.48095703125, 2.57489013671875, 2.6688232421875, 2.76275634765625, 2.856689453125, 2.95062255859375, 3.0445556640625, 3.13848876953125, 3.232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 10.0, 10.0, 12.0, 17.0, 34.0, 41.0, 36.0, 59.0, 83.0, 146.0, 214.0, 358.0, 673.0, 1169.0, 2606.0, 7870.0, 34805.0, 3914178.0, 204410.0, 18324.0, 5013.0, 1918.0, 933.0, 449.0, 306.0, 187.0, 130.0, 86.0, 60.0, 42.0, 19.0, 23.0, 15.0, 6.0, 7.0, 6.0, 9.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.6396484375, -23.888671875, -23.1376953125, -22.38671875, -21.6357421875, -20.884765625, -20.1337890625, -19.3828125, -18.6318359375, -17.880859375, -17.1298828125, -16.37890625, -15.6279296875, -14.876953125, -14.1259765625, -13.375, -12.6240234375, -11.873046875, -11.1220703125, -10.37109375, -9.6201171875, -8.869140625, -8.1181640625, -7.3671875, -6.6162109375, -5.865234375, -5.1142578125, -4.36328125, -3.6123046875, -2.861328125, -2.1103515625, -1.359375, -0.6083984375, 0.142578125, 0.8935546875, 1.64453125, 2.3955078125, 3.146484375, 3.8974609375, 4.6484375, 5.3994140625, 6.150390625, 6.9013671875, 7.65234375, 8.4033203125, 9.154296875, 9.9052734375, 10.65625, 11.4072265625, 12.158203125, 12.9091796875, 13.66015625, 14.4111328125, 15.162109375, 15.9130859375, 16.6640625, 17.4150390625, 18.166015625, 18.9169921875, 19.66796875, 20.4189453125, 21.169921875, 21.9208984375, 22.671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 11.0, 14.0, 12.0, 24.0, 40.0, 123.0, 2665.0, 953.0, 112.0, 50.0, 26.0, 13.0, 9.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.5, -7.31695556640625, -7.1339111328125, -6.95086669921875, -6.767822265625, -6.58477783203125, -6.4017333984375, -6.21868896484375, -6.03564453125, -5.85260009765625, -5.6695556640625, -5.48651123046875, -5.303466796875, -5.12042236328125, -4.9373779296875, -4.75433349609375, -4.5712890625, -4.38824462890625, -4.2052001953125, -4.02215576171875, -3.839111328125, -3.65606689453125, -3.4730224609375, -3.28997802734375, -3.10693359375, -2.92388916015625, -2.7408447265625, -2.55780029296875, -2.374755859375, -2.19171142578125, -2.0086669921875, -1.82562255859375, -1.642578125, -1.45953369140625, -1.2764892578125, -1.09344482421875, -0.910400390625, -0.72735595703125, -0.5443115234375, -0.36126708984375, -0.17822265625, 0.00482177734375, 0.1878662109375, 0.37091064453125, 0.553955078125, 0.73699951171875, 0.9200439453125, 1.10308837890625, 1.2861328125, 1.46917724609375, 1.6522216796875, 1.83526611328125, 2.018310546875, 2.20135498046875, 2.3843994140625, 2.56744384765625, 2.75048828125, 2.93353271484375, 3.1165771484375, 3.29962158203125, 3.482666015625, 3.66571044921875, 3.8487548828125, 4.03179931640625, 4.21484375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 10.0, 15.0, 18.0, 23.0, 34.0, 50.0, 56.0, 93.0, 81.0, 90.0, 93.0, 96.0, 79.0, 80.0, 59.0, 45.0, 22.0, 18.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.420623779296875, -17.859588623046875, -17.298551559448242, -16.737516403198242, -16.17647933959961, -15.61544418334961, -15.05440902709961, -14.493372917175293, -13.932336807250977, -13.37130069732666, -12.810264587402344, -12.249229431152344, -11.688193321228027, -11.127157211303711, -10.566122055053711, -10.005085945129395, -9.444049835205078, -8.883013725280762, -8.321977615356445, -7.760942459106445, -7.199906349182129, -6.6388702392578125, -6.077834606170654, -5.516798973083496, -4.95576286315918, -4.394726753234863, -3.833691120147705, -3.2726552486419678, -2.7116193771362305, -2.150583505630493, -1.5895476341247559, -1.0285117626190186, -0.46747589111328125, 0.09355998039245605, 0.6545958518981934, 1.2156317234039307, 1.776667594909668, 2.3377034664154053, 2.8987393379211426, 3.45977520942688, 4.020811080932617, 4.581847190856934, 5.142882823944092, 5.70391845703125, 6.264954566955566, 6.825990676879883, 7.387026309967041, 7.948061943054199, 8.509098052978516, 9.070134162902832, 9.631170272827148, 10.192205429077148, 10.753241539001465, 11.314277648925781, 11.875312805175781, 12.436348915100098, 12.997385025024414, 13.55842113494873, 14.119457244873047, 14.680492401123047, 15.241528511047363, 15.80256462097168, 16.36359977722168, 16.924636840820312, 17.485671997070312]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 11.0, 13.0, 11.0, 15.0, 9.0, 12.0, 12.0, 20.0, 23.0, 23.0, 38.0, 28.0, 29.0, 45.0, 37.0, 36.0, 48.0, 42.0, 47.0, 42.0, 36.0, 46.0, 41.0, 28.0, 36.0, 33.0, 26.0, 33.0, 27.0, 29.0, 18.0, 16.0, 20.0, 10.0, 8.0, 10.0, 9.0, 4.0, 3.0, 2.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.576684951782227, -11.26180362701416, -10.946922302246094, -10.632040977478027, -10.317159652709961, -10.002278327941895, -9.687397003173828, -9.372515678405762, -9.057634353637695, -8.742753028869629, -8.427871704101562, -8.112990379333496, -7.79810905456543, -7.483227729797363, -7.168346405029297, -6.8534650802612305, -6.538584232330322, -6.223702907562256, -5.9088215827941895, -5.593940258026123, -5.279058933258057, -4.96417760848999, -4.649296760559082, -4.334415435791016, -4.019534111022949, -3.704652786254883, -3.3897714614868164, -3.07489013671875, -2.7600088119506836, -2.445127487182617, -2.13024640083313, -1.8153650760650635, -1.500483512878418, -1.1856021881103516, -0.8707209229469299, -0.5558396577835083, -0.2409583330154419, 0.07392299175262451, 0.38880419731140137, 0.7036855220794678, 1.0185668468475342, 1.3334481716156006, 1.648329496383667, 1.9632107019424438, 2.2780919075012207, 2.592973232269287, 2.9078545570373535, 3.22273588180542, 3.5376172065734863, 3.8524985313415527, 4.167379856109619, 4.4822611808776855, 4.797142505645752, 5.112023830413818, 5.426904678344727, 5.741786003112793, 6.056667327880859, 6.371548652648926, 6.686429977416992, 7.001311302185059, 7.316192626953125, 7.631073951721191, 7.945955276489258, 8.260836601257324, 8.57571792602539]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 6.0, 17.0, 20.0, 34.0, 53.0, 97.0, 168.0, 292.0, 450.0, 880.0, 1432.0, 2501.0, 4588.0, 8555.0, 16882.0, 35386.0, 79303.0, 175447.0, 297179.0, 225352.0, 106272.0, 47493.0, 22079.0, 11054.0, 5693.0, 3092.0, 1741.0, 1018.0, 613.0, 330.0, 225.0, 111.0, 74.0, 46.0, 23.0, 14.0, 14.0, 8.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.6053466796875, -5.409912109375, -5.2144775390625, -5.01904296875, -4.8236083984375, -4.628173828125, -4.4327392578125, -4.2373046875, -4.0418701171875, -3.846435546875, -3.6510009765625, -3.45556640625, -3.2601318359375, -3.064697265625, -2.8692626953125, -2.673828125, -2.4783935546875, -2.282958984375, -2.0875244140625, -1.89208984375, -1.6966552734375, -1.501220703125, -1.3057861328125, -1.1103515625, -0.9149169921875, -0.719482421875, -0.5240478515625, -0.32861328125, -0.1331787109375, 0.062255859375, 0.2576904296875, 0.453125, 0.6485595703125, 0.843994140625, 1.0394287109375, 1.23486328125, 1.4302978515625, 1.625732421875, 1.8211669921875, 2.0166015625, 2.2120361328125, 2.407470703125, 2.6029052734375, 2.79833984375, 2.9937744140625, 3.189208984375, 3.3846435546875, 3.580078125, 3.7755126953125, 3.970947265625, 4.1663818359375, 4.36181640625, 4.5572509765625, 4.752685546875, 4.9481201171875, 5.1435546875, 5.3389892578125, 5.534423828125, 5.7298583984375, 5.92529296875, 6.1207275390625, 6.316162109375, 6.5115966796875, 6.70703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 6.0, 12.0, 13.0, 19.0, 12.0, 22.0, 22.0, 25.0, 33.0, 47.0, 45.0, 45.0, 49.0, 50.0, 42.0, 57.0, 67.0, 60.0, 50.0, 43.0, 35.0, 36.0, 35.0, 28.0, 24.0, 28.0, 21.0, 8.0, 11.0, 9.0, 8.0, 0.0, 8.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.734375, -3.62200927734375, -3.5096435546875, -3.39727783203125, -3.284912109375, -3.17254638671875, -3.0601806640625, -2.94781494140625, -2.83544921875, -2.72308349609375, -2.6107177734375, -2.49835205078125, -2.385986328125, -2.27362060546875, -2.1612548828125, -2.04888916015625, -1.9365234375, -1.82415771484375, -1.7117919921875, -1.59942626953125, -1.487060546875, -1.37469482421875, -1.2623291015625, -1.14996337890625, -1.03759765625, -0.92523193359375, -0.8128662109375, -0.70050048828125, -0.588134765625, -0.47576904296875, -0.3634033203125, -0.25103759765625, -0.138671875, -0.02630615234375, 0.0860595703125, 0.19842529296875, 0.310791015625, 0.42315673828125, 0.5355224609375, 0.64788818359375, 0.76025390625, 0.87261962890625, 0.9849853515625, 1.09735107421875, 1.209716796875, 1.32208251953125, 1.4344482421875, 1.54681396484375, 1.6591796875, 1.77154541015625, 1.8839111328125, 1.99627685546875, 2.108642578125, 2.22100830078125, 2.3333740234375, 2.44573974609375, 2.55810546875, 2.67047119140625, 2.7828369140625, 2.89520263671875, 3.007568359375, 3.11993408203125, 3.2322998046875, 3.34466552734375, 3.45703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 9.0, 11.0, 17.0, 20.0, 22.0, 45.0, 88.0, 93.0, 158.0, 254.0, 460.0, 816.0, 1674.0, 4893.0, 25524.0, 309692.0, 641605.0, 50499.0, 7963.0, 2260.0, 964.0, 539.0, 316.0, 216.0, 150.0, 79.0, 46.0, 43.0, 22.0, 20.0, 13.0, 7.0, 3.0, 12.0, 7.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.71875, -13.15087890625, -12.5830078125, -12.01513671875, -11.447265625, -10.87939453125, -10.3115234375, -9.74365234375, -9.17578125, -8.60791015625, -8.0400390625, -7.47216796875, -6.904296875, -6.33642578125, -5.7685546875, -5.20068359375, -4.6328125, -4.06494140625, -3.4970703125, -2.92919921875, -2.361328125, -1.79345703125, -1.2255859375, -0.65771484375, -0.08984375, 0.47802734375, 1.0458984375, 1.61376953125, 2.181640625, 2.74951171875, 3.3173828125, 3.88525390625, 4.453125, 5.02099609375, 5.5888671875, 6.15673828125, 6.724609375, 7.29248046875, 7.8603515625, 8.42822265625, 8.99609375, 9.56396484375, 10.1318359375, 10.69970703125, 11.267578125, 11.83544921875, 12.4033203125, 12.97119140625, 13.5390625, 14.10693359375, 14.6748046875, 15.24267578125, 15.810546875, 16.37841796875, 16.9462890625, 17.51416015625, 18.08203125, 18.64990234375, 19.2177734375, 19.78564453125, 20.353515625, 20.92138671875, 21.4892578125, 22.05712890625, 22.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 12.0, 12.0, 9.0, 14.0, 5.0, 17.0, 18.0, 23.0, 26.0, 21.0, 35.0, 31.0, 25.0, 43.0, 43.0, 45.0, 46.0, 42.0, 44.0, 49.0, 38.0, 46.0, 42.0, 41.0, 30.0, 41.0, 25.0, 21.0, 28.0, 24.0, 13.0, 18.0, 14.0, 19.0, 10.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.984375, -14.5062255859375, -14.028076171875, -13.5499267578125, -13.07177734375, -12.5936279296875, -12.115478515625, -11.6373291015625, -11.1591796875, -10.6810302734375, -10.202880859375, -9.7247314453125, -9.24658203125, -8.7684326171875, -8.290283203125, -7.8121337890625, -7.333984375, -6.8558349609375, -6.377685546875, -5.8995361328125, -5.42138671875, -4.9432373046875, -4.465087890625, -3.9869384765625, -3.5087890625, -3.0306396484375, -2.552490234375, -2.0743408203125, -1.59619140625, -1.1180419921875, -0.639892578125, -0.1617431640625, 0.31640625, 0.7945556640625, 1.272705078125, 1.7508544921875, 2.22900390625, 2.7071533203125, 3.185302734375, 3.6634521484375, 4.1416015625, 4.6197509765625, 5.097900390625, 5.5760498046875, 6.05419921875, 6.5323486328125, 7.010498046875, 7.4886474609375, 7.966796875, 8.4449462890625, 8.923095703125, 9.4012451171875, 9.87939453125, 10.3575439453125, 10.835693359375, 11.3138427734375, 11.7919921875, 12.2701416015625, 12.748291015625, 13.2264404296875, 13.70458984375, 14.1827392578125, 14.660888671875, 15.1390380859375, 15.6171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 15.0, 38.0, 56.0, 89.0, 229.0, 534.0, 1692.0, 7976.0, 96468.0, 820399.0, 109645.0, 8599.0, 1847.0, 548.0, 204.0, 106.0, 40.0, 27.0, 13.0, 8.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.38128662109375, -5.0555419921875, -4.72979736328125, -4.404052734375, -4.07830810546875, -3.7525634765625, -3.42681884765625, -3.10107421875, -2.77532958984375, -2.4495849609375, -2.12384033203125, -1.798095703125, -1.47235107421875, -1.1466064453125, -0.82086181640625, -0.4951171875, -0.16937255859375, 0.1563720703125, 0.48211669921875, 0.807861328125, 1.13360595703125, 1.4593505859375, 1.78509521484375, 2.11083984375, 2.43658447265625, 2.7623291015625, 3.08807373046875, 3.413818359375, 3.73956298828125, 4.0653076171875, 4.39105224609375, 4.716796875, 5.04254150390625, 5.3682861328125, 5.69403076171875, 6.019775390625, 6.34552001953125, 6.6712646484375, 6.99700927734375, 7.32275390625, 7.64849853515625, 7.9742431640625, 8.29998779296875, 8.625732421875, 8.95147705078125, 9.2772216796875, 9.60296630859375, 9.9287109375, 10.25445556640625, 10.5802001953125, 10.90594482421875, 11.231689453125, 11.55743408203125, 11.8831787109375, 12.20892333984375, 12.53466796875, 12.86041259765625, 13.1861572265625, 13.51190185546875, 13.837646484375, 14.16339111328125, 14.4891357421875, 14.81488037109375, 15.140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 9.0, 11.0, 12.0, 16.0, 23.0, 22.0, 30.0, 43.0, 57.0, 78.0, 78.0, 102.0, 97.0, 71.0, 81.0, 64.0, 42.0, 40.0, 24.0, 15.0, 20.0, 11.0, 13.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012674331665039062, -0.001230284571647644, -0.0011931359767913818, -0.0011559873819351196, -0.0011188387870788574, -0.0010816901922225952, -0.001044541597366333, -0.0010073930025100708, -0.0009702444076538086, -0.0009330958127975464, -0.0008959472179412842, -0.000858798623085022, -0.0008216500282287598, -0.0007845014333724976, -0.0007473528385162354, -0.0007102042436599731, -0.0006730556488037109, -0.0006359070539474487, -0.0005987584590911865, -0.0005616098642349243, -0.0005244612693786621, -0.0004873126745223999, -0.0004501640796661377, -0.0004130154848098755, -0.0003758668899536133, -0.0003387182950973511, -0.00030156970024108887, -0.00026442110538482666, -0.00022727251052856445, -0.00019012391567230225, -0.00015297532081604004, -0.00011582672595977783, -7.867813110351562e-05, -4.152953624725342e-05, -4.380941390991211e-06, 3.2767653465270996e-05, 6.99162483215332e-05, 0.00010706484317779541, 0.00014421343803405762, 0.00018136203289031982, 0.00021851062774658203, 0.00025565922260284424, 0.00029280781745910645, 0.00032995641231536865, 0.00036710500717163086, 0.00040425360202789307, 0.0004414021968841553, 0.0004785507917404175, 0.0005156993865966797, 0.0005528479814529419, 0.0005899965763092041, 0.0006271451711654663, 0.0006642937660217285, 0.0007014423608779907, 0.0007385909557342529, 0.0007757395505905151, 0.0008128881454467773, 0.0008500367403030396, 0.0008871853351593018, 0.000924333930015564, 0.0009614825248718262, 0.0009986311197280884, 0.0010357797145843506, 0.0010729283094406128, 0.001110076904296875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 10.0, 22.0, 38.0, 51.0, 51.0, 87.0, 174.0, 305.0, 632.0, 1421.0, 3936.0, 17931.0, 179036.0, 714060.0, 112421.0, 12802.0, 3202.0, 1184.0, 579.0, 245.0, 145.0, 64.0, 56.0, 29.0, 14.0, 11.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8284912109375, -7.571044921875, -7.3135986328125, -7.05615234375, -6.7987060546875, -6.541259765625, -6.2838134765625, -6.0263671875, -5.7689208984375, -5.511474609375, -5.2540283203125, -4.99658203125, -4.7391357421875, -4.481689453125, -4.2242431640625, -3.966796875, -3.7093505859375, -3.451904296875, -3.1944580078125, -2.93701171875, -2.6795654296875, -2.422119140625, -2.1646728515625, -1.9072265625, -1.6497802734375, -1.392333984375, -1.1348876953125, -0.87744140625, -0.6199951171875, -0.362548828125, -0.1051025390625, 0.15234375, 0.4097900390625, 0.667236328125, 0.9246826171875, 1.18212890625, 1.4395751953125, 1.697021484375, 1.9544677734375, 2.2119140625, 2.4693603515625, 2.726806640625, 2.9842529296875, 3.24169921875, 3.4991455078125, 3.756591796875, 4.0140380859375, 4.271484375, 4.5289306640625, 4.786376953125, 5.0438232421875, 5.30126953125, 5.5587158203125, 5.816162109375, 6.0736083984375, 6.3310546875, 6.5885009765625, 6.845947265625, 7.1033935546875, 7.36083984375, 7.6182861328125, 7.875732421875, 8.1331787109375, 8.390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 9.0, 12.0, 26.0, 49.0, 63.0, 115.0, 147.0, 173.0, 143.0, 109.0, 51.0, 49.0, 26.0, 18.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.35565185546875, -7.0277099609375, -6.69976806640625, -6.371826171875, -6.04388427734375, -5.7159423828125, -5.38800048828125, -5.06005859375, -4.73211669921875, -4.4041748046875, -4.07623291015625, -3.748291015625, -3.42034912109375, -3.0924072265625, -2.76446533203125, -2.4365234375, -2.10858154296875, -1.7806396484375, -1.45269775390625, -1.124755859375, -0.79681396484375, -0.4688720703125, -0.14093017578125, 0.18701171875, 0.51495361328125, 0.8428955078125, 1.17083740234375, 1.498779296875, 1.82672119140625, 2.1546630859375, 2.48260498046875, 2.810546875, 3.13848876953125, 3.4664306640625, 3.79437255859375, 4.122314453125, 4.45025634765625, 4.7781982421875, 5.10614013671875, 5.43408203125, 5.76202392578125, 6.0899658203125, 6.41790771484375, 6.745849609375, 7.07379150390625, 7.4017333984375, 7.72967529296875, 8.0576171875, 8.38555908203125, 8.7135009765625, 9.04144287109375, 9.369384765625, 9.69732666015625, 10.0252685546875, 10.35321044921875, 10.68115234375, 11.00909423828125, 11.3370361328125, 11.66497802734375, 11.992919921875, 12.32086181640625, 12.6488037109375, 12.97674560546875, 13.3046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 10.0, 14.0, 31.0, 52.0, 58.0, 79.0, 86.0, 118.0, 92.0, 107.0, 109.0, 78.0, 61.0, 45.0, 23.0, 15.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-124.03025817871094, -121.30207061767578, -118.57388305664062, -115.84569549560547, -113.11750793457031, -110.38931274414062, -107.66112518310547, -104.93293762207031, -102.20475006103516, -99.4765625, -96.74837493896484, -94.02018737792969, -91.2919921875, -88.56380462646484, -85.83561706542969, -83.10742950439453, -80.37924194335938, -77.65105438232422, -74.92286682128906, -72.1946792602539, -69.46649169921875, -66.73829650878906, -64.0101089477539, -61.28192138671875, -58.553733825683594, -55.82554626464844, -53.09735870361328, -50.36916732788086, -47.6409797668457, -44.91279220581055, -42.184600830078125, -39.45641326904297, -36.72822570800781, -34.000038146972656, -31.271848678588867, -28.543659210205078, -25.815471649169922, -23.087284088134766, -20.359094619750977, -17.630905151367188, -14.902717590332031, -12.174529075622559, -9.446340560913086, -6.718152046203613, -3.9899635314941406, -1.261775016784668, 1.4664134979248047, 4.194602966308594, 6.92279052734375, 9.650979042053223, 12.379167556762695, 15.107356071472168, 17.83554458618164, 20.563732147216797, 23.291921615600586, 26.020111083984375, 28.74829864501953, 31.476486206054688, 34.204673767089844, 36.932865142822266, 39.66105270385742, 42.38924026489258, 45.117431640625, 47.845619201660156, 50.57380676269531]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 7.0, 12.0, 10.0, 14.0, 25.0, 24.0, 18.0, 21.0, 19.0, 29.0, 46.0, 47.0, 39.0, 38.0, 53.0, 42.0, 58.0, 56.0, 46.0, 35.0, 53.0, 41.0, 39.0, 36.0, 27.0, 22.0, 25.0, 28.0, 20.0, 17.0, 6.0, 5.0, 5.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-80.1348876953125, -77.80195617675781, -75.46902465820312, -73.1360855102539, -70.80315399169922, -68.47022247314453, -66.13728332519531, -63.804351806640625, -61.47142028808594, -59.13848876953125, -56.8055534362793, -54.472618103027344, -52.139686584472656, -49.80675506591797, -47.473819732666016, -45.14088439941406, -42.807952880859375, -40.47502136230469, -38.142086029052734, -35.80915069580078, -33.476219177246094, -31.143285751342773, -28.810352325439453, -26.477418899536133, -24.144485473632812, -21.811552047729492, -19.478618621826172, -17.14568519592285, -14.812751770019531, -12.479818344116211, -10.14688491821289, -7.81395149230957, -5.481010437011719, -3.1480770111083984, -0.8151435852050781, 1.5177898406982422, 3.8507232666015625, 6.183656692504883, 8.516590118408203, 10.849523544311523, 13.182456970214844, 15.515390396118164, 17.848323822021484, 20.181257247924805, 22.514190673828125, 24.847124099731445, 27.180057525634766, 29.512990951538086, 31.845924377441406, 34.178855895996094, 36.51179122924805, 38.8447265625, 41.17765808105469, 43.510589599609375, 45.84352493286133, 48.17646026611328, 50.50939178466797, 52.842323303222656, 55.17525863647461, 57.50819396972656, 59.84112548828125, 62.17405700683594, 64.50698852539062, 66.83992767333984, 69.17285919189453]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 15.0, 14.0, 16.0, 32.0, 38.0, 34.0, 62.0, 80.0, 140.0, 204.0, 312.0, 448.0, 798.0, 1399.0, 2785.0, 6549.0, 21852.0, 3688724.0, 438214.0, 20078.0, 6324.0, 2675.0, 1340.0, 749.0, 447.0, 261.0, 210.0, 161.0, 77.0, 74.0, 41.0, 34.0, 24.0, 15.0, 15.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-16.5625, -16.074951171875, -15.58740234375, -15.099853515625, -14.6123046875, -14.124755859375, -13.63720703125, -13.149658203125, -12.662109375, -12.174560546875, -11.68701171875, -11.199462890625, -10.7119140625, -10.224365234375, -9.73681640625, -9.249267578125, -8.76171875, -8.274169921875, -7.78662109375, -7.299072265625, -6.8115234375, -6.323974609375, -5.83642578125, -5.348876953125, -4.861328125, -4.373779296875, -3.88623046875, -3.398681640625, -2.9111328125, -2.423583984375, -1.93603515625, -1.448486328125, -0.9609375, -0.473388671875, 0.01416015625, 0.501708984375, 0.9892578125, 1.476806640625, 1.96435546875, 2.451904296875, 2.939453125, 3.427001953125, 3.91455078125, 4.402099609375, 4.8896484375, 5.377197265625, 5.86474609375, 6.352294921875, 6.83984375, 7.327392578125, 7.81494140625, 8.302490234375, 8.7900390625, 9.277587890625, 9.76513671875, 10.252685546875, 10.740234375, 11.227783203125, 11.71533203125, 12.202880859375, 12.6904296875, 13.177978515625, 13.66552734375, 14.153076171875, 14.640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 11.0, 13.0, 15.0, 17.0, 13.0, 31.0, 28.0, 29.0, 50.0, 52.0, 49.0, 50.0, 60.0, 60.0, 55.0, 48.0, 68.0, 59.0, 45.0, 40.0, 37.0, 32.0, 35.0, 10.0, 18.0, 14.0, 7.0, 12.0, 4.0, 6.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0], "bins": [-4.58984375, -4.466400146484375, -4.34295654296875, -4.219512939453125, -4.0960693359375, -3.972625732421875, -3.84918212890625, -3.725738525390625, -3.602294921875, -3.478851318359375, -3.35540771484375, -3.231964111328125, -3.1085205078125, -2.985076904296875, -2.86163330078125, -2.738189697265625, -2.61474609375, -2.491302490234375, -2.36785888671875, -2.244415283203125, -2.1209716796875, -1.997528076171875, -1.87408447265625, -1.750640869140625, -1.627197265625, -1.503753662109375, -1.38031005859375, -1.256866455078125, -1.1334228515625, -1.009979248046875, -0.88653564453125, -0.763092041015625, -0.6396484375, -0.516204833984375, -0.39276123046875, -0.269317626953125, -0.1458740234375, -0.022430419921875, 0.10101318359375, 0.224456787109375, 0.347900390625, 0.471343994140625, 0.59478759765625, 0.718231201171875, 0.8416748046875, 0.965118408203125, 1.08856201171875, 1.212005615234375, 1.33544921875, 1.458892822265625, 1.58233642578125, 1.705780029296875, 1.8292236328125, 1.952667236328125, 2.07611083984375, 2.199554443359375, 2.322998046875, 2.446441650390625, 2.56988525390625, 2.693328857421875, 2.8167724609375, 2.940216064453125, 3.06365966796875, 3.187103271484375, 3.310546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 18.0, 23.0, 16.0, 25.0, 26.0, 55.0, 68.0, 150.0, 275.0, 609.0, 1385.0, 4027.0, 16449.0, 3923365.0, 230449.0, 11822.0, 3273.0, 1136.0, 529.0, 223.0, 126.0, 57.0, 36.0, 30.0, 26.0, 19.0, 15.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.03125, -28.199462890625, -27.36767578125, -26.535888671875, -25.7041015625, -24.872314453125, -24.04052734375, -23.208740234375, -22.376953125, -21.545166015625, -20.71337890625, -19.881591796875, -19.0498046875, -18.218017578125, -17.38623046875, -16.554443359375, -15.72265625, -14.890869140625, -14.05908203125, -13.227294921875, -12.3955078125, -11.563720703125, -10.73193359375, -9.900146484375, -9.068359375, -8.236572265625, -7.40478515625, -6.572998046875, -5.7412109375, -4.909423828125, -4.07763671875, -3.245849609375, -2.4140625, -1.582275390625, -0.75048828125, 0.081298828125, 0.9130859375, 1.744873046875, 2.57666015625, 3.408447265625, 4.240234375, 5.072021484375, 5.90380859375, 6.735595703125, 7.5673828125, 8.399169921875, 9.23095703125, 10.062744140625, 10.89453125, 11.726318359375, 12.55810546875, 13.389892578125, 14.2216796875, 15.053466796875, 15.88525390625, 16.717041015625, 17.548828125, 18.380615234375, 19.21240234375, 20.044189453125, 20.8759765625, 21.707763671875, 22.53955078125, 23.371337890625, 24.203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 23.0, 41.0, 117.0, 3267.0, 450.0, 82.0, 25.0, 15.0, 11.0, 5.0, 4.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.13287353515625, -6.9805908203125, -6.82830810546875, -6.676025390625, -6.52374267578125, -6.3714599609375, -6.21917724609375, -6.06689453125, -5.91461181640625, -5.7623291015625, -5.61004638671875, -5.457763671875, -5.30548095703125, -5.1531982421875, -5.00091552734375, -4.8486328125, -4.69635009765625, -4.5440673828125, -4.39178466796875, -4.239501953125, -4.08721923828125, -3.9349365234375, -3.78265380859375, -3.63037109375, -3.47808837890625, -3.3258056640625, -3.17352294921875, -3.021240234375, -2.86895751953125, -2.7166748046875, -2.56439208984375, -2.412109375, -2.25982666015625, -2.1075439453125, -1.95526123046875, -1.802978515625, -1.65069580078125, -1.4984130859375, -1.34613037109375, -1.19384765625, -1.04156494140625, -0.8892822265625, -0.73699951171875, -0.584716796875, -0.43243408203125, -0.2801513671875, -0.12786865234375, 0.0244140625, 0.17669677734375, 0.3289794921875, 0.48126220703125, 0.633544921875, 0.78582763671875, 0.9381103515625, 1.09039306640625, 1.24267578125, 1.39495849609375, 1.5472412109375, 1.69952392578125, 1.851806640625, 2.00408935546875, 2.1563720703125, 2.30865478515625, 2.4609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 11.0, 12.0, 26.0, 67.0, 121.0, 169.0, 151.0, 194.0, 113.0, 71.0, 30.0, 15.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71933364868164, -19.006885528564453, -18.294437408447266, -17.581987380981445, -16.869539260864258, -16.15709114074707, -15.444642066955566, -14.732192993164062, -14.019744873046875, -13.307296752929688, -12.594847679138184, -11.88239860534668, -11.169950485229492, -10.457502365112305, -9.7450532913208, -9.032604217529297, -8.32015609741211, -7.607707500457764, -6.895258903503418, -6.182810306549072, -5.470361709594727, -4.757913112640381, -4.045464515686035, -3.3330159187316895, -2.6205673217773438, -1.908118724822998, -1.1956701278686523, -0.48322153091430664, 0.22922706604003906, 0.9416756629943848, 1.6541242599487305, 2.366572856903076, 3.079021453857422, 3.7914700508117676, 4.503918647766113, 5.216367244720459, 5.928815841674805, 6.64126443862915, 7.353713035583496, 8.066162109375, 8.778610229492188, 9.491058349609375, 10.203507423400879, 10.915956497192383, 11.62840461730957, 12.340852737426758, 13.053301811218262, 13.765750885009766, 14.478199005126953, 15.19064712524414, 15.903096199035645, 16.61554527282715, 17.327993392944336, 18.040441513061523, 18.752891540527344, 19.46533966064453, 20.17778778076172, 20.890235900878906, 21.602684020996094, 22.315134048461914, 23.0275821685791, 23.74003028869629, 24.45248031616211, 25.164928436279297, 25.877376556396484]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 3.0, 10.0, 16.0, 17.0, 14.0, 18.0, 17.0, 20.0, 15.0, 28.0, 24.0, 38.0, 32.0, 28.0, 42.0, 37.0, 28.0, 32.0, 42.0, 29.0, 48.0, 30.0, 29.0, 31.0, 31.0, 22.0, 26.0, 38.0, 31.0, 35.0, 27.0, 18.0, 23.0, 17.0, 9.0, 12.0, 8.0, 21.0, 8.0, 9.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.202105522155762, -6.00049352645874, -5.798881530761719, -5.597269058227539, -5.395657062530518, -5.194045066833496, -4.992432594299316, -4.790820598602295, -4.589208602905273, -4.387596607208252, -4.1859846115112305, -3.984372138977051, -3.7827601432800293, -3.581148147583008, -3.3795359134674072, -3.1779236793518066, -2.976311683654785, -2.7746996879577637, -2.573087453842163, -2.3714752197265625, -2.169863224029541, -1.96825110912323, -1.766638994216919, -1.565026879310608, -1.3634147644042969, -1.1618026494979858, -0.9601905345916748, -0.7585784196853638, -0.5569663047790527, -0.3553541898727417, -0.15374207496643066, 0.04787003993988037, 0.2494821548461914, 0.45109426975250244, 0.6527063846588135, 0.8543184995651245, 1.0559306144714355, 1.2575427293777466, 1.4591548442840576, 1.6607669591903687, 1.8623790740966797, 2.063991069793701, 2.2656033039093018, 2.4672155380249023, 2.668827533721924, 2.8704395294189453, 3.072051763534546, 3.2736639976501465, 3.475275993347168, 3.6768879890441895, 3.87850022315979, 4.080112457275391, 4.281724452972412, 4.483336448669434, 4.684948921203613, 4.886560916900635, 5.088172912597656, 5.289784908294678, 5.491396903991699, 5.693009376525879, 5.8946213722229, 6.096233367919922, 6.297845840454102, 6.499457836151123, 6.7010698318481445]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 18.0, 33.0, 41.0, 66.0, 98.0, 140.0, 223.0, 320.0, 537.0, 834.0, 1355.0, 2097.0, 3529.0, 6082.0, 10424.0, 18977.0, 36379.0, 70949.0, 142106.0, 252501.0, 236495.0, 127420.0, 63991.0, 32832.0, 17200.0, 9523.0, 5608.0, 3301.0, 1970.0, 1216.0, 769.0, 522.0, 318.0, 212.0, 152.0, 105.0, 58.0, 37.0, 26.0, 19.0, 8.0, 8.0, 4.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0], "bins": [-5.578125, -5.41839599609375, -5.2586669921875, -5.09893798828125, -4.939208984375, -4.77947998046875, -4.6197509765625, -4.46002197265625, -4.30029296875, -4.14056396484375, -3.9808349609375, -3.82110595703125, -3.661376953125, -3.50164794921875, -3.3419189453125, -3.18218994140625, -3.0224609375, -2.86273193359375, -2.7030029296875, -2.54327392578125, -2.383544921875, -2.22381591796875, -2.0640869140625, -1.90435791015625, -1.74462890625, -1.58489990234375, -1.4251708984375, -1.26544189453125, -1.105712890625, -0.94598388671875, -0.7862548828125, -0.62652587890625, -0.466796875, -0.30706787109375, -0.1473388671875, 0.01239013671875, 0.172119140625, 0.33184814453125, 0.4915771484375, 0.65130615234375, 0.81103515625, 0.97076416015625, 1.1304931640625, 1.29022216796875, 1.449951171875, 1.60968017578125, 1.7694091796875, 1.92913818359375, 2.0888671875, 2.24859619140625, 2.4083251953125, 2.56805419921875, 2.727783203125, 2.88751220703125, 3.0472412109375, 3.20697021484375, 3.36669921875, 3.52642822265625, 3.6861572265625, 3.84588623046875, 4.005615234375, 4.16534423828125, 4.3250732421875, 4.48480224609375, 4.64453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 5.0, 8.0, 6.0, 18.0, 17.0, 14.0, 26.0, 26.0, 29.0, 42.0, 39.0, 64.0, 50.0, 62.0, 56.0, 44.0, 66.0, 57.0, 45.0, 59.0, 39.0, 37.0, 25.0, 32.0, 26.0, 14.0, 19.0, 14.0, 9.0, 16.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.833984375, -3.705230712890625, -3.57647705078125, -3.447723388671875, -3.3189697265625, -3.190216064453125, -3.06146240234375, -2.932708740234375, -2.803955078125, -2.675201416015625, -2.54644775390625, -2.417694091796875, -2.2889404296875, -2.160186767578125, -2.03143310546875, -1.902679443359375, -1.77392578125, -1.645172119140625, -1.51641845703125, -1.387664794921875, -1.2589111328125, -1.130157470703125, -1.00140380859375, -0.872650146484375, -0.743896484375, -0.615142822265625, -0.48638916015625, -0.357635498046875, -0.2288818359375, -0.100128173828125, 0.02862548828125, 0.157379150390625, 0.2861328125, 0.414886474609375, 0.54364013671875, 0.672393798828125, 0.8011474609375, 0.929901123046875, 1.05865478515625, 1.187408447265625, 1.316162109375, 1.444915771484375, 1.57366943359375, 1.702423095703125, 1.8311767578125, 1.959930419921875, 2.08868408203125, 2.217437744140625, 2.34619140625, 2.474945068359375, 2.60369873046875, 2.732452392578125, 2.8612060546875, 2.989959716796875, 3.11871337890625, 3.247467041015625, 3.376220703125, 3.504974365234375, 3.63372802734375, 3.762481689453125, 3.8912353515625, 4.019989013671875, 4.14874267578125, 4.277496337890625, 4.40625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 12.0, 6.0, 15.0, 20.0, 16.0, 31.0, 51.0, 60.0, 82.0, 121.0, 188.0, 272.0, 396.0, 629.0, 1001.0, 2209.0, 6305.0, 32233.0, 339839.0, 597207.0, 52756.0, 8992.0, 2770.0, 1250.0, 667.0, 417.0, 331.0, 182.0, 139.0, 97.0, 70.0, 59.0, 26.0, 24.0, 16.0, 22.0, 10.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.26171875, -13.84375, -13.42578125, -13.0078125, -12.58984375, -12.171875, -11.75390625, -11.3359375, -10.91796875, -10.5, -10.08203125, -9.6640625, -9.24609375, -8.828125, -8.41015625, -7.9921875, -7.57421875, -7.15625, -6.73828125, -6.3203125, -5.90234375, -5.484375, -5.06640625, -4.6484375, -4.23046875, -3.8125, -3.39453125, -2.9765625, -2.55859375, -2.140625, -1.72265625, -1.3046875, -0.88671875, -0.46875, -0.05078125, 0.3671875, 0.78515625, 1.203125, 1.62109375, 2.0390625, 2.45703125, 2.875, 3.29296875, 3.7109375, 4.12890625, 4.546875, 4.96484375, 5.3828125, 5.80078125, 6.21875, 6.63671875, 7.0546875, 7.47265625, 7.890625, 8.30859375, 8.7265625, 9.14453125, 9.5625, 9.98046875, 10.3984375, 10.81640625, 11.234375, 11.65234375, 12.0703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 4.0, 11.0, 13.0, 14.0, 28.0, 21.0, 11.0, 38.0, 26.0, 35.0, 43.0, 37.0, 53.0, 34.0, 61.0, 45.0, 61.0, 58.0, 48.0, 44.0, 49.0, 44.0, 38.0, 36.0, 23.0, 24.0, 14.0, 22.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.484375, -20.912109375, -20.33984375, -19.767578125, -19.1953125, -18.623046875, -18.05078125, -17.478515625, -16.90625, -16.333984375, -15.76171875, -15.189453125, -14.6171875, -14.044921875, -13.47265625, -12.900390625, -12.328125, -11.755859375, -11.18359375, -10.611328125, -10.0390625, -9.466796875, -8.89453125, -8.322265625, -7.75, -7.177734375, -6.60546875, -6.033203125, -5.4609375, -4.888671875, -4.31640625, -3.744140625, -3.171875, -2.599609375, -2.02734375, -1.455078125, -0.8828125, -0.310546875, 0.26171875, 0.833984375, 1.40625, 1.978515625, 2.55078125, 3.123046875, 3.6953125, 4.267578125, 4.83984375, 5.412109375, 5.984375, 6.556640625, 7.12890625, 7.701171875, 8.2734375, 8.845703125, 9.41796875, 9.990234375, 10.5625, 11.134765625, 11.70703125, 12.279296875, 12.8515625, 13.423828125, 13.99609375, 14.568359375, 15.140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 10.0, 10.0, 9.0, 7.0, 15.0, 29.0, 41.0, 64.0, 80.0, 146.0, 220.0, 462.0, 961.0, 2445.0, 8747.0, 53812.0, 642031.0, 302921.0, 27614.0, 5467.0, 1776.0, 744.0, 383.0, 219.0, 118.0, 68.0, 44.0, 31.0, 23.0, 16.0, 10.0, 7.0, 2.0, 7.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.3515625, -6.1234130859375, -5.895263671875, -5.6671142578125, -5.43896484375, -5.2108154296875, -4.982666015625, -4.7545166015625, -4.5263671875, -4.2982177734375, -4.070068359375, -3.8419189453125, -3.61376953125, -3.3856201171875, -3.157470703125, -2.9293212890625, -2.701171875, -2.4730224609375, -2.244873046875, -2.0167236328125, -1.78857421875, -1.5604248046875, -1.332275390625, -1.1041259765625, -0.8759765625, -0.6478271484375, -0.419677734375, -0.1915283203125, 0.03662109375, 0.2647705078125, 0.492919921875, 0.7210693359375, 0.94921875, 1.1773681640625, 1.405517578125, 1.6336669921875, 1.86181640625, 2.0899658203125, 2.318115234375, 2.5462646484375, 2.7744140625, 3.0025634765625, 3.230712890625, 3.4588623046875, 3.68701171875, 3.9151611328125, 4.143310546875, 4.3714599609375, 4.599609375, 4.8277587890625, 5.055908203125, 5.2840576171875, 5.51220703125, 5.7403564453125, 5.968505859375, 6.1966552734375, 6.4248046875, 6.6529541015625, 6.881103515625, 7.1092529296875, 7.33740234375, 7.5655517578125, 7.793701171875, 8.0218505859375, 8.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 11.0, 9.0, 14.0, 15.0, 17.0, 14.0, 17.0, 47.0, 49.0, 80.0, 88.0, 120.0, 117.0, 119.0, 71.0, 60.0, 32.0, 28.0, 25.0, 14.0, 14.0, 8.0, 12.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001056671142578125, -0.0010175108909606934, -0.0009783506393432617, -0.0009391903877258301, -0.0009000301361083984, -0.0008608698844909668, -0.0008217096328735352, -0.0007825493812561035, -0.0007433891296386719, -0.0007042288780212402, -0.0006650686264038086, -0.000625908374786377, -0.0005867481231689453, -0.0005475878715515137, -0.000508427619934082, -0.0004692673683166504, -0.00043010711669921875, -0.0003909468650817871, -0.00035178661346435547, -0.00031262636184692383, -0.0002734661102294922, -0.00023430585861206055, -0.0001951456069946289, -0.00015598535537719727, -0.00011682510375976562, -7.766485214233398e-05, -3.8504600524902344e-05, 6.556510925292969e-07, 3.981590270996094e-05, 7.897615432739258e-05, 0.00011813640594482422, 0.00015729665756225586, 0.0001964569091796875, 0.00023561716079711914, 0.0002747774124145508, 0.0003139376640319824, 0.00035309791564941406, 0.0003922581672668457, 0.00043141841888427734, 0.000470578670501709, 0.0005097389221191406, 0.0005488991737365723, 0.0005880594253540039, 0.0006272196769714355, 0.0006663799285888672, 0.0007055401802062988, 0.0007447004318237305, 0.0007838606834411621, 0.0008230209350585938, 0.0008621811866760254, 0.000901341438293457, 0.0009405016899108887, 0.0009796619415283203, 0.001018822193145752, 0.0010579824447631836, 0.0010971426963806152, 0.0011363029479980469, 0.0011754631996154785, 0.0012146234512329102, 0.0012537837028503418, 0.0012929439544677734, 0.001332104206085205, 0.0013712644577026367, 0.0014104247093200684, 0.0014495849609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 25.0, 50.0, 116.0, 218.0, 530.0, 1420.0, 5430.0, 57688.0, 851369.0, 120531.0, 8123.0, 1815.0, 705.0, 263.0, 137.0, 48.0, 29.0, 15.0, 10.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.65625, -11.3194580078125, -10.982666015625, -10.6458740234375, -10.30908203125, -9.9722900390625, -9.635498046875, -9.2987060546875, -8.9619140625, -8.6251220703125, -8.288330078125, -7.9515380859375, -7.61474609375, -7.2779541015625, -6.941162109375, -6.6043701171875, -6.267578125, -5.9307861328125, -5.593994140625, -5.2572021484375, -4.92041015625, -4.5836181640625, -4.246826171875, -3.9100341796875, -3.5732421875, -3.2364501953125, -2.899658203125, -2.5628662109375, -2.22607421875, -1.8892822265625, -1.552490234375, -1.2156982421875, -0.87890625, -0.5421142578125, -0.205322265625, 0.1314697265625, 0.46826171875, 0.8050537109375, 1.141845703125, 1.4786376953125, 1.8154296875, 2.1522216796875, 2.489013671875, 2.8258056640625, 3.16259765625, 3.4993896484375, 3.836181640625, 4.1729736328125, 4.509765625, 4.8465576171875, 5.183349609375, 5.5201416015625, 5.85693359375, 6.1937255859375, 6.530517578125, 6.8673095703125, 7.2041015625, 7.5408935546875, 7.877685546875, 8.2144775390625, 8.55126953125, 8.8880615234375, 9.224853515625, 9.5616455078125, 9.8984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 11.0, 15.0, 31.0, 22.0, 42.0, 41.0, 44.0, 78.0, 95.0, 112.0, 96.0, 88.0, 78.0, 68.0, 48.0, 42.0, 28.0, 17.0, 9.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.25, -9.035888671875, -8.82177734375, -8.607666015625, -8.3935546875, -8.179443359375, -7.96533203125, -7.751220703125, -7.537109375, -7.322998046875, -7.10888671875, -6.894775390625, -6.6806640625, -6.466552734375, -6.25244140625, -6.038330078125, -5.82421875, -5.610107421875, -5.39599609375, -5.181884765625, -4.9677734375, -4.753662109375, -4.53955078125, -4.325439453125, -4.111328125, -3.897216796875, -3.68310546875, -3.468994140625, -3.2548828125, -3.040771484375, -2.82666015625, -2.612548828125, -2.3984375, -2.184326171875, -1.97021484375, -1.756103515625, -1.5419921875, -1.327880859375, -1.11376953125, -0.899658203125, -0.685546875, -0.471435546875, -0.25732421875, -0.043212890625, 0.1708984375, 0.385009765625, 0.59912109375, 0.813232421875, 1.02734375, 1.241455078125, 1.45556640625, 1.669677734375, 1.8837890625, 2.097900390625, 2.31201171875, 2.526123046875, 2.740234375, 2.954345703125, 3.16845703125, 3.382568359375, 3.5966796875, 3.810791015625, 4.02490234375, 4.239013671875, 4.453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 12.0, 32.0, 70.0, 110.0, 169.0, 196.0, 178.0, 101.0, 72.0, 35.0, 10.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-171.42236328125, -167.47799682617188, -163.53363037109375, -159.58926391601562, -155.6448974609375, -151.70053100585938, -147.75616455078125, -143.81179809570312, -139.867431640625, -135.92306518554688, -131.97869873046875, -128.03433227539062, -124.0899658203125, -120.14559936523438, -116.20123291015625, -112.25686645507812, -108.3125, -104.36813354492188, -100.42376708984375, -96.47940063476562, -92.5350341796875, -88.59066772460938, -84.64630126953125, -80.70193481445312, -76.757568359375, -72.81320190429688, -68.86883544921875, -64.92446899414062, -60.9801025390625, -57.035736083984375, -53.09136962890625, -49.147003173828125, -45.20264434814453, -41.258277893066406, -37.31391143798828, -33.369544982910156, -29.42517852783203, -25.480812072753906, -21.53644561767578, -17.592079162597656, -13.647712707519531, -9.703346252441406, -5.758979797363281, -1.8146133422851562, 2.1297531127929688, 6.074119567871094, 10.018486022949219, 13.962852478027344, 17.90721893310547, 21.851585388183594, 25.79595184326172, 29.740318298339844, 33.68468475341797, 37.629051208496094, 41.57341766357422, 45.517784118652344, 49.46215057373047, 53.406517028808594, 57.35088348388672, 61.295249938964844, 65.23961639404297, 69.1839828491211, 73.12834930419922, 77.07271575927734, 81.01708221435547]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 13.0, 11.0, 14.0, 16.0, 11.0, 14.0, 15.0, 28.0, 28.0, 34.0, 42.0, 48.0, 37.0, 51.0, 44.0, 48.0, 57.0, 51.0, 46.0, 49.0, 44.0, 41.0, 31.0, 30.0, 33.0, 25.0, 22.0, 21.0, 11.0, 19.0, 15.0, 3.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.32884216308594, -78.93712615966797, -76.54541778564453, -74.15370178222656, -71.76199340820312, -69.37027740478516, -66.97856140136719, -64.58685302734375, -62.19513702392578, -59.80342483520508, -57.411712646484375, -55.019996643066406, -52.6282844543457, -50.236572265625, -47.84485626220703, -45.45314407348633, -43.061431884765625, -40.66971969604492, -38.27800750732422, -35.88629150390625, -33.49457931518555, -31.102867126464844, -28.711153030395508, -26.319438934326172, -23.92772674560547, -21.536014556884766, -19.14430046081543, -16.752586364746094, -14.36087417602539, -11.969161033630371, -9.577447891235352, -7.185733795166016, -4.794029235839844, -2.402316093444824, -0.010602951049804688, 2.381110191345215, 4.772823333740234, 7.164536476135254, 9.556249618530273, 11.94796371459961, 14.339675903320312, 16.731388092041016, 19.12310218811035, 21.514816284179688, 23.90652847290039, 26.298240661621094, 28.68995475769043, 31.081668853759766, 33.47338104248047, 35.86509323120117, 38.256805419921875, 40.648521423339844, 43.04023361206055, 45.43194580078125, 47.82366180419922, 50.21537399291992, 52.607086181640625, 54.99879837036133, 57.39051055908203, 59.7822265625, 62.1739387512207, 64.5656509399414, 66.95736694335938, 69.34907531738281, 71.74079132080078]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 11.0, 18.0, 15.0, 25.0, 43.0, 57.0, 64.0, 77.0, 131.0, 161.0, 219.0, 248.0, 436.0, 662.0, 1032.0, 1596.0, 2778.0, 5024.0, 10009.0, 24339.0, 87721.0, 3607874.0, 368110.0, 49041.0, 16784.0, 7412.0, 3917.0, 2294.0, 1345.0, 893.0, 547.0, 417.0, 265.0, 155.0, 135.0, 99.0, 69.0, 63.0, 53.0, 31.0, 23.0, 16.0, 17.0, 9.0, 9.0, 10.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-8.2421875, -7.9830322265625, -7.723876953125, -7.4647216796875, -7.20556640625, -6.9464111328125, -6.687255859375, -6.4281005859375, -6.1689453125, -5.9097900390625, -5.650634765625, -5.3914794921875, -5.13232421875, -4.8731689453125, -4.614013671875, -4.3548583984375, -4.095703125, -3.8365478515625, -3.577392578125, -3.3182373046875, -3.05908203125, -2.7999267578125, -2.540771484375, -2.2816162109375, -2.0224609375, -1.7633056640625, -1.504150390625, -1.2449951171875, -0.98583984375, -0.7266845703125, -0.467529296875, -0.2083740234375, 0.05078125, 0.3099365234375, 0.569091796875, 0.8282470703125, 1.08740234375, 1.3465576171875, 1.605712890625, 1.8648681640625, 2.1240234375, 2.3831787109375, 2.642333984375, 2.9014892578125, 3.16064453125, 3.4197998046875, 3.678955078125, 3.9381103515625, 4.197265625, 4.4564208984375, 4.715576171875, 4.9747314453125, 5.23388671875, 5.4930419921875, 5.752197265625, 6.0113525390625, 6.2705078125, 6.5296630859375, 6.788818359375, 7.0479736328125, 7.30712890625, 7.5662841796875, 7.825439453125, 8.0845947265625, 8.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 11.0, 7.0, 11.0, 16.0, 30.0, 21.0, 17.0, 36.0, 48.0, 52.0, 56.0, 58.0, 64.0, 63.0, 60.0, 64.0, 65.0, 47.0, 41.0, 37.0, 39.0, 32.0, 23.0, 20.0, 18.0, 14.0, 16.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.341400146484375, -4.21014404296875, -4.078887939453125, -3.9476318359375, -3.816375732421875, -3.68511962890625, -3.553863525390625, -3.422607421875, -3.291351318359375, -3.16009521484375, -3.028839111328125, -2.8975830078125, -2.766326904296875, -2.63507080078125, -2.503814697265625, -2.37255859375, -2.241302490234375, -2.11004638671875, -1.978790283203125, -1.8475341796875, -1.716278076171875, -1.58502197265625, -1.453765869140625, -1.322509765625, -1.191253662109375, -1.05999755859375, -0.928741455078125, -0.7974853515625, -0.666229248046875, -0.53497314453125, -0.403717041015625, -0.2724609375, -0.141204833984375, -0.00994873046875, 0.121307373046875, 0.2525634765625, 0.383819580078125, 0.51507568359375, 0.646331787109375, 0.777587890625, 0.908843994140625, 1.04010009765625, 1.171356201171875, 1.3026123046875, 1.433868408203125, 1.56512451171875, 1.696380615234375, 1.82763671875, 1.958892822265625, 2.09014892578125, 2.221405029296875, 2.3526611328125, 2.483917236328125, 2.61517333984375, 2.746429443359375, 2.877685546875, 3.008941650390625, 3.14019775390625, 3.271453857421875, 3.4027099609375, 3.533966064453125, 3.66522216796875, 3.796478271484375, 3.927734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 7.0, 15.0, 27.0, 45.0, 39.0, 91.0, 125.0, 212.0, 387.0, 648.0, 1127.0, 2128.0, 4279.0, 9531.0, 27740.0, 145922.0, 3759618.0, 189727.0, 31856.0, 10734.0, 4694.0, 2342.0, 1237.0, 667.0, 393.0, 214.0, 158.0, 103.0, 84.0, 40.0, 32.0, 24.0, 9.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.4576416015625, -10.126220703125, -9.7947998046875, -9.46337890625, -9.1319580078125, -8.800537109375, -8.4691162109375, -8.1376953125, -7.8062744140625, -7.474853515625, -7.1434326171875, -6.81201171875, -6.4805908203125, -6.149169921875, -5.8177490234375, -5.486328125, -5.1549072265625, -4.823486328125, -4.4920654296875, -4.16064453125, -3.8292236328125, -3.497802734375, -3.1663818359375, -2.8349609375, -2.5035400390625, -2.172119140625, -1.8406982421875, -1.50927734375, -1.1778564453125, -0.846435546875, -0.5150146484375, -0.18359375, 0.1478271484375, 0.479248046875, 0.8106689453125, 1.14208984375, 1.4735107421875, 1.804931640625, 2.1363525390625, 2.4677734375, 2.7991943359375, 3.130615234375, 3.4620361328125, 3.79345703125, 4.1248779296875, 4.456298828125, 4.7877197265625, 5.119140625, 5.4505615234375, 5.781982421875, 6.1134033203125, 6.44482421875, 6.7762451171875, 7.107666015625, 7.4390869140625, 7.7705078125, 8.1019287109375, 8.433349609375, 8.7647705078125, 9.09619140625, 9.4276123046875, 9.759033203125, 10.0904541015625, 10.421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 18.0, 13.0, 27.0, 45.0, 63.0, 140.0, 305.0, 2079.0, 864.0, 192.0, 85.0, 63.0, 42.0, 21.0, 10.0, 17.0, 14.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.1439208984375, -3.006591796875, -2.8692626953125, -2.73193359375, -2.5946044921875, -2.457275390625, -2.3199462890625, -2.1826171875, -2.0452880859375, -1.907958984375, -1.7706298828125, -1.63330078125, -1.4959716796875, -1.358642578125, -1.2213134765625, -1.083984375, -0.9466552734375, -0.809326171875, -0.6719970703125, -0.53466796875, -0.3973388671875, -0.260009765625, -0.1226806640625, 0.0146484375, 0.1519775390625, 0.289306640625, 0.4266357421875, 0.56396484375, 0.7012939453125, 0.838623046875, 0.9759521484375, 1.11328125, 1.2506103515625, 1.387939453125, 1.5252685546875, 1.66259765625, 1.7999267578125, 1.937255859375, 2.0745849609375, 2.2119140625, 2.3492431640625, 2.486572265625, 2.6239013671875, 2.76123046875, 2.8985595703125, 3.035888671875, 3.1732177734375, 3.310546875, 3.4478759765625, 3.585205078125, 3.7225341796875, 3.85986328125, 3.9971923828125, 4.134521484375, 4.2718505859375, 4.4091796875, 4.5465087890625, 4.683837890625, 4.8211669921875, 4.95849609375, 5.0958251953125, 5.233154296875, 5.3704833984375, 5.5078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 13.0, 17.0, 22.0, 41.0, 60.0, 87.0, 105.0, 121.0, 114.0, 94.0, 78.0, 66.0, 57.0, 35.0, 18.0, 24.0, 19.0, 11.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.327024459838867, -18.627227783203125, -17.927433013916016, -17.227636337280273, -16.527841567993164, -15.828044891357422, -15.128249168395996, -14.42845344543457, -13.728657722473145, -13.028861999511719, -12.329066276550293, -11.629270553588867, -10.929473876953125, -10.229679107666016, -9.529882431030273, -8.830086708068848, -8.130290985107422, -7.430495262145996, -6.73069953918457, -6.030903339385986, -5.3311076164245605, -4.631311893463135, -3.931515693664551, -3.231719970703125, -2.531924247741699, -1.8321284055709839, -1.1323325634002686, -0.43253660202026367, 0.2672591209411621, 0.9670548439025879, 1.6668510437011719, 2.3666467666625977, 3.0664443969726562, 3.766240119934082, 4.466035842895508, 5.165832042694092, 5.865627765655518, 6.565423488616943, 7.265219688415527, 7.965015411376953, 8.664811134338379, 9.364606857299805, 10.06440258026123, 10.764198303222656, 11.463994979858398, 12.163789749145508, 12.86358642578125, 13.563382148742676, 14.263177871704102, 14.962973594665527, 15.662769317626953, 16.362565994262695, 17.062360763549805, 17.762157440185547, 18.461952209472656, 19.1617488861084, 19.86154556274414, 20.561342239379883, 21.261137008666992, 21.960933685302734, 22.660728454589844, 23.360525131225586, 24.060321807861328, 24.760116577148438, 25.459911346435547]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 3.0, 13.0, 6.0, 21.0, 15.0, 19.0, 22.0, 33.0, 21.0, 21.0, 29.0, 38.0, 39.0, 46.0, 45.0, 44.0, 43.0, 45.0, 43.0, 47.0, 49.0, 41.0, 32.0, 36.0, 36.0, 34.0, 19.0, 30.0, 16.0, 14.0, 16.0, 10.0, 14.0, 12.0, 10.0, 7.0, 3.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5743989944458, -12.15159797668457, -11.728796005249023, -11.305994033813477, -10.883193016052246, -10.460391998291016, -10.037590026855469, -9.614788055419922, -9.191987037658691, -8.769186019897461, -8.346384048461914, -7.923582553863525, -7.500781059265137, -7.077979564666748, -6.655178070068359, -6.232376575469971, -5.809575080871582, -5.386773586273193, -4.963972091674805, -4.541170597076416, -4.118369102478027, -3.6955676078796387, -3.27276611328125, -2.8499646186828613, -2.4271631240844727, -2.004361629486084, -1.5815601348876953, -1.1587586402893066, -0.735957145690918, -0.3131556510925293, 0.10964584350585938, 0.532447338104248, 0.9552497863769531, 1.3780512809753418, 1.8008527755737305, 2.223654270172119, 2.646455764770508, 3.0692572593688965, 3.492058753967285, 3.914860248565674, 4.3376617431640625, 4.760463237762451, 5.18326473236084, 5.6060662269592285, 6.028867721557617, 6.451669216156006, 6.8744707107543945, 7.297272205352783, 7.720073699951172, 8.142875671386719, 8.56567668914795, 8.98847770690918, 9.411279678344727, 9.834081649780273, 10.256882667541504, 10.679683685302734, 11.102485656738281, 11.525287628173828, 11.948088645935059, 12.370889663696289, 12.793691635131836, 13.216493606567383, 13.639294624328613, 14.062095642089844, 14.48489761352539]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 16.0, 15.0, 31.0, 26.0, 54.0, 73.0, 94.0, 151.0, 224.0, 337.0, 485.0, 701.0, 1082.0, 1693.0, 2532.0, 4183.0, 6782.0, 11054.0, 18531.0, 30985.0, 53219.0, 96128.0, 184509.0, 267094.0, 162964.0, 85574.0, 48184.0, 27912.0, 16697.0, 9986.0, 6319.0, 3876.0, 2483.0, 1538.0, 1042.0, 677.0, 411.0, 267.0, 201.0, 143.0, 95.0, 57.0, 42.0, 31.0, 31.0, 13.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.27728271484375, -5.1092529296875, -4.94122314453125, -4.773193359375, -4.60516357421875, -4.4371337890625, -4.26910400390625, -4.10107421875, -3.93304443359375, -3.7650146484375, -3.59698486328125, -3.428955078125, -3.26092529296875, -3.0928955078125, -2.92486572265625, -2.7568359375, -2.58880615234375, -2.4207763671875, -2.25274658203125, -2.084716796875, -1.91668701171875, -1.7486572265625, -1.58062744140625, -1.41259765625, -1.24456787109375, -1.0765380859375, -0.90850830078125, -0.740478515625, -0.57244873046875, -0.4044189453125, -0.23638916015625, -0.068359375, 0.09967041015625, 0.2677001953125, 0.43572998046875, 0.603759765625, 0.77178955078125, 0.9398193359375, 1.10784912109375, 1.27587890625, 1.44390869140625, 1.6119384765625, 1.77996826171875, 1.947998046875, 2.11602783203125, 2.2840576171875, 2.45208740234375, 2.6201171875, 2.78814697265625, 2.9561767578125, 3.12420654296875, 3.292236328125, 3.46026611328125, 3.6282958984375, 3.79632568359375, 3.96435546875, 4.13238525390625, 4.3004150390625, 4.46844482421875, 4.636474609375, 4.80450439453125, 4.9725341796875, 5.14056396484375, 5.30859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 6.0, 10.0, 7.0, 22.0, 19.0, 19.0, 16.0, 33.0, 45.0, 37.0, 33.0, 54.0, 43.0, 51.0, 59.0, 47.0, 43.0, 54.0, 45.0, 49.0, 37.0, 42.0, 32.0, 30.0, 29.0, 20.0, 17.0, 16.0, 13.0, 10.0, 8.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.564453125, -3.45159912109375, -3.3387451171875, -3.22589111328125, -3.113037109375, -3.00018310546875, -2.8873291015625, -2.77447509765625, -2.66162109375, -2.54876708984375, -2.4359130859375, -2.32305908203125, -2.210205078125, -2.09735107421875, -1.9844970703125, -1.87164306640625, -1.7587890625, -1.64593505859375, -1.5330810546875, -1.42022705078125, -1.307373046875, -1.19451904296875, -1.0816650390625, -0.96881103515625, -0.85595703125, -0.74310302734375, -0.6302490234375, -0.51739501953125, -0.404541015625, -0.29168701171875, -0.1788330078125, -0.06597900390625, 0.046875, 0.15972900390625, 0.2725830078125, 0.38543701171875, 0.498291015625, 0.61114501953125, 0.7239990234375, 0.83685302734375, 0.94970703125, 1.06256103515625, 1.1754150390625, 1.28826904296875, 1.401123046875, 1.51397705078125, 1.6268310546875, 1.73968505859375, 1.8525390625, 1.96539306640625, 2.0782470703125, 2.19110107421875, 2.303955078125, 2.41680908203125, 2.5296630859375, 2.64251708984375, 2.75537109375, 2.86822509765625, 2.9810791015625, 3.09393310546875, 3.206787109375, 3.31964111328125, 3.4324951171875, 3.54534912109375, 3.658203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 14.0, 15.0, 18.0, 31.0, 37.0, 66.0, 92.0, 133.0, 177.0, 282.0, 426.0, 753.0, 1363.0, 3080.0, 11408.0, 86300.0, 745239.0, 172324.0, 18583.0, 4160.0, 1693.0, 863.0, 480.0, 324.0, 217.0, 155.0, 88.0, 69.0, 46.0, 37.0, 21.0, 13.0, 8.0, 9.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.4375, -15.91796875, -15.3984375, -14.87890625, -14.359375, -13.83984375, -13.3203125, -12.80078125, -12.28125, -11.76171875, -11.2421875, -10.72265625, -10.203125, -9.68359375, -9.1640625, -8.64453125, -8.125, -7.60546875, -7.0859375, -6.56640625, -6.046875, -5.52734375, -5.0078125, -4.48828125, -3.96875, -3.44921875, -2.9296875, -2.41015625, -1.890625, -1.37109375, -0.8515625, -0.33203125, 0.1875, 0.70703125, 1.2265625, 1.74609375, 2.265625, 2.78515625, 3.3046875, 3.82421875, 4.34375, 4.86328125, 5.3828125, 5.90234375, 6.421875, 6.94140625, 7.4609375, 7.98046875, 8.5, 9.01953125, 9.5390625, 10.05859375, 10.578125, 11.09765625, 11.6171875, 12.13671875, 12.65625, 13.17578125, 13.6953125, 14.21484375, 14.734375, 15.25390625, 15.7734375, 16.29296875, 16.8125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 16.0, 11.0, 10.0, 11.0, 16.0, 24.0, 24.0, 25.0, 38.0, 44.0, 45.0, 47.0, 47.0, 44.0, 47.0, 51.0, 34.0, 44.0, 41.0, 43.0, 40.0, 38.0, 34.0, 26.0, 26.0, 26.0, 28.0, 18.0, 14.0, 13.0, 9.0, 12.0, 8.0, 7.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.7109375, -12.286865234375, -11.86279296875, -11.438720703125, -11.0146484375, -10.590576171875, -10.16650390625, -9.742431640625, -9.318359375, -8.894287109375, -8.47021484375, -8.046142578125, -7.6220703125, -7.197998046875, -6.77392578125, -6.349853515625, -5.92578125, -5.501708984375, -5.07763671875, -4.653564453125, -4.2294921875, -3.805419921875, -3.38134765625, -2.957275390625, -2.533203125, -2.109130859375, -1.68505859375, -1.260986328125, -0.8369140625, -0.412841796875, 0.01123046875, 0.435302734375, 0.859375, 1.283447265625, 1.70751953125, 2.131591796875, 2.5556640625, 2.979736328125, 3.40380859375, 3.827880859375, 4.251953125, 4.676025390625, 5.10009765625, 5.524169921875, 5.9482421875, 6.372314453125, 6.79638671875, 7.220458984375, 7.64453125, 8.068603515625, 8.49267578125, 8.916748046875, 9.3408203125, 9.764892578125, 10.18896484375, 10.613037109375, 11.037109375, 11.461181640625, 11.88525390625, 12.309326171875, 12.7333984375, 13.157470703125, 13.58154296875, 14.005615234375, 14.4296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 17.0, 9.0, 32.0, 39.0, 89.0, 133.0, 295.0, 653.0, 1781.0, 5984.0, 33448.0, 366373.0, 580176.0, 48102.0, 7862.0, 2063.0, 772.0, 341.0, 169.0, 90.0, 52.0, 29.0, 17.0, 10.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.46875, -8.26263427734375, -8.0565185546875, -7.85040283203125, -7.644287109375, -7.43817138671875, -7.2320556640625, -7.02593994140625, -6.81982421875, -6.61370849609375, -6.4075927734375, -6.20147705078125, -5.995361328125, -5.78924560546875, -5.5831298828125, -5.37701416015625, -5.1708984375, -4.96478271484375, -4.7586669921875, -4.55255126953125, -4.346435546875, -4.14031982421875, -3.9342041015625, -3.72808837890625, -3.52197265625, -3.31585693359375, -3.1097412109375, -2.90362548828125, -2.697509765625, -2.49139404296875, -2.2852783203125, -2.07916259765625, -1.873046875, -1.66693115234375, -1.4608154296875, -1.25469970703125, -1.048583984375, -0.84246826171875, -0.6363525390625, -0.43023681640625, -0.22412109375, -0.01800537109375, 0.1881103515625, 0.39422607421875, 0.600341796875, 0.80645751953125, 1.0125732421875, 1.21868896484375, 1.4248046875, 1.63092041015625, 1.8370361328125, 2.04315185546875, 2.249267578125, 2.45538330078125, 2.6614990234375, 2.86761474609375, 3.07373046875, 3.27984619140625, 3.4859619140625, 3.69207763671875, 3.898193359375, 4.10430908203125, 4.3104248046875, 4.51654052734375, 4.72265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 16.0, 14.0, 11.0, 13.0, 20.0, 22.0, 25.0, 29.0, 36.0, 41.0, 57.0, 93.0, 101.0, 83.0, 84.0, 54.0, 44.0, 37.0, 31.0, 23.0, 20.0, 19.0, 20.0, 11.0, 17.0, 13.0, 9.0, 7.0, 5.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0009093284606933594, -0.0008789822459220886, -0.0008486360311508179, -0.0008182898163795471, -0.0007879436016082764, -0.0007575973868370056, -0.0007272511720657349, -0.0006969049572944641, -0.0006665587425231934, -0.0006362125277519226, -0.0006058663129806519, -0.0005755200982093811, -0.0005451738834381104, -0.0005148276686668396, -0.00048448145389556885, -0.0004541352391242981, -0.00042378902435302734, -0.0003934428095817566, -0.00036309659481048584, -0.0003327503800392151, -0.00030240416526794434, -0.0002720579504966736, -0.00024171173572540283, -0.00021136552095413208, -0.00018101930618286133, -0.00015067309141159058, -0.00012032687664031982, -8.998066186904907e-05, -5.963444709777832e-05, -2.928823232650757e-05, 1.0579824447631836e-06, 3.1404197216033936e-05, 6.175041198730469e-05, 9.209662675857544e-05, 0.0001224428415298462, 0.00015278905630111694, 0.0001831352710723877, 0.00021348148584365845, 0.0002438277006149292, 0.00027417391538619995, 0.0003045201301574707, 0.00033486634492874146, 0.0003652125597000122, 0.00039555877447128296, 0.0004259049892425537, 0.00045625120401382446, 0.0004865974187850952, 0.000516943633556366, 0.0005472898483276367, 0.0005776360630989075, 0.0006079822778701782, 0.000638328492641449, 0.0006686747074127197, 0.0006990209221839905, 0.0007293671369552612, 0.000759713351726532, 0.0007900595664978027, 0.0008204057812690735, 0.0008507519960403442, 0.000881098210811615, 0.0009114444255828857, 0.0009417906403541565, 0.0009721368551254272, 0.001002483069896698, 0.0010328292846679688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 10.0, 15.0, 24.0, 59.0, 101.0, 206.0, 382.0, 844.0, 2384.0, 10548.0, 134087.0, 823545.0, 66025.0, 7019.0, 1843.0, 720.0, 337.0, 195.0, 86.0, 45.0, 30.0, 11.0, 6.0, 12.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.75567626953125, -6.4996337890625, -6.24359130859375, -5.987548828125, -5.73150634765625, -5.4754638671875, -5.21942138671875, -4.96337890625, -4.70733642578125, -4.4512939453125, -4.19525146484375, -3.939208984375, -3.68316650390625, -3.4271240234375, -3.17108154296875, -2.9150390625, -2.65899658203125, -2.4029541015625, -2.14691162109375, -1.890869140625, -1.63482666015625, -1.3787841796875, -1.12274169921875, -0.86669921875, -0.61065673828125, -0.3546142578125, -0.09857177734375, 0.157470703125, 0.41351318359375, 0.6695556640625, 0.92559814453125, 1.181640625, 1.43768310546875, 1.6937255859375, 1.94976806640625, 2.205810546875, 2.46185302734375, 2.7178955078125, 2.97393798828125, 3.22998046875, 3.48602294921875, 3.7420654296875, 3.99810791015625, 4.254150390625, 4.51019287109375, 4.7662353515625, 5.02227783203125, 5.2783203125, 5.53436279296875, 5.7904052734375, 6.04644775390625, 6.302490234375, 6.55853271484375, 6.8145751953125, 7.07061767578125, 7.32666015625, 7.58270263671875, 7.8387451171875, 8.09478759765625, 8.350830078125, 8.60687255859375, 8.8629150390625, 9.11895751953125, 9.375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 10.0, 8.0, 12.0, 15.0, 20.0, 19.0, 13.0, 37.0, 39.0, 45.0, 51.0, 64.0, 95.0, 77.0, 92.0, 77.0, 64.0, 53.0, 47.0, 36.0, 33.0, 23.0, 12.0, 13.0, 16.0, 14.0, 6.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.2489013671875, -4.103271484375, -3.9576416015625, -3.81201171875, -3.6663818359375, -3.520751953125, -3.3751220703125, -3.2294921875, -3.0838623046875, -2.938232421875, -2.7926025390625, -2.64697265625, -2.5013427734375, -2.355712890625, -2.2100830078125, -2.064453125, -1.9188232421875, -1.773193359375, -1.6275634765625, -1.48193359375, -1.3363037109375, -1.190673828125, -1.0450439453125, -0.8994140625, -0.7537841796875, -0.608154296875, -0.4625244140625, -0.31689453125, -0.1712646484375, -0.025634765625, 0.1199951171875, 0.265625, 0.4112548828125, 0.556884765625, 0.7025146484375, 0.84814453125, 0.9937744140625, 1.139404296875, 1.2850341796875, 1.4306640625, 1.5762939453125, 1.721923828125, 1.8675537109375, 2.01318359375, 2.1588134765625, 2.304443359375, 2.4500732421875, 2.595703125, 2.7413330078125, 2.886962890625, 3.0325927734375, 3.17822265625, 3.3238525390625, 3.469482421875, 3.6151123046875, 3.7607421875, 3.9063720703125, 4.052001953125, 4.1976318359375, 4.34326171875, 4.4888916015625, 4.634521484375, 4.7801513671875, 4.92578125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 19.0, 43.0, 123.0, 195.0, 237.0, 203.0, 121.0, 32.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.48403930664062, -204.03048706054688, -198.57693481445312, -193.12338256835938, -187.66983032226562, -182.2162628173828, -176.76271057128906, -171.3091583251953, -165.85560607910156, -160.4020538330078, -154.94850158691406, -149.4949493408203, -144.0413818359375, -138.58782958984375, -133.13427734375, -127.68072509765625, -122.2271728515625, -116.77362060546875, -111.320068359375, -105.86650848388672, -100.41295623779297, -94.95940399169922, -89.50584411621094, -84.05229187011719, -78.59873962402344, -73.14518737792969, -67.69163513183594, -62.238075256347656, -56.784523010253906, -51.330970764160156, -45.87741470336914, -40.423858642578125, -34.970306396484375, -29.516752243041992, -24.06319808959961, -18.609643936157227, -13.156089782714844, -7.702535629272461, -2.248981475830078, 3.2045745849609375, 8.658126831054688, 14.11168098449707, 19.565235137939453, 25.018789291381836, 30.47234344482422, 35.92589569091797, 41.379451751708984, 46.8330078125, 52.28656005859375, 57.7401123046875, 63.193668365478516, 68.64722442626953, 74.10077667236328, 79.55432891845703, 85.00788879394531, 90.46144104003906, 95.91499328613281, 101.36854553222656, 106.82209777832031, 112.2756576538086, 117.72920989990234, 123.1827621459961, 128.63632202148438, 134.08987426757812, 139.54342651367188]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 11.0, 7.0, 9.0, 11.0, 13.0, 12.0, 13.0, 18.0, 28.0, 29.0, 31.0, 40.0, 36.0, 48.0, 58.0, 46.0, 42.0, 52.0, 52.0, 37.0, 49.0, 49.0, 41.0, 29.0, 31.0, 37.0, 20.0, 30.0, 26.0, 21.0, 17.0, 15.0, 7.0, 6.0, 7.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.8531379699707, -60.965328216552734, -59.0775146484375, -57.18970489501953, -55.3018913269043, -53.41408157348633, -51.526268005371094, -49.638458251953125, -47.750648498535156, -45.86283874511719, -43.97502517700195, -42.087215423583984, -40.19940185546875, -38.31159210205078, -36.42378234863281, -34.53596878051758, -32.648155212402344, -30.760343551635742, -28.87253189086914, -26.984722137451172, -25.096908569335938, -23.20909881591797, -21.321287155151367, -19.433475494384766, -17.545663833618164, -15.657852172851562, -13.770040512084961, -11.882229804992676, -9.994418144226074, -8.106606483459473, -6.2187957763671875, -4.330984115600586, -2.4431686401367188, -0.5553572177886963, 1.3324542045593262, 3.2202653884887695, 5.108077049255371, 6.995888710021973, 8.883699417114258, 10.77151107788086, 12.659322738647461, 14.547134399414062, 16.434946060180664, 18.322757720947266, 20.210567474365234, 22.09838104248047, 23.986190795898438, 25.87400245666504, 27.76181411743164, 29.649625778198242, 31.537437438964844, 33.42524719238281, 35.31306076049805, 37.200870513916016, 39.08868408203125, 40.97649383544922, 42.86430358886719, 44.752113342285156, 46.63992691040039, 48.52773666381836, 50.415550231933594, 52.30335998535156, 54.19116973876953, 56.078983306884766, 57.966796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 4.0, 6.0, 11.0, 15.0, 22.0, 18.0, 29.0, 31.0, 47.0, 78.0, 108.0, 143.0, 246.0, 386.0, 619.0, 1015.0, 1737.0, 3156.0, 5777.0, 11192.0, 23885.0, 58072.0, 182003.0, 892635.0, 2257081.0, 541513.0, 129219.0, 45468.0, 19351.0, 9395.0, 4789.0, 2631.0, 1391.0, 792.0, 516.0, 318.0, 171.0, 138.0, 89.0, 59.0, 34.0, 30.0, 22.0, 16.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.4453125, -4.29888916015625, -4.1524658203125, -4.00604248046875, -3.859619140625, -3.71319580078125, -3.5667724609375, -3.42034912109375, -3.27392578125, -3.12750244140625, -2.9810791015625, -2.83465576171875, -2.688232421875, -2.54180908203125, -2.3953857421875, -2.24896240234375, -2.1025390625, -1.95611572265625, -1.8096923828125, -1.66326904296875, -1.516845703125, -1.37042236328125, -1.2239990234375, -1.07757568359375, -0.93115234375, -0.78472900390625, -0.6383056640625, -0.49188232421875, -0.345458984375, -0.19903564453125, -0.0526123046875, 0.09381103515625, 0.240234375, 0.38665771484375, 0.5330810546875, 0.67950439453125, 0.825927734375, 0.97235107421875, 1.1187744140625, 1.26519775390625, 1.41162109375, 1.55804443359375, 1.7044677734375, 1.85089111328125, 1.997314453125, 2.14373779296875, 2.2901611328125, 2.43658447265625, 2.5830078125, 2.72943115234375, 2.8758544921875, 3.02227783203125, 3.168701171875, 3.31512451171875, 3.4615478515625, 3.60797119140625, 3.75439453125, 3.90081787109375, 4.0472412109375, 4.19366455078125, 4.340087890625, 4.48651123046875, 4.6329345703125, 4.77935791015625, 4.92578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 10.0, 11.0, 13.0, 12.0, 18.0, 14.0, 25.0, 21.0, 31.0, 42.0, 45.0, 44.0, 49.0, 58.0, 70.0, 55.0, 55.0, 55.0, 53.0, 45.0, 44.0, 42.0, 30.0, 34.0, 24.0, 25.0, 19.0, 13.0, 15.0, 9.0, 3.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0], "bins": [-5.171875, -5.050201416015625, -4.92852783203125, -4.806854248046875, -4.6851806640625, -4.563507080078125, -4.44183349609375, -4.320159912109375, -4.198486328125, -4.076812744140625, -3.95513916015625, -3.833465576171875, -3.7117919921875, -3.590118408203125, -3.46844482421875, -3.346771240234375, -3.22509765625, -3.103424072265625, -2.98175048828125, -2.860076904296875, -2.7384033203125, -2.616729736328125, -2.49505615234375, -2.373382568359375, -2.251708984375, -2.130035400390625, -2.00836181640625, -1.886688232421875, -1.7650146484375, -1.643341064453125, -1.52166748046875, -1.399993896484375, -1.2783203125, -1.156646728515625, -1.03497314453125, -0.913299560546875, -0.7916259765625, -0.669952392578125, -0.54827880859375, -0.426605224609375, -0.304931640625, -0.183258056640625, -0.06158447265625, 0.060089111328125, 0.1817626953125, 0.303436279296875, 0.42510986328125, 0.546783447265625, 0.66845703125, 0.790130615234375, 0.91180419921875, 1.033477783203125, 1.1551513671875, 1.276824951171875, 1.39849853515625, 1.520172119140625, 1.641845703125, 1.763519287109375, 1.88519287109375, 2.006866455078125, 2.1285400390625, 2.250213623046875, 2.37188720703125, 2.493560791015625, 2.615234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 2.0, 5.0, 7.0, 14.0, 18.0, 29.0, 32.0, 44.0, 72.0, 90.0, 221.0, 291.0, 591.0, 1289.0, 2761.0, 7033.0, 22262.0, 96138.0, 898001.0, 2872093.0, 231668.0, 42181.0, 11801.0, 4141.0, 1676.0, 787.0, 426.0, 221.0, 121.0, 78.0, 59.0, 36.0, 26.0, 19.0, 6.0, 6.0, 7.0, 10.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-10.671875, -10.39276123046875, -10.1136474609375, -9.83453369140625, -9.555419921875, -9.27630615234375, -8.9971923828125, -8.71807861328125, -8.43896484375, -8.15985107421875, -7.8807373046875, -7.60162353515625, -7.322509765625, -7.04339599609375, -6.7642822265625, -6.48516845703125, -6.2060546875, -5.92694091796875, -5.6478271484375, -5.36871337890625, -5.089599609375, -4.81048583984375, -4.5313720703125, -4.25225830078125, -3.97314453125, -3.69403076171875, -3.4149169921875, -3.13580322265625, -2.856689453125, -2.57757568359375, -2.2984619140625, -2.01934814453125, -1.740234375, -1.46112060546875, -1.1820068359375, -0.90289306640625, -0.623779296875, -0.34466552734375, -0.0655517578125, 0.21356201171875, 0.49267578125, 0.77178955078125, 1.0509033203125, 1.33001708984375, 1.609130859375, 1.88824462890625, 2.1673583984375, 2.44647216796875, 2.7255859375, 3.00469970703125, 3.2838134765625, 3.56292724609375, 3.842041015625, 4.12115478515625, 4.4002685546875, 4.67938232421875, 4.95849609375, 5.23760986328125, 5.5167236328125, 5.79583740234375, 6.074951171875, 6.35406494140625, 6.6331787109375, 6.91229248046875, 7.19140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 7.0, 7.0, 2.0, 11.0, 8.0, 13.0, 21.0, 32.0, 30.0, 53.0, 71.0, 94.0, 160.0, 249.0, 398.0, 622.0, 800.0, 490.0, 331.0, 186.0, 149.0, 98.0, 65.0, 43.0, 29.0, 24.0, 22.0, 14.0, 12.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.7578125, -9.4652099609375, -9.172607421875, -8.8800048828125, -8.58740234375, -8.2947998046875, -8.002197265625, -7.7095947265625, -7.4169921875, -7.1243896484375, -6.831787109375, -6.5391845703125, -6.24658203125, -5.9539794921875, -5.661376953125, -5.3687744140625, -5.076171875, -4.7835693359375, -4.490966796875, -4.1983642578125, -3.90576171875, -3.6131591796875, -3.320556640625, -3.0279541015625, -2.7353515625, -2.4427490234375, -2.150146484375, -1.8575439453125, -1.56494140625, -1.2723388671875, -0.979736328125, -0.6871337890625, -0.39453125, -0.1019287109375, 0.190673828125, 0.4832763671875, 0.77587890625, 1.0684814453125, 1.361083984375, 1.6536865234375, 1.9462890625, 2.2388916015625, 2.531494140625, 2.8240966796875, 3.11669921875, 3.4093017578125, 3.701904296875, 3.9945068359375, 4.287109375, 4.5797119140625, 4.872314453125, 5.1649169921875, 5.45751953125, 5.7501220703125, 6.042724609375, 6.3353271484375, 6.6279296875, 6.9205322265625, 7.213134765625, 7.5057373046875, 7.79833984375, 8.0909423828125, 8.383544921875, 8.6761474609375, 8.96875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 6.0, 9.0, 17.0, 78.0, 303.0, 406.0, 146.0, 29.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-449.61151123046875, -441.33709716796875, -433.0627136230469, -424.7882995605469, -416.513916015625, -408.239501953125, -399.9651184082031, -391.6907043457031, -383.41632080078125, -375.14190673828125, -366.8675231933594, -358.5931091308594, -350.3187255859375, -342.0443115234375, -333.7699279785156, -325.4955139160156, -317.22113037109375, -308.94671630859375, -300.6723327636719, -292.3979187011719, -284.12353515625, -275.84912109375, -267.5747375488281, -259.3003234863281, -251.02590942382812, -242.7515106201172, -234.47711181640625, -226.2027130126953, -217.92831420898438, -209.65391540527344, -201.3795166015625, -193.1051025390625, -184.83071899414062, -176.5563201904297, -168.28192138671875, -160.0075225830078, -151.73312377929688, -143.45872497558594, -135.184326171875, -126.90991973876953, -118.63551330566406, -110.36111450195312, -102.08671569824219, -93.81231689453125, -85.53791809082031, -77.26351928710938, -68.9891128540039, -60.71471405029297, -52.44031524658203, -44.165916442871094, -35.891517639160156, -27.617115020751953, -19.342716217041016, -11.068317413330078, -2.793914794921875, 5.4804840087890625, 13.7548828125, 22.029281616210938, 30.303682327270508, 38.57808303833008, 46.852481842041016, 55.12688064575195, 63.401283264160156, 71.6756820678711, 79.95008087158203]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 9.0, 2.0, 8.0, 5.0, 9.0, 16.0, 18.0, 24.0, 18.0, 34.0, 28.0, 36.0, 24.0, 40.0, 28.0, 49.0, 39.0, 58.0, 59.0, 59.0, 47.0, 65.0, 57.0, 41.0, 33.0, 35.0, 25.0, 29.0, 25.0, 22.0, 15.0, 12.0, 7.0, 9.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.7188606262207, -34.038429260253906, -32.35799789428711, -30.67756462097168, -28.997133255004883, -27.316701889038086, -25.636268615722656, -23.95583724975586, -22.275405883789062, -20.594974517822266, -18.91454315185547, -17.23410987854004, -15.553678512573242, -13.873247146606445, -12.192814826965332, -10.512382507324219, -8.831951141357422, -7.151519298553467, -5.471087455749512, -3.7906556129455566, -2.1102237701416016, -0.4297924041748047, 1.2506399154663086, 2.931072235107422, 4.611503601074219, 6.291935443878174, 7.972367286682129, 9.652799606323242, 11.333230972290039, 13.013662338256836, 14.69409465789795, 16.374526977539062, 18.054962158203125, 19.735393524169922, 21.41582489013672, 23.09625816345215, 24.776689529418945, 26.457120895385742, 28.137554168701172, 29.81798553466797, 31.498416900634766, 33.17884826660156, 34.85927963256836, 36.539710998535156, 38.22014617919922, 39.90057373046875, 41.58100891113281, 43.26144027709961, 44.941871643066406, 46.6223030090332, 48.302734375, 49.9831657409668, 51.663597106933594, 53.344032287597656, 55.02446365356445, 56.70489501953125, 58.38532638549805, 60.065757751464844, 61.74618911743164, 63.42662048339844, 65.1070556640625, 66.78748321533203, 68.4679183959961, 70.14834594726562, 71.82878112792969]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 23.0, 19.0, 31.0, 34.0, 61.0, 82.0, 128.0, 175.0, 305.0, 390.0, 615.0, 954.0, 1390.0, 2199.0, 3478.0, 5868.0, 9959.0, 17429.0, 31376.0, 62534.0, 160174.0, 374844.0, 213058.0, 77159.0, 36954.0, 20002.0, 11386.0, 6775.0, 3990.0, 2436.0, 1504.0, 1118.0, 686.0, 455.0, 288.0, 202.0, 127.0, 104.0, 67.0, 59.0, 36.0, 18.0, 17.0, 8.0, 7.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-6.57421875, -6.37872314453125, -6.1832275390625, -5.98773193359375, -5.792236328125, -5.59674072265625, -5.4012451171875, -5.20574951171875, -5.01025390625, -4.81475830078125, -4.6192626953125, -4.42376708984375, -4.228271484375, -4.03277587890625, -3.8372802734375, -3.64178466796875, -3.4462890625, -3.25079345703125, -3.0552978515625, -2.85980224609375, -2.664306640625, -2.46881103515625, -2.2733154296875, -2.07781982421875, -1.88232421875, -1.68682861328125, -1.4913330078125, -1.29583740234375, -1.100341796875, -0.90484619140625, -0.7093505859375, -0.51385498046875, -0.318359375, -0.12286376953125, 0.0726318359375, 0.26812744140625, 0.463623046875, 0.65911865234375, 0.8546142578125, 1.05010986328125, 1.24560546875, 1.44110107421875, 1.6365966796875, 1.83209228515625, 2.027587890625, 2.22308349609375, 2.4185791015625, 2.61407470703125, 2.8095703125, 3.00506591796875, 3.2005615234375, 3.39605712890625, 3.591552734375, 3.78704833984375, 3.9825439453125, 4.17803955078125, 4.37353515625, 4.56903076171875, 4.7645263671875, 4.96002197265625, 5.155517578125, 5.35101318359375, 5.5465087890625, 5.74200439453125, 5.9375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 6.0, 16.0, 19.0, 22.0, 27.0, 40.0, 43.0, 49.0, 46.0, 70.0, 52.0, 67.0, 81.0, 68.0, 73.0, 55.0, 39.0, 46.0, 41.0, 33.0, 31.0, 20.0, 15.0, 7.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.5625, -6.407073974609375, -6.25164794921875, -6.096221923828125, -5.9407958984375, -5.785369873046875, -5.62994384765625, -5.474517822265625, -5.319091796875, -5.163665771484375, -5.00823974609375, -4.852813720703125, -4.6973876953125, -4.541961669921875, -4.38653564453125, -4.231109619140625, -4.07568359375, -3.920257568359375, -3.76483154296875, -3.609405517578125, -3.4539794921875, -3.298553466796875, -3.14312744140625, -2.987701416015625, -2.832275390625, -2.676849365234375, -2.52142333984375, -2.365997314453125, -2.2105712890625, -2.055145263671875, -1.89971923828125, -1.744293212890625, -1.5888671875, -1.433441162109375, -1.27801513671875, -1.122589111328125, -0.9671630859375, -0.811737060546875, -0.65631103515625, -0.500885009765625, -0.345458984375, -0.190032958984375, -0.03460693359375, 0.120819091796875, 0.2762451171875, 0.431671142578125, 0.58709716796875, 0.742523193359375, 0.89794921875, 1.053375244140625, 1.20880126953125, 1.364227294921875, 1.5196533203125, 1.675079345703125, 1.83050537109375, 1.985931396484375, 2.141357421875, 2.296783447265625, 2.45220947265625, 2.607635498046875, 2.7630615234375, 2.918487548828125, 3.07391357421875, 3.229339599609375, 3.384765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 8.0, 8.0, 13.0, 24.0, 20.0, 39.0, 48.0, 74.0, 108.0, 162.0, 244.0, 415.0, 804.0, 1658.0, 4498.0, 22295.0, 421486.0, 563377.0, 24533.0, 4902.0, 1778.0, 798.0, 432.0, 280.0, 190.0, 104.0, 77.0, 60.0, 29.0, 25.0, 17.0, 10.0, 13.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.984375, -24.3095703125, -23.634765625, -22.9599609375, -22.28515625, -21.6103515625, -20.935546875, -20.2607421875, -19.5859375, -18.9111328125, -18.236328125, -17.5615234375, -16.88671875, -16.2119140625, -15.537109375, -14.8623046875, -14.1875, -13.5126953125, -12.837890625, -12.1630859375, -11.48828125, -10.8134765625, -10.138671875, -9.4638671875, -8.7890625, -8.1142578125, -7.439453125, -6.7646484375, -6.08984375, -5.4150390625, -4.740234375, -4.0654296875, -3.390625, -2.7158203125, -2.041015625, -1.3662109375, -0.69140625, -0.0166015625, 0.658203125, 1.3330078125, 2.0078125, 2.6826171875, 3.357421875, 4.0322265625, 4.70703125, 5.3818359375, 6.056640625, 6.7314453125, 7.40625, 8.0810546875, 8.755859375, 9.4306640625, 10.10546875, 10.7802734375, 11.455078125, 12.1298828125, 12.8046875, 13.4794921875, 14.154296875, 14.8291015625, 15.50390625, 16.1787109375, 16.853515625, 17.5283203125, 18.203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 10.0, 4.0, 6.0, 7.0, 12.0, 15.0, 19.0, 17.0, 31.0, 33.0, 31.0, 34.0, 51.0, 49.0, 43.0, 60.0, 60.0, 68.0, 47.0, 44.0, 57.0, 37.0, 34.0, 33.0, 31.0, 40.0, 29.0, 22.0, 19.0, 17.0, 13.0, 3.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.515625, -17.91455078125, -17.3134765625, -16.71240234375, -16.111328125, -15.51025390625, -14.9091796875, -14.30810546875, -13.70703125, -13.10595703125, -12.5048828125, -11.90380859375, -11.302734375, -10.70166015625, -10.1005859375, -9.49951171875, -8.8984375, -8.29736328125, -7.6962890625, -7.09521484375, -6.494140625, -5.89306640625, -5.2919921875, -4.69091796875, -4.08984375, -3.48876953125, -2.8876953125, -2.28662109375, -1.685546875, -1.08447265625, -0.4833984375, 0.11767578125, 0.71875, 1.31982421875, 1.9208984375, 2.52197265625, 3.123046875, 3.72412109375, 4.3251953125, 4.92626953125, 5.52734375, 6.12841796875, 6.7294921875, 7.33056640625, 7.931640625, 8.53271484375, 9.1337890625, 9.73486328125, 10.3359375, 10.93701171875, 11.5380859375, 12.13916015625, 12.740234375, 13.34130859375, 13.9423828125, 14.54345703125, 15.14453125, 15.74560546875, 16.3466796875, 16.94775390625, 17.548828125, 18.14990234375, 18.7509765625, 19.35205078125, 19.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 11.0, 14.0, 23.0, 23.0, 52.0, 83.0, 140.0, 279.0, 525.0, 1128.0, 3282.0, 12863.0, 78043.0, 794879.0, 132007.0, 17969.0, 4461.0, 1510.0, 601.0, 263.0, 141.0, 91.0, 57.0, 30.0, 16.0, 22.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.83843994140625, -5.6104736328125, -5.38250732421875, -5.154541015625, -4.92657470703125, -4.6986083984375, -4.47064208984375, -4.24267578125, -4.01470947265625, -3.7867431640625, -3.55877685546875, -3.330810546875, -3.10284423828125, -2.8748779296875, -2.64691162109375, -2.4189453125, -2.19097900390625, -1.9630126953125, -1.73504638671875, -1.507080078125, -1.27911376953125, -1.0511474609375, -0.82318115234375, -0.59521484375, -0.36724853515625, -0.1392822265625, 0.08868408203125, 0.316650390625, 0.54461669921875, 0.7725830078125, 1.00054931640625, 1.228515625, 1.45648193359375, 1.6844482421875, 1.91241455078125, 2.140380859375, 2.36834716796875, 2.5963134765625, 2.82427978515625, 3.05224609375, 3.28021240234375, 3.5081787109375, 3.73614501953125, 3.964111328125, 4.19207763671875, 4.4200439453125, 4.64801025390625, 4.8759765625, 5.10394287109375, 5.3319091796875, 5.55987548828125, 5.787841796875, 6.01580810546875, 6.2437744140625, 6.47174072265625, 6.69970703125, 6.92767333984375, 7.1556396484375, 7.38360595703125, 7.611572265625, 7.83953857421875, 8.0675048828125, 8.29547119140625, 8.5234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 13.0, 4.0, 15.0, 12.0, 25.0, 24.0, 27.0, 45.0, 63.0, 124.0, 171.0, 148.0, 95.0, 58.0, 41.0, 28.0, 12.0, 15.0, 11.0, 15.0, 10.0, 14.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015993118286132812, -0.0015546083450317383, -0.0015099048614501953, -0.0014652013778686523, -0.0014204978942871094, -0.0013757944107055664, -0.0013310909271240234, -0.0012863874435424805, -0.0012416839599609375, -0.0011969804763793945, -0.0011522769927978516, -0.0011075735092163086, -0.0010628700256347656, -0.0010181665420532227, -0.0009734630584716797, -0.0009287595748901367, -0.0008840560913085938, -0.0008393526077270508, -0.0007946491241455078, -0.0007499456405639648, -0.0007052421569824219, -0.0006605386734008789, -0.0006158351898193359, -0.000571131706237793, -0.00052642822265625, -0.00048172473907470703, -0.00043702125549316406, -0.0003923177719116211, -0.0003476142883300781, -0.00030291080474853516, -0.0002582073211669922, -0.00021350383758544922, -0.00016880035400390625, -0.00012409687042236328, -7.939338684082031e-05, -3.4689903259277344e-05, 1.0013580322265625e-05, 5.4717063903808594e-05, 9.942054748535156e-05, 0.00014412403106689453, 0.0001888275146484375, 0.00023353099822998047, 0.00027823448181152344, 0.0003229379653930664, 0.0003676414489746094, 0.00041234493255615234, 0.0004570484161376953, 0.0005017518997192383, 0.0005464553833007812, 0.0005911588668823242, 0.0006358623504638672, 0.0006805658340454102, 0.0007252693176269531, 0.0007699728012084961, 0.0008146762847900391, 0.000859379768371582, 0.000904083251953125, 0.000948786735534668, 0.000993490219116211, 0.001038193702697754, 0.0010828971862792969, 0.0011276006698608398, 0.0011723041534423828, 0.0012170076370239258, 0.0012617111206054688]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 9.0, 8.0, 17.0, 16.0, 12.0, 23.0, 48.0, 52.0, 76.0, 99.0, 180.0, 244.0, 441.0, 758.0, 1278.0, 2860.0, 7735.0, 30022.0, 208990.0, 685516.0, 84218.0, 16240.0, 4833.0, 2073.0, 1058.0, 617.0, 371.0, 220.0, 169.0, 107.0, 76.0, 57.0, 33.0, 29.0, 16.0, 16.0, 12.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.36328125, -5.19189453125, -5.0205078125, -4.84912109375, -4.677734375, -4.50634765625, -4.3349609375, -4.16357421875, -3.9921875, -3.82080078125, -3.6494140625, -3.47802734375, -3.306640625, -3.13525390625, -2.9638671875, -2.79248046875, -2.62109375, -2.44970703125, -2.2783203125, -2.10693359375, -1.935546875, -1.76416015625, -1.5927734375, -1.42138671875, -1.25, -1.07861328125, -0.9072265625, -0.73583984375, -0.564453125, -0.39306640625, -0.2216796875, -0.05029296875, 0.12109375, 0.29248046875, 0.4638671875, 0.63525390625, 0.806640625, 0.97802734375, 1.1494140625, 1.32080078125, 1.4921875, 1.66357421875, 1.8349609375, 2.00634765625, 2.177734375, 2.34912109375, 2.5205078125, 2.69189453125, 2.86328125, 3.03466796875, 3.2060546875, 3.37744140625, 3.548828125, 3.72021484375, 3.8916015625, 4.06298828125, 4.234375, 4.40576171875, 4.5771484375, 4.74853515625, 4.919921875, 5.09130859375, 5.2626953125, 5.43408203125, 5.60546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 6.0, 12.0, 9.0, 12.0, 14.0, 23.0, 25.0, 33.0, 37.0, 50.0, 56.0, 83.0, 93.0, 97.0, 73.0, 45.0, 65.0, 57.0, 38.0, 34.0, 21.0, 27.0, 16.0, 10.0, 9.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8748779296875, -4.714599609375, -4.5543212890625, -4.39404296875, -4.2337646484375, -4.073486328125, -3.9132080078125, -3.7529296875, -3.5926513671875, -3.432373046875, -3.2720947265625, -3.11181640625, -2.9515380859375, -2.791259765625, -2.6309814453125, -2.470703125, -2.3104248046875, -2.150146484375, -1.9898681640625, -1.82958984375, -1.6693115234375, -1.509033203125, -1.3487548828125, -1.1884765625, -1.0281982421875, -0.867919921875, -0.7076416015625, -0.54736328125, -0.3870849609375, -0.226806640625, -0.0665283203125, 0.09375, 0.2540283203125, 0.414306640625, 0.5745849609375, 0.73486328125, 0.8951416015625, 1.055419921875, 1.2156982421875, 1.3759765625, 1.5362548828125, 1.696533203125, 1.8568115234375, 2.01708984375, 2.1773681640625, 2.337646484375, 2.4979248046875, 2.658203125, 2.8184814453125, 2.978759765625, 3.1390380859375, 3.29931640625, 3.4595947265625, 3.619873046875, 3.7801513671875, 3.9404296875, 4.1007080078125, 4.260986328125, 4.4212646484375, 4.58154296875, 4.7418212890625, 4.902099609375, 5.0623779296875, 5.22265625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 11.0, 14.0, 30.0, 55.0, 97.0, 133.0, 190.0, 183.0, 105.0, 78.0, 41.0, 20.0, 13.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5271987915039, -97.04827117919922, -93.5693359375, -90.09040832519531, -86.6114730834961, -83.1325454711914, -79.65361022949219, -76.1746826171875, -72.69575500488281, -69.21682739257812, -65.7378921508789, -62.25896453857422, -58.780029296875, -55.30110168457031, -51.82217025756836, -48.343238830566406, -44.86430358886719, -41.385372161865234, -37.90644073486328, -34.427513122558594, -30.948579788208008, -27.469648361206055, -23.990718841552734, -20.51178741455078, -17.032855987548828, -13.553924560546875, -10.074994087219238, -6.596063613891602, -3.1171321868896484, 0.3617992401123047, 3.840728759765625, 7.319660186767578, 10.798599243164062, 14.277530670166016, 17.75646209716797, 21.23539161682129, 24.714323043823242, 28.193254470825195, 31.672183990478516, 35.15111541748047, 38.63004684448242, 42.108978271484375, 45.58790969848633, 49.06684112548828, 52.54576873779297, 56.02470397949219, 59.503631591796875, 62.98256301879883, 66.46149444580078, 69.94042205810547, 73.41935729980469, 76.89828491210938, 80.3772201538086, 83.85614776611328, 87.3350830078125, 90.81401062011719, 94.29293823242188, 97.77186584472656, 101.25080108642578, 104.72972869873047, 108.20866394042969, 111.68759155273438, 115.16651916503906, 118.64545440673828, 122.1243896484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 8.0, 4.0, 12.0, 11.0, 18.0, 11.0, 23.0, 18.0, 39.0, 32.0, 34.0, 45.0, 49.0, 49.0, 88.0, 67.0, 57.0, 62.0, 58.0, 46.0, 49.0, 45.0, 30.0, 25.0, 32.0, 23.0, 15.0, 17.0, 16.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-103.24591064453125, -100.6688232421875, -98.09173583984375, -95.51464080810547, -92.93755340576172, -90.36046600341797, -87.78337860107422, -85.20629119873047, -82.62919616699219, -80.05210876464844, -77.47502136230469, -74.8979263305664, -72.32083892822266, -69.7437515258789, -67.16666412353516, -64.5895767211914, -62.012489318847656, -59.435401916503906, -56.85831069946289, -54.28122329711914, -51.704132080078125, -49.127044677734375, -46.549957275390625, -43.972869873046875, -41.39577865600586, -38.81869125366211, -36.241600036621094, -33.664512634277344, -31.08742332458496, -28.510334014892578, -25.933246612548828, -23.356157302856445, -20.779067993164062, -18.20197868347168, -15.624890327453613, -13.047801971435547, -10.470712661743164, -7.893623352050781, -5.316534996032715, -2.7394466400146484, -0.16235733032226562, 2.414731502532959, 4.991820335388184, 7.568909168243408, 10.145998001098633, 12.723087310791016, 15.300175666809082, 17.87726402282715, 20.45435333251953, 23.031442642211914, 25.608531951904297, 28.185619354248047, 30.76270866394043, 33.33979797363281, 35.91688537597656, 38.49397277832031, 41.07106399536133, 43.64815139770508, 46.225242614746094, 48.802330017089844, 51.379417419433594, 53.95650863647461, 56.53359603881836, 59.110687255859375, 61.687774658203125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 7.0, 13.0, 18.0, 19.0, 20.0, 27.0, 45.0, 66.0, 71.0, 126.0, 197.0, 514.0, 3178.0, 80870.0, 4055935.0, 49988.0, 2233.0, 399.0, 145.0, 91.0, 76.0, 50.0, 39.0, 41.0, 31.0, 11.0, 10.0, 11.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.984375, -24.2373046875, -23.490234375, -22.7431640625, -21.99609375, -21.2490234375, -20.501953125, -19.7548828125, -19.0078125, -18.2607421875, -17.513671875, -16.7666015625, -16.01953125, -15.2724609375, -14.525390625, -13.7783203125, -13.03125, -12.2841796875, -11.537109375, -10.7900390625, -10.04296875, -9.2958984375, -8.548828125, -7.8017578125, -7.0546875, -6.3076171875, -5.560546875, -4.8134765625, -4.06640625, -3.3193359375, -2.572265625, -1.8251953125, -1.078125, -0.3310546875, 0.416015625, 1.1630859375, 1.91015625, 2.6572265625, 3.404296875, 4.1513671875, 4.8984375, 5.6455078125, 6.392578125, 7.1396484375, 7.88671875, 8.6337890625, 9.380859375, 10.1279296875, 10.875, 11.6220703125, 12.369140625, 13.1162109375, 13.86328125, 14.6103515625, 15.357421875, 16.1044921875, 16.8515625, 17.5986328125, 18.345703125, 19.0927734375, 19.83984375, 20.5869140625, 21.333984375, 22.0810546875, 22.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 14.0, 30.0, 33.0, 48.0, 69.0, 74.0, 93.0, 102.0, 110.0, 102.0, 71.0, 64.0, 61.0, 36.0, 27.0, 20.0, 17.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0], "bins": [-10.734375, -10.515838623046875, -10.29730224609375, -10.078765869140625, -9.8602294921875, -9.641693115234375, -9.42315673828125, -9.204620361328125, -8.986083984375, -8.767547607421875, -8.54901123046875, -8.330474853515625, -8.1119384765625, -7.893402099609375, -7.67486572265625, -7.456329345703125, -7.23779296875, -7.019256591796875, -6.80072021484375, -6.582183837890625, -6.3636474609375, -6.145111083984375, -5.92657470703125, -5.708038330078125, -5.489501953125, -5.270965576171875, -5.05242919921875, -4.833892822265625, -4.6153564453125, -4.396820068359375, -4.17828369140625, -3.959747314453125, -3.7412109375, -3.522674560546875, -3.30413818359375, -3.085601806640625, -2.8670654296875, -2.648529052734375, -2.42999267578125, -2.211456298828125, -1.992919921875, -1.774383544921875, -1.55584716796875, -1.337310791015625, -1.1187744140625, -0.900238037109375, -0.68170166015625, -0.463165283203125, -0.24462890625, -0.026092529296875, 0.19244384765625, 0.410980224609375, 0.6295166015625, 0.848052978515625, 1.06658935546875, 1.285125732421875, 1.503662109375, 1.722198486328125, 1.94073486328125, 2.159271240234375, 2.3778076171875, 2.596343994140625, 2.81488037109375, 3.033416748046875, 3.251953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 6.0, 7.0, 11.0, 23.0, 26.0, 49.0, 96.0, 122.0, 212.0, 410.0, 893.0, 1877.0, 5346.0, 17430.0, 79373.0, 890247.0, 2931494.0, 215310.0, 35371.0, 9762.0, 3436.0, 1326.0, 665.0, 328.0, 168.0, 117.0, 57.0, 43.0, 26.0, 11.0, 11.0, 8.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.6973876953125, -9.386962890625, -9.0765380859375, -8.76611328125, -8.4556884765625, -8.145263671875, -7.8348388671875, -7.5244140625, -7.2139892578125, -6.903564453125, -6.5931396484375, -6.28271484375, -5.9722900390625, -5.661865234375, -5.3514404296875, -5.041015625, -4.7305908203125, -4.420166015625, -4.1097412109375, -3.79931640625, -3.4888916015625, -3.178466796875, -2.8680419921875, -2.5576171875, -2.2471923828125, -1.936767578125, -1.6263427734375, -1.31591796875, -1.0054931640625, -0.695068359375, -0.3846435546875, -0.07421875, 0.2362060546875, 0.546630859375, 0.8570556640625, 1.16748046875, 1.4779052734375, 1.788330078125, 2.0987548828125, 2.4091796875, 2.7196044921875, 3.030029296875, 3.3404541015625, 3.65087890625, 3.9613037109375, 4.271728515625, 4.5821533203125, 4.892578125, 5.2030029296875, 5.513427734375, 5.8238525390625, 6.13427734375, 6.4447021484375, 6.755126953125, 7.0655517578125, 7.3759765625, 7.6864013671875, 7.996826171875, 8.3072509765625, 8.61767578125, 8.9281005859375, 9.238525390625, 9.5489501953125, 9.859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 6.0, 13.0, 21.0, 38.0, 56.0, 92.0, 166.0, 301.0, 561.0, 996.0, 793.0, 405.0, 217.0, 146.0, 91.0, 45.0, 27.0, 20.0, 18.0, 14.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.09375, -11.7132568359375, -11.332763671875, -10.9522705078125, -10.57177734375, -10.1912841796875, -9.810791015625, -9.4302978515625, -9.0498046875, -8.6693115234375, -8.288818359375, -7.9083251953125, -7.52783203125, -7.1473388671875, -6.766845703125, -6.3863525390625, -6.005859375, -5.6253662109375, -5.244873046875, -4.8643798828125, -4.48388671875, -4.1033935546875, -3.722900390625, -3.3424072265625, -2.9619140625, -2.5814208984375, -2.200927734375, -1.8204345703125, -1.43994140625, -1.0594482421875, -0.678955078125, -0.2984619140625, 0.08203125, 0.4625244140625, 0.843017578125, 1.2235107421875, 1.60400390625, 1.9844970703125, 2.364990234375, 2.7454833984375, 3.1259765625, 3.5064697265625, 3.886962890625, 4.2674560546875, 4.64794921875, 5.0284423828125, 5.408935546875, 5.7894287109375, 6.169921875, 6.5504150390625, 6.930908203125, 7.3114013671875, 7.69189453125, 8.0723876953125, 8.452880859375, 8.8333740234375, 9.2138671875, 9.5943603515625, 9.974853515625, 10.3553466796875, 10.73583984375, 11.1163330078125, 11.496826171875, 11.8773193359375, 12.2578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 40.0, 69.0, 139.0, 208.0, 210.0, 148.0, 79.0, 37.0, 15.0, 16.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.38055419921875, -58.07809066772461, -54.77562713623047, -51.473167419433594, -48.17070388793945, -44.86824035644531, -41.56577682495117, -38.26331329345703, -34.960853576660156, -31.658390045166016, -28.355928421020508, -25.053464889526367, -21.75100326538086, -18.44853973388672, -15.146076202392578, -11.84361457824707, -8.541149139404297, -5.238686561584473, -1.9362235069274902, 1.3662395477294922, 4.668702125549316, 7.971164703369141, 11.273628234863281, 14.576089859008789, 17.87855339050293, 21.18101692199707, 24.483478546142578, 27.78594207763672, 31.08840560913086, 34.390869140625, 37.693328857421875, 40.995792388916016, 44.298255920410156, 47.6007194519043, 50.90318298339844, 54.20564270019531, 57.50810623168945, 60.810569763183594, 64.113037109375, 67.41549682617188, 70.71795654296875, 74.02041625976562, 77.32288360595703, 80.6253433227539, 83.92781066894531, 87.23027038574219, 90.53273010253906, 93.83519744873047, 97.13766479492188, 100.44012451171875, 103.74259185791016, 107.04505157470703, 110.34751892089844, 113.64997863769531, 116.95243835449219, 120.2549057006836, 123.55736541748047, 126.85982513427734, 130.16229248046875, 133.46475219726562, 136.7672119140625, 140.06967163085938, 143.3721466064453, 146.6746063232422, 149.97706604003906]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 10.0, 14.0, 12.0, 14.0, 12.0, 22.0, 18.0, 22.0, 23.0, 34.0, 31.0, 39.0, 47.0, 36.0, 53.0, 55.0, 50.0, 60.0, 57.0, 54.0, 51.0, 48.0, 44.0, 35.0, 26.0, 29.0, 20.0, 12.0, 17.0, 8.0, 13.0, 8.0, 3.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.728912353515625, -37.204811096191406, -35.68070983886719, -34.15660858154297, -32.632503509521484, -31.108402252197266, -29.584300994873047, -28.060199737548828, -26.536096572875977, -25.011995315551758, -23.487892150878906, -21.963790893554688, -20.43968963623047, -18.915586471557617, -17.3914852142334, -15.867383003234863, -14.343280792236328, -12.819178581237793, -11.295076370239258, -9.770975112915039, -8.246872901916504, -6.722770690917969, -5.19866943359375, -3.674567222595215, -2.1504650115966797, -0.6263630390167236, 0.8977389335632324, 2.4218406677246094, 3.9459428787231445, 5.47004508972168, 6.994146347045898, 8.518248558044434, 10.042350769042969, 11.566452980041504, 13.090555191040039, 14.614656448364258, 16.13875961303711, 17.662860870361328, 19.186962127685547, 20.711063385009766, 22.235166549682617, 23.759267807006836, 25.283370971679688, 26.807472229003906, 28.331573486328125, 29.855676651000977, 31.379777908325195, 32.90388107299805, 34.427982330322266, 35.952083587646484, 37.4761848449707, 39.00028991699219, 40.524391174316406, 42.048492431640625, 43.572593688964844, 45.09669494628906, 46.62079620361328, 48.1448974609375, 49.66899871826172, 51.19309997558594, 52.71720504760742, 54.24130630493164, 55.76540756225586, 57.28950881958008, 58.81361389160156]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 12.0, 6.0, 22.0, 18.0, 48.0, 48.0, 92.0, 133.0, 206.0, 316.0, 520.0, 785.0, 1402.0, 2333.0, 4170.0, 7939.0, 15835.0, 34453.0, 95390.0, 366419.0, 358558.0, 92774.0, 33607.0, 15470.0, 7913.0, 4134.0, 2377.0, 1358.0, 858.0, 471.0, 294.0, 210.0, 129.0, 70.0, 60.0, 41.0, 27.0, 20.0, 10.0, 6.0, 5.0, 6.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.55108642578125, -6.3326416015625, -6.11419677734375, -5.895751953125, -5.67730712890625, -5.4588623046875, -5.24041748046875, -5.02197265625, -4.80352783203125, -4.5850830078125, -4.36663818359375, -4.148193359375, -3.92974853515625, -3.7113037109375, -3.49285888671875, -3.2744140625, -3.05596923828125, -2.8375244140625, -2.61907958984375, -2.400634765625, -2.18218994140625, -1.9637451171875, -1.74530029296875, -1.52685546875, -1.30841064453125, -1.0899658203125, -0.87152099609375, -0.653076171875, -0.43463134765625, -0.2161865234375, 0.00225830078125, 0.220703125, 0.43914794921875, 0.6575927734375, 0.87603759765625, 1.094482421875, 1.31292724609375, 1.5313720703125, 1.74981689453125, 1.96826171875, 2.18670654296875, 2.4051513671875, 2.62359619140625, 2.842041015625, 3.06048583984375, 3.2789306640625, 3.49737548828125, 3.7158203125, 3.93426513671875, 4.1527099609375, 4.37115478515625, 4.589599609375, 4.80804443359375, 5.0264892578125, 5.24493408203125, 5.46337890625, 5.68182373046875, 5.9002685546875, 6.11871337890625, 6.337158203125, 6.55560302734375, 6.7740478515625, 6.99249267578125, 7.2109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 8.0, 4.0, 19.0, 16.0, 15.0, 20.0, 32.0, 23.0, 35.0, 44.0, 55.0, 51.0, 51.0, 66.0, 46.0, 54.0, 62.0, 63.0, 63.0, 39.0, 40.0, 29.0, 29.0, 27.0, 16.0, 20.0, 13.0, 12.0, 13.0, 10.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.632904052734375, -4.50018310546875, -4.367462158203125, -4.2347412109375, -4.102020263671875, -3.96929931640625, -3.836578369140625, -3.703857421875, -3.571136474609375, -3.43841552734375, -3.305694580078125, -3.1729736328125, -3.040252685546875, -2.90753173828125, -2.774810791015625, -2.64208984375, -2.509368896484375, -2.37664794921875, -2.243927001953125, -2.1112060546875, -1.978485107421875, -1.84576416015625, -1.713043212890625, -1.580322265625, -1.447601318359375, -1.31488037109375, -1.182159423828125, -1.0494384765625, -0.916717529296875, -0.78399658203125, -0.651275634765625, -0.5185546875, -0.385833740234375, -0.25311279296875, -0.120391845703125, 0.0123291015625, 0.145050048828125, 0.27777099609375, 0.410491943359375, 0.543212890625, 0.675933837890625, 0.80865478515625, 0.941375732421875, 1.0740966796875, 1.206817626953125, 1.33953857421875, 1.472259521484375, 1.60498046875, 1.737701416015625, 1.87042236328125, 2.003143310546875, 2.1358642578125, 2.268585205078125, 2.40130615234375, 2.534027099609375, 2.666748046875, 2.799468994140625, 2.93218994140625, 3.064910888671875, 3.1976318359375, 3.330352783203125, 3.46307373046875, 3.595794677734375, 3.728515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 14.0, 19.0, 23.0, 37.0, 50.0, 70.0, 111.0, 173.0, 327.0, 683.0, 1489.0, 4010.0, 17381.0, 158904.0, 801134.0, 50871.0, 8674.0, 2425.0, 966.0, 481.0, 260.0, 135.0, 95.0, 78.0, 40.0, 20.0, 20.0, 19.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.3165283203125, -13.750244140625, -13.1839599609375, -12.61767578125, -12.0513916015625, -11.485107421875, -10.9188232421875, -10.3525390625, -9.7862548828125, -9.219970703125, -8.6536865234375, -8.08740234375, -7.5211181640625, -6.954833984375, -6.3885498046875, -5.822265625, -5.2559814453125, -4.689697265625, -4.1234130859375, -3.55712890625, -2.9908447265625, -2.424560546875, -1.8582763671875, -1.2919921875, -0.7257080078125, -0.159423828125, 0.4068603515625, 0.97314453125, 1.5394287109375, 2.105712890625, 2.6719970703125, 3.23828125, 3.8045654296875, 4.370849609375, 4.9371337890625, 5.50341796875, 6.0697021484375, 6.635986328125, 7.2022705078125, 7.7685546875, 8.3348388671875, 8.901123046875, 9.4674072265625, 10.03369140625, 10.5999755859375, 11.166259765625, 11.7325439453125, 12.298828125, 12.8651123046875, 13.431396484375, 13.9976806640625, 14.56396484375, 15.1302490234375, 15.696533203125, 16.2628173828125, 16.8291015625, 17.3953857421875, 17.961669921875, 18.5279541015625, 19.09423828125, 19.6605224609375, 20.226806640625, 20.7930908203125, 21.359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 7.0, 4.0, 10.0, 14.0, 13.0, 15.0, 17.0, 21.0, 28.0, 45.0, 45.0, 48.0, 49.0, 54.0, 54.0, 56.0, 73.0, 54.0, 42.0, 45.0, 60.0, 36.0, 24.0, 35.0, 34.0, 24.0, 18.0, 17.0, 11.0, 10.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.8193359375, -18.232421875, -17.6455078125, -17.05859375, -16.4716796875, -15.884765625, -15.2978515625, -14.7109375, -14.1240234375, -13.537109375, -12.9501953125, -12.36328125, -11.7763671875, -11.189453125, -10.6025390625, -10.015625, -9.4287109375, -8.841796875, -8.2548828125, -7.66796875, -7.0810546875, -6.494140625, -5.9072265625, -5.3203125, -4.7333984375, -4.146484375, -3.5595703125, -2.97265625, -2.3857421875, -1.798828125, -1.2119140625, -0.625, -0.0380859375, 0.548828125, 1.1357421875, 1.72265625, 2.3095703125, 2.896484375, 3.4833984375, 4.0703125, 4.6572265625, 5.244140625, 5.8310546875, 6.41796875, 7.0048828125, 7.591796875, 8.1787109375, 8.765625, 9.3525390625, 9.939453125, 10.5263671875, 11.11328125, 11.7001953125, 12.287109375, 12.8740234375, 13.4609375, 14.0478515625, 14.634765625, 15.2216796875, 15.80859375, 16.3955078125, 16.982421875, 17.5693359375, 18.15625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 11.0, 11.0, 27.0, 43.0, 47.0, 84.0, 198.0, 401.0, 1268.0, 5035.0, 31464.0, 585493.0, 392094.0, 25963.0, 4342.0, 1229.0, 380.0, 201.0, 107.0, 53.0, 26.0, 23.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.40313720703125, -7.1383056640625, -6.87347412109375, -6.608642578125, -6.34381103515625, -6.0789794921875, -5.81414794921875, -5.54931640625, -5.28448486328125, -5.0196533203125, -4.75482177734375, -4.489990234375, -4.22515869140625, -3.9603271484375, -3.69549560546875, -3.4306640625, -3.16583251953125, -2.9010009765625, -2.63616943359375, -2.371337890625, -2.10650634765625, -1.8416748046875, -1.57684326171875, -1.31201171875, -1.04718017578125, -0.7823486328125, -0.51751708984375, -0.252685546875, 0.01214599609375, 0.2769775390625, 0.54180908203125, 0.806640625, 1.07147216796875, 1.3363037109375, 1.60113525390625, 1.865966796875, 2.13079833984375, 2.3956298828125, 2.66046142578125, 2.92529296875, 3.19012451171875, 3.4549560546875, 3.71978759765625, 3.984619140625, 4.24945068359375, 4.5142822265625, 4.77911376953125, 5.0439453125, 5.30877685546875, 5.5736083984375, 5.83843994140625, 6.103271484375, 6.36810302734375, 6.6329345703125, 6.89776611328125, 7.16259765625, 7.42742919921875, 7.6922607421875, 7.95709228515625, 8.221923828125, 8.48675537109375, 8.7515869140625, 9.01641845703125, 9.28125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 12.0, 10.0, 17.0, 13.0, 19.0, 18.0, 30.0, 59.0, 92.0, 108.0, 110.0, 139.0, 80.0, 63.0, 54.0, 33.0, 31.0, 11.0, 22.0, 10.0, 13.0, 8.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011806488037109375, -0.0011445283889770508, -0.001108407974243164, -0.0010722875595092773, -0.0010361671447753906, -0.001000046730041504, -0.0009639263153076172, -0.0009278059005737305, -0.0008916854858398438, -0.000855565071105957, -0.0008194446563720703, -0.0007833242416381836, -0.0007472038269042969, -0.0007110834121704102, -0.0006749629974365234, -0.0006388425827026367, -0.00060272216796875, -0.0005666017532348633, -0.0005304813385009766, -0.0004943609237670898, -0.0004582405090332031, -0.0004221200942993164, -0.0003859996795654297, -0.00034987926483154297, -0.00031375885009765625, -0.00027763843536376953, -0.0002415180206298828, -0.0002053976058959961, -0.00016927719116210938, -0.00013315677642822266, -9.703636169433594e-05, -6.091594696044922e-05, -2.47955322265625e-05, 1.1324882507324219e-05, 4.744529724121094e-05, 8.356571197509766e-05, 0.00011968612670898438, 0.0001558065414428711, 0.0001919269561767578, 0.00022804737091064453, 0.00026416778564453125, 0.00030028820037841797, 0.0003364086151123047, 0.0003725290298461914, 0.0004086494445800781, 0.00044476985931396484, 0.00048089027404785156, 0.0005170106887817383, 0.000553131103515625, 0.0005892515182495117, 0.0006253719329833984, 0.0006614923477172852, 0.0006976127624511719, 0.0007337331771850586, 0.0007698535919189453, 0.000805974006652832, 0.0008420944213867188, 0.0008782148361206055, 0.0009143352508544922, 0.0009504556655883789, 0.0009865760803222656, 0.0010226964950561523, 0.001058816909790039, 0.0010949373245239258, 0.0011310577392578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 9.0, 16.0, 23.0, 67.0, 115.0, 232.0, 507.0, 1439.0, 6097.0, 56089.0, 850370.0, 121123.0, 9279.0, 1967.0, 640.0, 278.0, 139.0, 72.0, 29.0, 21.0, 10.0, 6.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76171875, -6.46282958984375, -6.1639404296875, -5.86505126953125, -5.566162109375, -5.26727294921875, -4.9683837890625, -4.66949462890625, -4.37060546875, -4.07171630859375, -3.7728271484375, -3.47393798828125, -3.175048828125, -2.87615966796875, -2.5772705078125, -2.27838134765625, -1.9794921875, -1.68060302734375, -1.3817138671875, -1.08282470703125, -0.783935546875, -0.48504638671875, -0.1861572265625, 0.11273193359375, 0.41162109375, 0.71051025390625, 1.0093994140625, 1.30828857421875, 1.607177734375, 1.90606689453125, 2.2049560546875, 2.50384521484375, 2.802734375, 3.10162353515625, 3.4005126953125, 3.69940185546875, 3.998291015625, 4.29718017578125, 4.5960693359375, 4.89495849609375, 5.19384765625, 5.49273681640625, 5.7916259765625, 6.09051513671875, 6.389404296875, 6.68829345703125, 6.9871826171875, 7.28607177734375, 7.5849609375, 7.88385009765625, 8.1827392578125, 8.48162841796875, 8.780517578125, 9.07940673828125, 9.3782958984375, 9.67718505859375, 9.97607421875, 10.27496337890625, 10.5738525390625, 10.87274169921875, 11.171630859375, 11.47052001953125, 11.7694091796875, 12.06829833984375, 12.3671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 17.0, 16.0, 26.0, 30.0, 43.0, 56.0, 74.0, 103.0, 118.0, 112.0, 97.0, 110.0, 38.0, 47.0, 30.0, 16.0, 17.0, 15.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-9.265625, -9.05487060546875, -8.8441162109375, -8.63336181640625, -8.422607421875, -8.21185302734375, -8.0010986328125, -7.79034423828125, -7.57958984375, -7.36883544921875, -7.1580810546875, -6.94732666015625, -6.736572265625, -6.52581787109375, -6.3150634765625, -6.10430908203125, -5.8935546875, -5.68280029296875, -5.4720458984375, -5.26129150390625, -5.050537109375, -4.83978271484375, -4.6290283203125, -4.41827392578125, -4.20751953125, -3.99676513671875, -3.7860107421875, -3.57525634765625, -3.364501953125, -3.15374755859375, -2.9429931640625, -2.73223876953125, -2.521484375, -2.31072998046875, -2.0999755859375, -1.88922119140625, -1.678466796875, -1.46771240234375, -1.2569580078125, -1.04620361328125, -0.83544921875, -0.62469482421875, -0.4139404296875, -0.20318603515625, 0.007568359375, 0.21832275390625, 0.4290771484375, 0.63983154296875, 0.8505859375, 1.06134033203125, 1.2720947265625, 1.48284912109375, 1.693603515625, 1.90435791015625, 2.1151123046875, 2.32586669921875, 2.53662109375, 2.74737548828125, 2.9581298828125, 3.16888427734375, 3.379638671875, 3.59039306640625, 3.8011474609375, 4.01190185546875, 4.22265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 17.0, 30.0, 54.0, 108.0, 185.0, 238.0, 165.0, 105.0, 41.0, 22.0, 7.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-172.4517822265625, -168.65771484375, -164.86366271972656, -161.06959533691406, -157.27554321289062, -153.48147583007812, -149.6874237060547, -145.8933563232422, -142.09930419921875, -138.30523681640625, -134.5111846923828, -130.7171173095703, -126.92306518554688, -123.1290054321289, -119.33494567871094, -115.54088592529297, -111.746826171875, -107.95276641845703, -104.15870666503906, -100.3646469116211, -96.57058715820312, -92.77652740478516, -88.98246765136719, -85.18840789794922, -81.39434051513672, -77.60028076171875, -73.80622100830078, -70.01216125488281, -66.21810150146484, -62.424041748046875, -58.629981994628906, -54.83592224121094, -51.04186248779297, -47.247802734375, -43.45374298095703, -39.65968322753906, -35.865623474121094, -32.071563720703125, -28.277502059936523, -24.483442306518555, -20.689382553100586, -16.895322799682617, -13.101263046264648, -9.307202339172363, -5.5131425857543945, -1.7190818786621094, 2.0749778747558594, 5.869037628173828, 9.663097381591797, 13.457157135009766, 17.251216888427734, 21.045276641845703, 24.839336395263672, 28.633398056030273, 32.427459716796875, 36.221519470214844, 40.01557922363281, 43.80963897705078, 47.60369873046875, 51.39775848388672, 55.19181823730469, 58.985877990722656, 62.779937744140625, 66.5739974975586, 70.36805725097656]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 7.0, 7.0, 12.0, 11.0, 6.0, 15.0, 13.0, 24.0, 39.0, 28.0, 22.0, 39.0, 31.0, 37.0, 54.0, 49.0, 50.0, 66.0, 49.0, 47.0, 32.0, 43.0, 57.0, 31.0, 21.0, 26.0, 31.0, 19.0, 17.0, 19.0, 15.0, 13.0, 16.0, 13.0, 9.0, 5.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.6159896850586, -63.55924606323242, -61.50250244140625, -59.44575881958008, -57.389015197753906, -55.332275390625, -53.27553176879883, -51.218788146972656, -49.162044525146484, -47.10530090332031, -45.04855728149414, -42.99181365966797, -40.93507385253906, -38.878326416015625, -36.82158660888672, -34.76484298706055, -32.708099365234375, -30.651355743408203, -28.59461212158203, -26.537870407104492, -24.48112678527832, -22.42438316345215, -20.36764144897461, -18.310897827148438, -16.254154205322266, -14.197410583496094, -12.140667915344238, -10.083925247192383, -8.027181625366211, -5.970438003540039, -3.9136953353881836, -1.8569526672363281, 0.1997833251953125, 2.256526470184326, 4.31326961517334, 6.3700127601623535, 8.426755905151367, 10.483499526977539, 12.540242195129395, 14.59698486328125, 16.653728485107422, 18.710472106933594, 20.767215728759766, 22.823957443237305, 24.880701065063477, 26.93744468688965, 28.994186401367188, 31.05093002319336, 33.10767364501953, 35.1644172668457, 37.221160888671875, 39.27790451049805, 41.33464813232422, 43.391387939453125, 45.4481315612793, 47.50487518310547, 49.56161880493164, 51.61836242675781, 53.675106048583984, 55.731849670410156, 57.78858947753906, 59.8453369140625, 61.902076721191406, 63.95882034301758, 66.01556396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 10.0, 13.0, 17.0, 37.0, 45.0, 70.0, 105.0, 212.0, 365.0, 720.0, 1392.0, 3054.0, 6612.0, 15704.0, 41312.0, 125637.0, 505212.0, 1899065.0, 1199828.0, 271167.0, 77064.0, 27269.0, 10810.0, 4542.0, 2021.0, 1030.0, 440.0, 221.0, 136.0, 65.0, 39.0, 18.0, 11.0, 6.0, 5.0, 4.0, 9.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.1180419921875, -4.966552734375, -4.8150634765625, -4.66357421875, -4.5120849609375, -4.360595703125, -4.2091064453125, -4.0576171875, -3.9061279296875, -3.754638671875, -3.6031494140625, -3.45166015625, -3.3001708984375, -3.148681640625, -2.9971923828125, -2.845703125, -2.6942138671875, -2.542724609375, -2.3912353515625, -2.23974609375, -2.0882568359375, -1.936767578125, -1.7852783203125, -1.6337890625, -1.4822998046875, -1.330810546875, -1.1793212890625, -1.02783203125, -0.8763427734375, -0.724853515625, -0.5733642578125, -0.421875, -0.2703857421875, -0.118896484375, 0.0325927734375, 0.18408203125, 0.3355712890625, 0.487060546875, 0.6385498046875, 0.7900390625, 0.9415283203125, 1.093017578125, 1.2445068359375, 1.39599609375, 1.5474853515625, 1.698974609375, 1.8504638671875, 2.001953125, 2.1534423828125, 2.304931640625, 2.4564208984375, 2.60791015625, 2.7593994140625, 2.910888671875, 3.0623779296875, 3.2138671875, 3.3653564453125, 3.516845703125, 3.6683349609375, 3.81982421875, 3.9713134765625, 4.122802734375, 4.2742919921875, 4.42578125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 6.0, 20.0, 19.0, 24.0, 42.0, 37.0, 56.0, 63.0, 74.0, 84.0, 60.0, 71.0, 70.0, 65.0, 53.0, 49.0, 39.0, 40.0, 29.0, 23.0, 24.0, 16.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.921875, -6.761322021484375, -6.60076904296875, -6.440216064453125, -6.2796630859375, -6.119110107421875, -5.95855712890625, -5.798004150390625, -5.637451171875, -5.476898193359375, -5.31634521484375, -5.155792236328125, -4.9952392578125, -4.834686279296875, -4.67413330078125, -4.513580322265625, -4.35302734375, -4.192474365234375, -4.03192138671875, -3.871368408203125, -3.7108154296875, -3.550262451171875, -3.38970947265625, -3.229156494140625, -3.068603515625, -2.908050537109375, -2.74749755859375, -2.586944580078125, -2.4263916015625, -2.265838623046875, -2.10528564453125, -1.944732666015625, -1.7841796875, -1.623626708984375, -1.46307373046875, -1.302520751953125, -1.1419677734375, -0.981414794921875, -0.82086181640625, -0.660308837890625, -0.499755859375, -0.339202880859375, -0.17864990234375, -0.018096923828125, 0.1424560546875, 0.303009033203125, 0.46356201171875, 0.624114990234375, 0.78466796875, 0.945220947265625, 1.10577392578125, 1.266326904296875, 1.4268798828125, 1.587432861328125, 1.74798583984375, 1.908538818359375, 2.069091796875, 2.229644775390625, 2.39019775390625, 2.550750732421875, 2.7113037109375, 2.871856689453125, 3.03240966796875, 3.192962646484375, 3.353515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 7.0, 13.0, 20.0, 35.0, 55.0, 50.0, 81.0, 133.0, 271.0, 519.0, 1131.0, 3066.0, 9747.0, 42143.0, 263491.0, 2623704.0, 1094514.0, 120757.0, 23997.0, 6481.0, 2219.0, 828.0, 416.0, 216.0, 123.0, 66.0, 58.0, 34.0, 24.0, 22.0, 12.0, 16.0, 4.0, 4.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0390625, -9.73291015625, -9.4267578125, -9.12060546875, -8.814453125, -8.50830078125, -8.2021484375, -7.89599609375, -7.58984375, -7.28369140625, -6.9775390625, -6.67138671875, -6.365234375, -6.05908203125, -5.7529296875, -5.44677734375, -5.140625, -4.83447265625, -4.5283203125, -4.22216796875, -3.916015625, -3.60986328125, -3.3037109375, -2.99755859375, -2.69140625, -2.38525390625, -2.0791015625, -1.77294921875, -1.466796875, -1.16064453125, -0.8544921875, -0.54833984375, -0.2421875, 0.06396484375, 0.3701171875, 0.67626953125, 0.982421875, 1.28857421875, 1.5947265625, 1.90087890625, 2.20703125, 2.51318359375, 2.8193359375, 3.12548828125, 3.431640625, 3.73779296875, 4.0439453125, 4.35009765625, 4.65625, 4.96240234375, 5.2685546875, 5.57470703125, 5.880859375, 6.18701171875, 6.4931640625, 6.79931640625, 7.10546875, 7.41162109375, 7.7177734375, 8.02392578125, 8.330078125, 8.63623046875, 8.9423828125, 9.24853515625, 9.5546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 9.0, 13.0, 16.0, 26.0, 17.0, 25.0, 30.0, 58.0, 61.0, 91.0, 143.0, 154.0, 228.0, 321.0, 421.0, 527.0, 467.0, 350.0, 260.0, 222.0, 146.0, 102.0, 88.0, 53.0, 54.0, 44.0, 25.0, 25.0, 19.0, 12.0, 13.0, 15.0, 6.0, 4.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.8515625, -8.5731201171875, -8.294677734375, -8.0162353515625, -7.73779296875, -7.4593505859375, -7.180908203125, -6.9024658203125, -6.6240234375, -6.3455810546875, -6.067138671875, -5.7886962890625, -5.51025390625, -5.2318115234375, -4.953369140625, -4.6749267578125, -4.396484375, -4.1180419921875, -3.839599609375, -3.5611572265625, -3.28271484375, -3.0042724609375, -2.725830078125, -2.4473876953125, -2.1689453125, -1.8905029296875, -1.612060546875, -1.3336181640625, -1.05517578125, -0.7767333984375, -0.498291015625, -0.2198486328125, 0.05859375, 0.3370361328125, 0.615478515625, 0.8939208984375, 1.17236328125, 1.4508056640625, 1.729248046875, 2.0076904296875, 2.2861328125, 2.5645751953125, 2.843017578125, 3.1214599609375, 3.39990234375, 3.6783447265625, 3.956787109375, 4.2352294921875, 4.513671875, 4.7921142578125, 5.070556640625, 5.3489990234375, 5.62744140625, 5.9058837890625, 6.184326171875, 6.4627685546875, 6.7412109375, 7.0196533203125, 7.298095703125, 7.5765380859375, 7.85498046875, 8.1334228515625, 8.411865234375, 8.6903076171875, 8.96875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 27.0, 59.0, 156.0, 242.0, 232.0, 141.0, 55.0, 33.0, 12.0, 6.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.96585083007812, -191.03646850585938, -186.10708618164062, -181.17770385742188, -176.24832153320312, -171.31893920898438, -166.38955688476562, -161.46017456054688, -156.53079223632812, -151.60140991210938, -146.67202758789062, -141.74264526367188, -136.81326293945312, -131.88388061523438, -126.95449829101562, -122.02511596679688, -117.09573364257812, -112.16635131835938, -107.23696899414062, -102.30758666992188, -97.37820434570312, -92.44882202148438, -87.51943969726562, -82.59005737304688, -77.66067504882812, -72.73129272460938, -67.80191040039062, -62.872528076171875, -57.943145751953125, -53.013763427734375, -48.084381103515625, -43.154998779296875, -38.225616455078125, -33.296234130859375, -28.366851806640625, -23.437469482421875, -18.508087158203125, -13.578704833984375, -8.649322509765625, -3.719940185546875, 1.209442138671875, 6.138824462890625, 11.068206787109375, 15.997589111328125, 20.926971435546875, 25.856353759765625, 30.785736083984375, 35.715118408203125, 40.644500732421875, 45.573883056640625, 50.503265380859375, 55.432647705078125, 60.362030029296875, 65.29141235351562, 70.22079467773438, 75.15017700195312, 80.07955932617188, 85.00894165039062, 89.93832397460938, 94.86770629882812, 99.79708862304688, 104.72647094726562, 109.65585327148438, 114.58523559570312, 119.51461791992188]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 6.0, 7.0, 6.0, 11.0, 5.0, 16.0, 13.0, 20.0, 20.0, 24.0, 39.0, 32.0, 49.0, 43.0, 40.0, 45.0, 47.0, 50.0, 61.0, 49.0, 52.0, 33.0, 45.0, 44.0, 36.0, 33.0, 34.0, 25.0, 23.0, 21.0, 17.0, 16.0, 11.0, 8.0, 2.0, 2.0, 7.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.158912658691406, -50.22468566894531, -48.290462493896484, -46.35623550415039, -44.42201232910156, -42.48778533935547, -40.553558349609375, -38.61933135986328, -36.68510818481445, -34.75088119506836, -32.81665802001953, -30.882431030273438, -28.948205947875977, -27.013980865478516, -25.079753875732422, -23.14552879333496, -21.2113037109375, -19.27707862854004, -17.342853546142578, -15.408626556396484, -13.474401473999023, -11.540176391601562, -9.605950355529785, -7.671724319458008, -5.737499237060547, -3.8032736778259277, -1.8690481185913086, 0.06517744064331055, 1.9994029998779297, 3.9336280822753906, 5.867854118347168, 7.802080154418945, 9.736305236816406, 11.670530319213867, 13.604756355285645, 15.538982391357422, 17.473207473754883, 19.407432556152344, 21.341659545898438, 23.2758846282959, 25.21010971069336, 27.14433479309082, 29.07855987548828, 31.012786865234375, 32.94701385498047, 34.8812370300293, 36.81546401977539, 38.74968719482422, 40.68391418457031, 42.618141174316406, 44.552364349365234, 46.48659133911133, 48.420814514160156, 50.35504150390625, 52.289268493652344, 54.22349548339844, 56.157718658447266, 58.09194564819336, 60.02616882324219, 61.96039581298828, 63.894622802734375, 65.82884216308594, 67.76306915283203, 69.69729614257812, 71.63152313232422]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 13.0, 7.0, 17.0, 27.0, 48.0, 56.0, 107.0, 171.0, 231.0, 364.0, 584.0, 1075.0, 1749.0, 3158.0, 5640.0, 10624.0, 21025.0, 43165.0, 96458.0, 259795.0, 353386.0, 135712.0, 57576.0, 27557.0, 13578.0, 7088.0, 3820.0, 2209.0, 1291.0, 769.0, 439.0, 290.0, 177.0, 117.0, 77.0, 59.0, 28.0, 21.0, 12.0, 6.0, 8.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.66796875, -6.44708251953125, -6.2261962890625, -6.00531005859375, -5.784423828125, -5.56353759765625, -5.3426513671875, -5.12176513671875, -4.90087890625, -4.67999267578125, -4.4591064453125, -4.23822021484375, -4.017333984375, -3.79644775390625, -3.5755615234375, -3.35467529296875, -3.1337890625, -2.91290283203125, -2.6920166015625, -2.47113037109375, -2.250244140625, -2.02935791015625, -1.8084716796875, -1.58758544921875, -1.36669921875, -1.14581298828125, -0.9249267578125, -0.70404052734375, -0.483154296875, -0.26226806640625, -0.0413818359375, 0.17950439453125, 0.400390625, 0.62127685546875, 0.8421630859375, 1.06304931640625, 1.283935546875, 1.50482177734375, 1.7257080078125, 1.94659423828125, 2.16748046875, 2.38836669921875, 2.6092529296875, 2.83013916015625, 3.051025390625, 3.27191162109375, 3.4927978515625, 3.71368408203125, 3.9345703125, 4.15545654296875, 4.3763427734375, 4.59722900390625, 4.818115234375, 5.03900146484375, 5.2598876953125, 5.48077392578125, 5.70166015625, 5.92254638671875, 6.1434326171875, 6.36431884765625, 6.585205078125, 6.80609130859375, 7.0269775390625, 7.24786376953125, 7.46875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 7.0, 12.0, 10.0, 10.0, 15.0, 24.0, 20.0, 20.0, 46.0, 37.0, 39.0, 38.0, 45.0, 53.0, 62.0, 42.0, 41.0, 50.0, 39.0, 41.0, 48.0, 47.0, 40.0, 29.0, 30.0, 19.0, 17.0, 18.0, 27.0, 16.0, 8.0, 12.0, 12.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.970123291015625, -3.85430908203125, -3.738494873046875, -3.6226806640625, -3.506866455078125, -3.39105224609375, -3.275238037109375, -3.159423828125, -3.043609619140625, -2.92779541015625, -2.811981201171875, -2.6961669921875, -2.580352783203125, -2.46453857421875, -2.348724365234375, -2.23291015625, -2.117095947265625, -2.00128173828125, -1.885467529296875, -1.7696533203125, -1.653839111328125, -1.53802490234375, -1.422210693359375, -1.306396484375, -1.190582275390625, -1.07476806640625, -0.958953857421875, -0.8431396484375, -0.727325439453125, -0.61151123046875, -0.495697021484375, -0.3798828125, -0.264068603515625, -0.14825439453125, -0.032440185546875, 0.0833740234375, 0.199188232421875, 0.31500244140625, 0.430816650390625, 0.546630859375, 0.662445068359375, 0.77825927734375, 0.894073486328125, 1.0098876953125, 1.125701904296875, 1.24151611328125, 1.357330322265625, 1.47314453125, 1.588958740234375, 1.70477294921875, 1.820587158203125, 1.9364013671875, 2.052215576171875, 2.16802978515625, 2.283843994140625, 2.399658203125, 2.515472412109375, 2.63128662109375, 2.747100830078125, 2.8629150390625, 2.978729248046875, 3.09454345703125, 3.210357666015625, 3.326171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 5.0, 13.0, 15.0, 22.0, 32.0, 35.0, 52.0, 86.0, 117.0, 163.0, 225.0, 340.0, 502.0, 901.0, 1598.0, 3286.0, 9281.0, 43225.0, 605139.0, 334202.0, 34349.0, 8041.0, 3015.0, 1534.0, 853.0, 505.0, 335.0, 177.0, 117.0, 92.0, 76.0, 62.0, 41.0, 24.0, 13.0, 19.0, 13.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.546875, -19.958740234375, -19.37060546875, -18.782470703125, -18.1943359375, -17.606201171875, -17.01806640625, -16.429931640625, -15.841796875, -15.253662109375, -14.66552734375, -14.077392578125, -13.4892578125, -12.901123046875, -12.31298828125, -11.724853515625, -11.13671875, -10.548583984375, -9.96044921875, -9.372314453125, -8.7841796875, -8.196044921875, -7.60791015625, -7.019775390625, -6.431640625, -5.843505859375, -5.25537109375, -4.667236328125, -4.0791015625, -3.490966796875, -2.90283203125, -2.314697265625, -1.7265625, -1.138427734375, -0.55029296875, 0.037841796875, 0.6259765625, 1.214111328125, 1.80224609375, 2.390380859375, 2.978515625, 3.566650390625, 4.15478515625, 4.742919921875, 5.3310546875, 5.919189453125, 6.50732421875, 7.095458984375, 7.68359375, 8.271728515625, 8.85986328125, 9.447998046875, 10.0361328125, 10.624267578125, 11.21240234375, 11.800537109375, 12.388671875, 12.976806640625, 13.56494140625, 14.153076171875, 14.7412109375, 15.329345703125, 15.91748046875, 16.505615234375, 17.09375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 12.0, 11.0, 23.0, 17.0, 41.0, 43.0, 36.0, 43.0, 66.0, 55.0, 67.0, 53.0, 70.0, 50.0, 64.0, 59.0, 54.0, 55.0, 30.0, 29.0, 24.0, 18.0, 19.0, 11.0, 8.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.953125, -19.236572265625, -18.52001953125, -17.803466796875, -17.0869140625, -16.370361328125, -15.65380859375, -14.937255859375, -14.220703125, -13.504150390625, -12.78759765625, -12.071044921875, -11.3544921875, -10.637939453125, -9.92138671875, -9.204833984375, -8.48828125, -7.771728515625, -7.05517578125, -6.338623046875, -5.6220703125, -4.905517578125, -4.18896484375, -3.472412109375, -2.755859375, -2.039306640625, -1.32275390625, -0.606201171875, 0.1103515625, 0.826904296875, 1.54345703125, 2.260009765625, 2.9765625, 3.693115234375, 4.40966796875, 5.126220703125, 5.8427734375, 6.559326171875, 7.27587890625, 7.992431640625, 8.708984375, 9.425537109375, 10.14208984375, 10.858642578125, 11.5751953125, 12.291748046875, 13.00830078125, 13.724853515625, 14.44140625, 15.157958984375, 15.87451171875, 16.591064453125, 17.3076171875, 18.024169921875, 18.74072265625, 19.457275390625, 20.173828125, 20.890380859375, 21.60693359375, 22.323486328125, 23.0400390625, 23.756591796875, 24.47314453125, 25.189697265625, 25.90625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 5.0, 6.0, 12.0, 11.0, 24.0, 35.0, 48.0, 81.0, 136.0, 236.0, 411.0, 763.0, 1714.0, 3716.0, 9850.0, 30519.0, 113939.0, 631318.0, 185969.0, 46125.0, 14066.0, 5099.0, 2201.0, 1023.0, 571.0, 270.0, 155.0, 75.0, 58.0, 40.0, 18.0, 17.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.91015625, -4.75982666015625, -4.6094970703125, -4.45916748046875, -4.308837890625, -4.15850830078125, -4.0081787109375, -3.85784912109375, -3.70751953125, -3.55718994140625, -3.4068603515625, -3.25653076171875, -3.106201171875, -2.95587158203125, -2.8055419921875, -2.65521240234375, -2.5048828125, -2.35455322265625, -2.2042236328125, -2.05389404296875, -1.903564453125, -1.75323486328125, -1.6029052734375, -1.45257568359375, -1.30224609375, -1.15191650390625, -1.0015869140625, -0.85125732421875, -0.700927734375, -0.55059814453125, -0.4002685546875, -0.24993896484375, -0.099609375, 0.05072021484375, 0.2010498046875, 0.35137939453125, 0.501708984375, 0.65203857421875, 0.8023681640625, 0.95269775390625, 1.10302734375, 1.25335693359375, 1.4036865234375, 1.55401611328125, 1.704345703125, 1.85467529296875, 2.0050048828125, 2.15533447265625, 2.3056640625, 2.45599365234375, 2.6063232421875, 2.75665283203125, 2.906982421875, 3.05731201171875, 3.2076416015625, 3.35797119140625, 3.50830078125, 3.65863037109375, 3.8089599609375, 3.95928955078125, 4.109619140625, 4.25994873046875, 4.4102783203125, 4.56060791015625, 4.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 11.0, 15.0, 18.0, 18.0, 18.0, 35.0, 41.0, 39.0, 51.0, 90.0, 132.0, 135.0, 97.0, 57.0, 41.0, 31.0, 22.0, 21.0, 12.0, 14.0, 20.0, 13.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016345977783203125, -0.0015864968299865723, -0.001538395881652832, -0.0014902949333190918, -0.0014421939849853516, -0.0013940930366516113, -0.001345992088317871, -0.0012978911399841309, -0.0012497901916503906, -0.0012016892433166504, -0.0011535882949829102, -0.00110548734664917, -0.0010573863983154297, -0.0010092854499816895, -0.0009611845016479492, -0.000913083553314209, -0.0008649826049804688, -0.0008168816566467285, -0.0007687807083129883, -0.000720679759979248, -0.0006725788116455078, -0.0006244778633117676, -0.0005763769149780273, -0.0005282759666442871, -0.0004801750183105469, -0.00043207406997680664, -0.0003839731216430664, -0.00033587217330932617, -0.00028777122497558594, -0.0002396702766418457, -0.00019156932830810547, -0.00014346837997436523, -9.5367431640625e-05, -4.7266483306884766e-05, 8.344650268554688e-07, 4.89354133605957e-05, 9.703636169433594e-05, 0.00014513731002807617, 0.0001932382583618164, 0.00024133920669555664, 0.0002894401550292969, 0.0003375411033630371, 0.00038564205169677734, 0.0004337430000305176, 0.0004818439483642578, 0.000529944896697998, 0.0005780458450317383, 0.0006261467933654785, 0.0006742477416992188, 0.000722348690032959, 0.0007704496383666992, 0.0008185505867004395, 0.0008666515350341797, 0.0009147524833679199, 0.0009628534317016602, 0.0010109543800354004, 0.0010590553283691406, 0.0011071562767028809, 0.001155257225036621, 0.0012033581733703613, 0.0012514591217041016, 0.0012995600700378418, 0.001347661018371582, 0.0013957619667053223, 0.0014438629150390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 17.0, 20.0, 19.0, 25.0, 41.0, 48.0, 89.0, 109.0, 162.0, 219.0, 363.0, 551.0, 864.0, 1411.0, 2640.0, 6021.0, 17514.0, 72385.0, 509685.0, 344666.0, 64006.0, 16013.0, 5468.0, 2490.0, 1347.0, 830.0, 485.0, 325.0, 207.0, 151.0, 101.0, 66.0, 46.0, 36.0, 21.0, 24.0, 11.0, 14.0, 4.0, 9.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.2421875, -4.1005859375, -3.958984375, -3.8173828125, -3.67578125, -3.5341796875, -3.392578125, -3.2509765625, -3.109375, -2.9677734375, -2.826171875, -2.6845703125, -2.54296875, -2.4013671875, -2.259765625, -2.1181640625, -1.9765625, -1.8349609375, -1.693359375, -1.5517578125, -1.41015625, -1.2685546875, -1.126953125, -0.9853515625, -0.84375, -0.7021484375, -0.560546875, -0.4189453125, -0.27734375, -0.1357421875, 0.005859375, 0.1474609375, 0.2890625, 0.4306640625, 0.572265625, 0.7138671875, 0.85546875, 0.9970703125, 1.138671875, 1.2802734375, 1.421875, 1.5634765625, 1.705078125, 1.8466796875, 1.98828125, 2.1298828125, 2.271484375, 2.4130859375, 2.5546875, 2.6962890625, 2.837890625, 2.9794921875, 3.12109375, 3.2626953125, 3.404296875, 3.5458984375, 3.6875, 3.8291015625, 3.970703125, 4.1123046875, 4.25390625, 4.3955078125, 4.537109375, 4.6787109375, 4.8203125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 6.0, 7.0, 8.0, 11.0, 9.0, 18.0, 12.0, 16.0, 23.0, 20.0, 29.0, 26.0, 31.0, 41.0, 48.0, 54.0, 88.0, 60.0, 48.0, 65.0, 44.0, 53.0, 47.0, 33.0, 26.0, 23.0, 20.0, 21.0, 16.0, 14.0, 10.0, 13.0, 7.0, 13.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.3671875, -4.2401123046875, -4.113037109375, -3.9859619140625, -3.85888671875, -3.7318115234375, -3.604736328125, -3.4776611328125, -3.3505859375, -3.2235107421875, -3.096435546875, -2.9693603515625, -2.84228515625, -2.7152099609375, -2.588134765625, -2.4610595703125, -2.333984375, -2.2069091796875, -2.079833984375, -1.9527587890625, -1.82568359375, -1.6986083984375, -1.571533203125, -1.4444580078125, -1.3173828125, -1.1903076171875, -1.063232421875, -0.9361572265625, -0.80908203125, -0.6820068359375, -0.554931640625, -0.4278564453125, -0.30078125, -0.1737060546875, -0.046630859375, 0.0804443359375, 0.20751953125, 0.3345947265625, 0.461669921875, 0.5887451171875, 0.7158203125, 0.8428955078125, 0.969970703125, 1.0970458984375, 1.22412109375, 1.3511962890625, 1.478271484375, 1.6053466796875, 1.732421875, 1.8594970703125, 1.986572265625, 2.1136474609375, 2.24072265625, 2.3677978515625, 2.494873046875, 2.6219482421875, 2.7490234375, 2.8760986328125, 3.003173828125, 3.1302490234375, 3.25732421875, 3.3843994140625, 3.511474609375, 3.6385498046875, 3.765625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 29.0, 90.0, 208.0, 399.0, 175.0, 52.0, 15.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-284.26275634765625, -276.82891845703125, -269.3950500488281, -261.9612121582031, -254.52734375, -247.093505859375, -239.65965270996094, -232.22579956054688, -224.7919464111328, -217.35809326171875, -209.9242401123047, -202.49038696289062, -195.05654907226562, -187.6226806640625, -180.1888427734375, -172.75498962402344, -165.32113647460938, -157.8872833251953, -150.45343017578125, -143.0195770263672, -135.58572387695312, -128.15188598632812, -120.71803283691406, -113.2841796875, -105.85032653808594, -98.41647338867188, -90.98262023925781, -83.54877471923828, -76.11492156982422, -68.68106842041016, -61.24721908569336, -53.81336975097656, -46.3795166015625, -38.94566345214844, -31.51181411743164, -24.07796287536621, -16.64411163330078, -9.210258483886719, -1.7764091491699219, 5.657440185546875, 13.091293334960938, 20.525144577026367, 27.958995819091797, 35.392845153808594, 42.826698303222656, 50.26055145263672, 57.694400787353516, 65.12825012207031, 72.56210327148438, 79.99595642089844, 87.4298095703125, 94.86365509033203, 102.2975082397461, 109.73136138916016, 117.16520690917969, 124.59906005859375, 132.0329132080078, 139.46676635742188, 146.90061950683594, 154.33447265625, 161.768310546875, 169.20217895507812, 176.63601684570312, 184.0698699951172, 191.50372314453125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 3.0, 3.0, 11.0, 9.0, 10.0, 16.0, 17.0, 22.0, 18.0, 15.0, 21.0, 34.0, 22.0, 28.0, 29.0, 40.0, 40.0, 43.0, 50.0, 58.0, 53.0, 55.0, 47.0, 31.0, 41.0, 31.0, 21.0, 33.0, 22.0, 24.0, 15.0, 23.0, 19.0, 11.0, 12.0, 12.0, 9.0, 10.0, 6.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-59.611419677734375, -57.745235443115234, -55.87905502319336, -54.01287078857422, -52.146690368652344, -50.2805061340332, -48.41432189941406, -46.54814147949219, -44.68195724487305, -42.815773010253906, -40.94959259033203, -39.08340835571289, -37.21722412109375, -35.351043701171875, -33.484859466552734, -31.618677139282227, -29.75249481201172, -27.88631248474121, -26.020130157470703, -24.153945922851562, -22.287763595581055, -20.421581268310547, -18.555397033691406, -16.6892147064209, -14.82303237915039, -12.956850051879883, -11.090666770935059, -9.224483489990234, -7.358301162719727, -5.492118835449219, -3.6259355545043945, -1.7597522735595703, 0.10643386840820312, 1.9726166725158691, 3.838799476623535, 5.704982280731201, 7.571165084838867, 9.437347412109375, 11.3035306930542, 13.169713973999023, 15.035896301269531, 16.90207862854004, 18.768260955810547, 20.634445190429688, 22.500627517700195, 24.366809844970703, 26.232994079589844, 28.09917640686035, 29.96535873413086, 31.831541061401367, 33.697723388671875, 35.563907623291016, 37.430091857910156, 39.29627227783203, 41.16245651245117, 43.02864074707031, 44.89482116699219, 46.76100540161133, 48.6271858215332, 50.493370056152344, 52.35955047607422, 54.22573471069336, 56.0919189453125, 57.958099365234375, 59.824283599853516]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 16.0, 21.0, 14.0, 34.0, 67.0, 91.0, 127.0, 182.0, 324.0, 448.0, 726.0, 1214.0, 2088.0, 3686.0, 6490.0, 12609.0, 24156.0, 50790.0, 122208.0, 346905.0, 1059430.0, 1547012.0, 643585.0, 213720.0, 82711.0, 36761.0, 18010.0, 9219.0, 4966.0, 2702.0, 1564.0, 883.0, 577.0, 336.0, 204.0, 137.0, 84.0, 54.0, 40.0, 27.0, 11.0, 13.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.122802734375, -3.02294921875, -2.923095703125, -2.8232421875, -2.723388671875, -2.62353515625, -2.523681640625, -2.423828125, -2.323974609375, -2.22412109375, -2.124267578125, -2.0244140625, -1.924560546875, -1.82470703125, -1.724853515625, -1.625, -1.525146484375, -1.42529296875, -1.325439453125, -1.2255859375, -1.125732421875, -1.02587890625, -0.926025390625, -0.826171875, -0.726318359375, -0.62646484375, -0.526611328125, -0.4267578125, -0.326904296875, -0.22705078125, -0.127197265625, -0.02734375, 0.072509765625, 0.17236328125, 0.272216796875, 0.3720703125, 0.471923828125, 0.57177734375, 0.671630859375, 0.771484375, 0.871337890625, 0.97119140625, 1.071044921875, 1.1708984375, 1.270751953125, 1.37060546875, 1.470458984375, 1.5703125, 1.670166015625, 1.77001953125, 1.869873046875, 1.9697265625, 2.069580078125, 2.16943359375, 2.269287109375, 2.369140625, 2.468994140625, 2.56884765625, 2.668701171875, 2.7685546875, 2.868408203125, 2.96826171875, 3.068115234375, 3.16796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 9.0, 9.0, 11.0, 19.0, 23.0, 17.0, 33.0, 42.0, 49.0, 50.0, 54.0, 52.0, 63.0, 66.0, 58.0, 65.0, 54.0, 51.0, 48.0, 55.0, 21.0, 29.0, 28.0, 23.0, 19.0, 14.0, 10.0, 5.0, 11.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.96484375, -4.81903076171875, -4.6732177734375, -4.52740478515625, -4.381591796875, -4.23577880859375, -4.0899658203125, -3.94415283203125, -3.79833984375, -3.65252685546875, -3.5067138671875, -3.36090087890625, -3.215087890625, -3.06927490234375, -2.9234619140625, -2.77764892578125, -2.6318359375, -2.48602294921875, -2.3402099609375, -2.19439697265625, -2.048583984375, -1.90277099609375, -1.7569580078125, -1.61114501953125, -1.46533203125, -1.31951904296875, -1.1737060546875, -1.02789306640625, -0.882080078125, -0.73626708984375, -0.5904541015625, -0.44464111328125, -0.298828125, -0.15301513671875, -0.0072021484375, 0.13861083984375, 0.284423828125, 0.43023681640625, 0.5760498046875, 0.72186279296875, 0.86767578125, 1.01348876953125, 1.1593017578125, 1.30511474609375, 1.450927734375, 1.59674072265625, 1.7425537109375, 1.88836669921875, 2.0341796875, 2.17999267578125, 2.3258056640625, 2.47161865234375, 2.617431640625, 2.76324462890625, 2.9090576171875, 3.05487060546875, 3.20068359375, 3.34649658203125, 3.4923095703125, 3.63812255859375, 3.783935546875, 3.92974853515625, 4.0755615234375, 4.22137451171875, 4.3671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 22.0, 26.0, 41.0, 88.0, 121.0, 219.0, 409.0, 976.0, 3273.0, 21183.0, 365694.0, 3612867.0, 171589.0, 13899.0, 2523.0, 718.0, 313.0, 132.0, 78.0, 46.0, 18.0, 12.0, 7.0, 7.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.3243408203125, -13.781494140625, -13.2386474609375, -12.69580078125, -12.1529541015625, -11.610107421875, -11.0672607421875, -10.5244140625, -9.9815673828125, -9.438720703125, -8.8958740234375, -8.35302734375, -7.8101806640625, -7.267333984375, -6.7244873046875, -6.181640625, -5.6387939453125, -5.095947265625, -4.5531005859375, -4.01025390625, -3.4674072265625, -2.924560546875, -2.3817138671875, -1.8388671875, -1.2960205078125, -0.753173828125, -0.2103271484375, 0.33251953125, 0.8753662109375, 1.418212890625, 1.9610595703125, 2.50390625, 3.0467529296875, 3.589599609375, 4.1324462890625, 4.67529296875, 5.2181396484375, 5.760986328125, 6.3038330078125, 6.8466796875, 7.3895263671875, 7.932373046875, 8.4752197265625, 9.01806640625, 9.5609130859375, 10.103759765625, 10.6466064453125, 11.189453125, 11.7322998046875, 12.275146484375, 12.8179931640625, 13.36083984375, 13.9036865234375, 14.446533203125, 14.9893798828125, 15.5322265625, 16.0750732421875, 16.617919921875, 17.1607666015625, 17.70361328125, 18.2464599609375, 18.789306640625, 19.3321533203125, 19.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 4.0, 5.0, 6.0, 15.0, 17.0, 25.0, 42.0, 78.0, 118.0, 239.0, 399.0, 789.0, 947.0, 612.0, 301.0, 185.0, 115.0, 61.0, 42.0, 28.0, 14.0, 13.0, 9.0, 3.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.1875, -19.6732177734375, -19.158935546875, -18.6446533203125, -18.13037109375, -17.6160888671875, -17.101806640625, -16.5875244140625, -16.0732421875, -15.5589599609375, -15.044677734375, -14.5303955078125, -14.01611328125, -13.5018310546875, -12.987548828125, -12.4732666015625, -11.958984375, -11.4447021484375, -10.930419921875, -10.4161376953125, -9.90185546875, -9.3875732421875, -8.873291015625, -8.3590087890625, -7.8447265625, -7.3304443359375, -6.816162109375, -6.3018798828125, -5.78759765625, -5.2733154296875, -4.759033203125, -4.2447509765625, -3.73046875, -3.2161865234375, -2.701904296875, -2.1876220703125, -1.67333984375, -1.1590576171875, -0.644775390625, -0.1304931640625, 0.3837890625, 0.8980712890625, 1.412353515625, 1.9266357421875, 2.44091796875, 2.9552001953125, 3.469482421875, 3.9837646484375, 4.498046875, 5.0123291015625, 5.526611328125, 6.0408935546875, 6.55517578125, 7.0694580078125, 7.583740234375, 8.0980224609375, 8.6123046875, 9.1265869140625, 9.640869140625, 10.1551513671875, 10.66943359375, 11.1837158203125, 11.697998046875, 12.2122802734375, 12.7265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 25.0, 115.0, 198.0, 287.0, 201.0, 85.0, 25.0, 25.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-198.02877807617188, -192.569580078125, -187.11038208007812, -181.6511688232422, -176.1919708251953, -170.73277282714844, -165.2735595703125, -159.81436157226562, -154.35516357421875, -148.89596557617188, -143.436767578125, -137.97755432128906, -132.5183563232422, -127.05915832519531, -121.5999526977539, -116.1407470703125, -110.68154907226562, -105.22235107421875, -99.76314544677734, -94.30393981933594, -88.84474182128906, -83.38554382324219, -77.92633819580078, -72.46713256835938, -67.0079345703125, -61.54873275756836, -56.08953094482422, -50.63032913208008, -45.17112731933594, -39.7119255065918, -34.252723693847656, -28.793521881103516, -23.334320068359375, -17.875118255615234, -12.415916442871094, -6.956714630126953, -1.4975128173828125, 3.961688995361328, 9.420890808105469, 14.88009262084961, 20.33929443359375, 25.79849624633789, 31.25769805908203, 36.71689987182617, 42.17610168457031, 47.63530349731445, 53.094505310058594, 58.553707122802734, 64.01290893554688, 69.47210693359375, 74.93131256103516, 80.39051818847656, 85.84971618652344, 91.30891418457031, 96.76811981201172, 102.22732543945312, 107.6865234375, 113.14572143554688, 118.60492706298828, 124.06413269042969, 129.52333068847656, 134.98252868652344, 140.44174194335938, 145.90093994140625, 151.36013793945312]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 7.0, 17.0, 17.0, 28.0, 25.0, 40.0, 58.0, 74.0, 55.0, 56.0, 70.0, 68.0, 63.0, 64.0, 63.0, 53.0, 47.0, 45.0, 45.0, 23.0, 21.0, 12.0, 12.0, 10.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3060073852539, -87.77186584472656, -85.23771667480469, -82.70357513427734, -80.16943359375, -77.63528442382812, -75.10114288330078, -72.56700134277344, -70.03285217285156, -67.49871063232422, -64.96456146240234, -62.430419921875, -59.896278381347656, -57.36213302612305, -54.82798767089844, -52.293846130371094, -49.75970458984375, -47.22555923461914, -44.6914176940918, -42.15727233886719, -39.623130798339844, -37.088985443115234, -34.554840087890625, -32.02069854736328, -29.486553192138672, -26.952409744262695, -24.41826629638672, -21.88412094116211, -19.349977493286133, -16.815834045410156, -14.281689643859863, -11.74754524230957, -9.213401794433594, -6.679257869720459, -4.145113945007324, -1.6109700202941895, 0.9231739044189453, 3.457317352294922, 5.991461753845215, 8.525606155395508, 11.059749603271484, 13.593893051147461, 16.128036499023438, 18.662181854248047, 21.196325302124023, 23.73046875, 26.26461410522461, 28.798757553100586, 31.332901000976562, 33.86704635620117, 36.401187896728516, 38.935333251953125, 41.46947479248047, 44.00362014770508, 46.53776550292969, 49.07190704345703, 51.60605239868164, 54.14019775390625, 56.674339294433594, 59.2084846496582, 61.74263000488281, 64.27677154541016, 66.8109130859375, 69.34506225585938, 71.87920379638672]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 11.0, 15.0, 16.0, 20.0, 54.0, 57.0, 82.0, 128.0, 215.0, 285.0, 423.0, 696.0, 1077.0, 1639.0, 2712.0, 4356.0, 7343.0, 13486.0, 27255.0, 65028.0, 194534.0, 403872.0, 198913.0, 65858.0, 27332.0, 13775.0, 7558.0, 4386.0, 2611.0, 1687.0, 1088.0, 703.0, 455.0, 287.0, 196.0, 127.0, 71.0, 68.0, 39.0, 30.0, 17.0, 13.0, 12.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0], "bins": [-7.8125, -7.5985107421875, -7.384521484375, -7.1705322265625, -6.95654296875, -6.7425537109375, -6.528564453125, -6.3145751953125, -6.1005859375, -5.8865966796875, -5.672607421875, -5.4586181640625, -5.24462890625, -5.0306396484375, -4.816650390625, -4.6026611328125, -4.388671875, -4.1746826171875, -3.960693359375, -3.7467041015625, -3.53271484375, -3.3187255859375, -3.104736328125, -2.8907470703125, -2.6767578125, -2.4627685546875, -2.248779296875, -2.0347900390625, -1.82080078125, -1.6068115234375, -1.392822265625, -1.1788330078125, -0.96484375, -0.7508544921875, -0.536865234375, -0.3228759765625, -0.10888671875, 0.1051025390625, 0.319091796875, 0.5330810546875, 0.7470703125, 0.9610595703125, 1.175048828125, 1.3890380859375, 1.60302734375, 1.8170166015625, 2.031005859375, 2.2449951171875, 2.458984375, 2.6729736328125, 2.886962890625, 3.1009521484375, 3.31494140625, 3.5289306640625, 3.742919921875, 3.9569091796875, 4.1708984375, 4.3848876953125, 4.598876953125, 4.8128662109375, 5.02685546875, 5.2408447265625, 5.454833984375, 5.6688232421875, 5.8828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 12.0, 16.0, 16.0, 38.0, 19.0, 42.0, 41.0, 37.0, 38.0, 43.0, 47.0, 55.0, 49.0, 53.0, 52.0, 41.0, 48.0, 38.0, 38.0, 32.0, 32.0, 29.0, 23.0, 16.0, 14.0, 10.0, 9.0, 17.0, 6.0, 8.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.8828125, -4.756072998046875, -4.62933349609375, -4.502593994140625, -4.3758544921875, -4.249114990234375, -4.12237548828125, -3.995635986328125, -3.868896484375, -3.742156982421875, -3.61541748046875, -3.488677978515625, -3.3619384765625, -3.235198974609375, -3.10845947265625, -2.981719970703125, -2.85498046875, -2.728240966796875, -2.60150146484375, -2.474761962890625, -2.3480224609375, -2.221282958984375, -2.09454345703125, -1.967803955078125, -1.841064453125, -1.714324951171875, -1.58758544921875, -1.460845947265625, -1.3341064453125, -1.207366943359375, -1.08062744140625, -0.953887939453125, -0.8271484375, -0.700408935546875, -0.57366943359375, -0.446929931640625, -0.3201904296875, -0.193450927734375, -0.06671142578125, 0.060028076171875, 0.186767578125, 0.313507080078125, 0.44024658203125, 0.566986083984375, 0.6937255859375, 0.820465087890625, 0.94720458984375, 1.073944091796875, 1.20068359375, 1.327423095703125, 1.45416259765625, 1.580902099609375, 1.7076416015625, 1.834381103515625, 1.96112060546875, 2.087860107421875, 2.214599609375, 2.341339111328125, 2.46807861328125, 2.594818115234375, 2.7215576171875, 2.848297119140625, 2.97503662109375, 3.101776123046875, 3.228515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 8.0, 9.0, 11.0, 14.0, 20.0, 35.0, 50.0, 58.0, 87.0, 139.0, 197.0, 298.0, 509.0, 864.0, 1865.0, 4809.0, 17223.0, 114820.0, 798177.0, 86631.0, 14757.0, 4182.0, 1619.0, 832.0, 422.0, 284.0, 187.0, 130.0, 100.0, 79.0, 40.0, 25.0, 19.0, 15.0, 8.0, 12.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.609375, -15.060546875, -14.51171875, -13.962890625, -13.4140625, -12.865234375, -12.31640625, -11.767578125, -11.21875, -10.669921875, -10.12109375, -9.572265625, -9.0234375, -8.474609375, -7.92578125, -7.376953125, -6.828125, -6.279296875, -5.73046875, -5.181640625, -4.6328125, -4.083984375, -3.53515625, -2.986328125, -2.4375, -1.888671875, -1.33984375, -0.791015625, -0.2421875, 0.306640625, 0.85546875, 1.404296875, 1.953125, 2.501953125, 3.05078125, 3.599609375, 4.1484375, 4.697265625, 5.24609375, 5.794921875, 6.34375, 6.892578125, 7.44140625, 7.990234375, 8.5390625, 9.087890625, 9.63671875, 10.185546875, 10.734375, 11.283203125, 11.83203125, 12.380859375, 12.9296875, 13.478515625, 14.02734375, 14.576171875, 15.125, 15.673828125, 16.22265625, 16.771484375, 17.3203125, 17.869140625, 18.41796875, 18.966796875, 19.515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 3.0, 4.0, 6.0, 10.0, 14.0, 9.0, 26.0, 13.0, 21.0, 29.0, 30.0, 37.0, 36.0, 40.0, 51.0, 57.0, 44.0, 52.0, 64.0, 43.0, 54.0, 59.0, 54.0, 32.0, 41.0, 26.0, 26.0, 23.0, 23.0, 8.0, 17.0, 10.0, 5.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8046875, -15.2122802734375, -14.619873046875, -14.0274658203125, -13.43505859375, -12.8426513671875, -12.250244140625, -11.6578369140625, -11.0654296875, -10.4730224609375, -9.880615234375, -9.2882080078125, -8.69580078125, -8.1033935546875, -7.510986328125, -6.9185791015625, -6.326171875, -5.7337646484375, -5.141357421875, -4.5489501953125, -3.95654296875, -3.3641357421875, -2.771728515625, -2.1793212890625, -1.5869140625, -0.9945068359375, -0.402099609375, 0.1903076171875, 0.78271484375, 1.3751220703125, 1.967529296875, 2.5599365234375, 3.15234375, 3.7447509765625, 4.337158203125, 4.9295654296875, 5.52197265625, 6.1143798828125, 6.706787109375, 7.2991943359375, 7.8916015625, 8.4840087890625, 9.076416015625, 9.6688232421875, 10.26123046875, 10.8536376953125, 11.446044921875, 12.0384521484375, 12.630859375, 13.2232666015625, 13.815673828125, 14.4080810546875, 15.00048828125, 15.5928955078125, 16.185302734375, 16.7777099609375, 17.3701171875, 17.9625244140625, 18.554931640625, 19.1473388671875, 19.73974609375, 20.3321533203125, 20.924560546875, 21.5169677734375, 22.109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 16.0, 19.0, 31.0, 28.0, 52.0, 62.0, 115.0, 180.0, 301.0, 402.0, 810.0, 1450.0, 3123.0, 7384.0, 20682.0, 68854.0, 302890.0, 517635.0, 83837.0, 24733.0, 8511.0, 3566.0, 1674.0, 872.0, 463.0, 269.0, 184.0, 136.0, 78.0, 42.0, 32.0, 29.0, 13.0, 16.0, 9.0, 9.0, 7.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1484375, -4.010498046875, -3.87255859375, -3.734619140625, -3.5966796875, -3.458740234375, -3.32080078125, -3.182861328125, -3.044921875, -2.906982421875, -2.76904296875, -2.631103515625, -2.4931640625, -2.355224609375, -2.21728515625, -2.079345703125, -1.94140625, -1.803466796875, -1.66552734375, -1.527587890625, -1.3896484375, -1.251708984375, -1.11376953125, -0.975830078125, -0.837890625, -0.699951171875, -0.56201171875, -0.424072265625, -0.2861328125, -0.148193359375, -0.01025390625, 0.127685546875, 0.265625, 0.403564453125, 0.54150390625, 0.679443359375, 0.8173828125, 0.955322265625, 1.09326171875, 1.231201171875, 1.369140625, 1.507080078125, 1.64501953125, 1.782958984375, 1.9208984375, 2.058837890625, 2.19677734375, 2.334716796875, 2.47265625, 2.610595703125, 2.74853515625, 2.886474609375, 3.0244140625, 3.162353515625, 3.30029296875, 3.438232421875, 3.576171875, 3.714111328125, 3.85205078125, 3.989990234375, 4.1279296875, 4.265869140625, 4.40380859375, 4.541748046875, 4.6796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 5.0, 9.0, 16.0, 17.0, 22.0, 24.0, 32.0, 64.0, 58.0, 103.0, 132.0, 147.0, 102.0, 69.0, 34.0, 35.0, 24.0, 19.0, 18.0, 9.0, 10.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014925003051757812, -0.0014423727989196777, -0.0013922452926635742, -0.0013421177864074707, -0.0012919902801513672, -0.0012418627738952637, -0.0011917352676391602, -0.0011416077613830566, -0.0010914802551269531, -0.0010413527488708496, -0.000991225242614746, -0.0009410977363586426, -0.0008909702301025391, -0.0008408427238464355, -0.000790715217590332, -0.0007405877113342285, -0.000690460205078125, -0.0006403326988220215, -0.000590205192565918, -0.0005400776863098145, -0.0004899501800537109, -0.0004398226737976074, -0.0003896951675415039, -0.0003395676612854004, -0.0002894401550292969, -0.00023931264877319336, -0.00018918514251708984, -0.00013905763626098633, -8.893013000488281e-05, -3.88026237487793e-05, 1.1324882507324219e-05, 6.145238876342773e-05, 0.00011157989501953125, 0.00016170740127563477, 0.00021183490753173828, 0.0002619624137878418, 0.0003120899200439453, 0.00036221742630004883, 0.00041234493255615234, 0.00046247243881225586, 0.0005125999450683594, 0.0005627274513244629, 0.0006128549575805664, 0.0006629824638366699, 0.0007131099700927734, 0.000763237476348877, 0.0008133649826049805, 0.000863492488861084, 0.0009136199951171875, 0.000963747501373291, 0.0010138750076293945, 0.001064002513885498, 0.0011141300201416016, 0.001164257526397705, 0.0012143850326538086, 0.0012645125389099121, 0.0013146400451660156, 0.0013647675514221191, 0.0014148950576782227, 0.0014650225639343262, 0.0015151500701904297, 0.0015652775764465332, 0.0016154050827026367, 0.0016655325889587402, 0.0017156600952148438]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 14.0, 19.0, 33.0, 63.0, 136.0, 218.0, 663.0, 1933.0, 10396.0, 238324.0, 772006.0, 20252.0, 3012.0, 850.0, 315.0, 128.0, 58.0, 40.0, 21.0, 21.0, 12.0, 7.0, 3.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.671875, -11.3087158203125, -10.945556640625, -10.5823974609375, -10.21923828125, -9.8560791015625, -9.492919921875, -9.1297607421875, -8.7666015625, -8.4034423828125, -8.040283203125, -7.6771240234375, -7.31396484375, -6.9508056640625, -6.587646484375, -6.2244873046875, -5.861328125, -5.4981689453125, -5.135009765625, -4.7718505859375, -4.40869140625, -4.0455322265625, -3.682373046875, -3.3192138671875, -2.9560546875, -2.5928955078125, -2.229736328125, -1.8665771484375, -1.50341796875, -1.1402587890625, -0.777099609375, -0.4139404296875, -0.05078125, 0.3123779296875, 0.675537109375, 1.0386962890625, 1.40185546875, 1.7650146484375, 2.128173828125, 2.4913330078125, 2.8544921875, 3.2176513671875, 3.580810546875, 3.9439697265625, 4.30712890625, 4.6702880859375, 5.033447265625, 5.3966064453125, 5.759765625, 6.1229248046875, 6.486083984375, 6.8492431640625, 7.21240234375, 7.5755615234375, 7.938720703125, 8.3018798828125, 8.6650390625, 9.0281982421875, 9.391357421875, 9.7545166015625, 10.11767578125, 10.4808349609375, 10.843994140625, 11.2071533203125, 11.5703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 10.0, 11.0, 13.0, 16.0, 29.0, 24.0, 33.0, 55.0, 59.0, 82.0, 80.0, 97.0, 104.0, 75.0, 66.0, 54.0, 43.0, 23.0, 24.0, 14.0, 16.0, 12.0, 9.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.0390625, -5.869873046875, -5.70068359375, -5.531494140625, -5.3623046875, -5.193115234375, -5.02392578125, -4.854736328125, -4.685546875, -4.516357421875, -4.34716796875, -4.177978515625, -4.0087890625, -3.839599609375, -3.67041015625, -3.501220703125, -3.33203125, -3.162841796875, -2.99365234375, -2.824462890625, -2.6552734375, -2.486083984375, -2.31689453125, -2.147705078125, -1.978515625, -1.809326171875, -1.64013671875, -1.470947265625, -1.3017578125, -1.132568359375, -0.96337890625, -0.794189453125, -0.625, -0.455810546875, -0.28662109375, -0.117431640625, 0.0517578125, 0.220947265625, 0.39013671875, 0.559326171875, 0.728515625, 0.897705078125, 1.06689453125, 1.236083984375, 1.4052734375, 1.574462890625, 1.74365234375, 1.912841796875, 2.08203125, 2.251220703125, 2.42041015625, 2.589599609375, 2.7587890625, 2.927978515625, 3.09716796875, 3.266357421875, 3.435546875, 3.604736328125, 3.77392578125, 3.943115234375, 4.1123046875, 4.281494140625, 4.45068359375, 4.619873046875, 4.7890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 13.0, 66.0, 201.0, 464.0, 176.0, 52.0, 12.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-319.15911865234375, -311.2900085449219, -303.4208679199219, -295.5517578125, -287.6826477050781, -279.81353759765625, -271.94439697265625, -264.0752868652344, -256.2061767578125, -248.33705139160156, -240.4679412841797, -232.59881591796875, -224.72970581054688, -216.86058044433594, -208.991455078125, -201.12234497070312, -193.25320434570312, -185.3840789794922, -177.5149688720703, -169.64584350585938, -161.7767333984375, -153.90760803222656, -146.03848266601562, -138.16937255859375, -130.3002471923828, -122.4311294555664, -114.56201171875, -106.69288635253906, -98.82376861572266, -90.95465087890625, -83.08552551269531, -75.2164077758789, -67.3472900390625, -59.478172302246094, -51.60905075073242, -43.73992919921875, -35.870811462402344, -28.001693725585938, -20.132572174072266, -12.263450622558594, -4.3943328857421875, 3.4747867584228516, 11.34390640258789, 19.21302604675293, 27.08214569091797, 34.951263427734375, 42.82038497924805, 50.68950653076172, 58.558624267578125, 66.42774200439453, 74.29685974121094, 82.16598510742188, 90.03510284423828, 97.90422058105469, 105.77334594726562, 113.64246368408203, 121.51158142089844, 129.38070678710938, 137.24981689453125, 145.1189422607422, 152.98806762695312, 160.857177734375, 168.72630310058594, 176.59542846679688, 184.46453857421875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 5.0, 13.0, 16.0, 13.0, 13.0, 21.0, 29.0, 23.0, 27.0, 26.0, 32.0, 34.0, 43.0, 46.0, 59.0, 68.0, 72.0, 74.0, 48.0, 38.0, 34.0, 32.0, 36.0, 24.0, 22.0, 22.0, 20.0, 11.0, 14.0, 13.0, 14.0, 12.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.67729949951172, -71.43338012695312, -69.189453125, -66.94552612304688, -64.70160675048828, -62.45768356323242, -60.21376037597656, -57.9698371887207, -55.725914001464844, -53.481990814208984, -51.238067626953125, -48.994144439697266, -46.750221252441406, -44.50629806518555, -42.26237487792969, -40.01845169067383, -37.77452850341797, -35.53060531616211, -33.28668212890625, -31.04275894165039, -28.79883575439453, -26.554912567138672, -24.310989379882812, -22.067066192626953, -19.823143005371094, -17.579219818115234, -15.335296630859375, -13.091373443603516, -10.847450256347656, -8.603527069091797, -6.3596038818359375, -4.115680694580078, -1.8717498779296875, 0.3721733093261719, 2.6160964965820312, 4.860019683837891, 7.10394287109375, 9.34786605834961, 11.591789245605469, 13.835712432861328, 16.079635620117188, 18.323558807373047, 20.567481994628906, 22.811405181884766, 25.055328369140625, 27.299251556396484, 29.543174743652344, 31.787097930908203, 34.03102111816406, 36.27494430541992, 38.51886749267578, 40.76279067993164, 43.0067138671875, 45.25063705444336, 47.49456024169922, 49.73848342895508, 51.98240661621094, 54.2263298034668, 56.470252990722656, 58.714176177978516, 60.958099365234375, 63.202022552490234, 65.4459457397461, 67.68986511230469, 69.93379211425781]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 14.0, 15.0, 28.0, 33.0, 51.0, 84.0, 102.0, 188.0, 214.0, 382.0, 670.0, 1016.0, 1834.0, 3406.0, 6670.0, 14670.0, 37264.0, 118688.0, 524784.0, 2030495.0, 1114178.0, 232948.0, 63624.0, 22595.0, 9814.0, 4733.0, 2433.0, 1270.0, 785.0, 475.0, 284.0, 154.0, 112.0, 84.0, 53.0, 37.0, 27.0, 14.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.9375, -4.799346923828125, -4.66119384765625, -4.523040771484375, -4.3848876953125, -4.246734619140625, -4.10858154296875, -3.970428466796875, -3.832275390625, -3.694122314453125, -3.55596923828125, -3.417816162109375, -3.2796630859375, -3.141510009765625, -3.00335693359375, -2.865203857421875, -2.72705078125, -2.588897705078125, -2.45074462890625, -2.312591552734375, -2.1744384765625, -2.036285400390625, -1.89813232421875, -1.759979248046875, -1.621826171875, -1.483673095703125, -1.34552001953125, -1.207366943359375, -1.0692138671875, -0.931060791015625, -0.79290771484375, -0.654754638671875, -0.5166015625, -0.378448486328125, -0.24029541015625, -0.102142333984375, 0.0360107421875, 0.174163818359375, 0.31231689453125, 0.450469970703125, 0.588623046875, 0.726776123046875, 0.86492919921875, 1.003082275390625, 1.1412353515625, 1.279388427734375, 1.41754150390625, 1.555694580078125, 1.69384765625, 1.832000732421875, 1.97015380859375, 2.108306884765625, 2.2464599609375, 2.384613037109375, 2.52276611328125, 2.660919189453125, 2.799072265625, 2.937225341796875, 3.07537841796875, 3.213531494140625, 3.3516845703125, 3.489837646484375, 3.62799072265625, 3.766143798828125, 3.904296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 7.0, 0.0, 4.0, 6.0, 1.0, 2.0, 7.0, 11.0, 10.0, 11.0, 11.0, 9.0, 12.0, 27.0, 18.0, 21.0, 26.0, 19.0, 44.0, 47.0, 41.0, 44.0, 51.0, 43.0, 56.0, 39.0, 42.0, 51.0, 45.0, 41.0, 35.0, 36.0, 24.0, 24.0, 26.0, 21.0, 16.0, 20.0, 12.0, 8.0, 9.0, 7.0, 6.0, 6.0, 4.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.115020751953125, -2.99761962890625, -2.880218505859375, -2.7628173828125, -2.645416259765625, -2.52801513671875, -2.410614013671875, -2.293212890625, -2.175811767578125, -2.05841064453125, -1.941009521484375, -1.8236083984375, -1.706207275390625, -1.58880615234375, -1.471405029296875, -1.35400390625, -1.236602783203125, -1.11920166015625, -1.001800537109375, -0.8843994140625, -0.766998291015625, -0.64959716796875, -0.532196044921875, -0.414794921875, -0.297393798828125, -0.17999267578125, -0.062591552734375, 0.0548095703125, 0.172210693359375, 0.28961181640625, 0.407012939453125, 0.5244140625, 0.641815185546875, 0.75921630859375, 0.876617431640625, 0.9940185546875, 1.111419677734375, 1.22882080078125, 1.346221923828125, 1.463623046875, 1.581024169921875, 1.69842529296875, 1.815826416015625, 1.9332275390625, 2.050628662109375, 2.16802978515625, 2.285430908203125, 2.40283203125, 2.520233154296875, 2.63763427734375, 2.755035400390625, 2.8724365234375, 2.989837646484375, 3.10723876953125, 3.224639892578125, 3.342041015625, 3.459442138671875, 3.57684326171875, 3.694244384765625, 3.8116455078125, 3.929046630859375, 4.04644775390625, 4.163848876953125, 4.28125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 18.0, 14.0, 15.0, 27.0, 73.0, 125.0, 349.0, 894.0, 2976.0, 14999.0, 228731.0, 3808413.0, 123563.0, 10615.0, 2216.0, 690.0, 258.0, 126.0, 48.0, 40.0, 22.0, 16.0, 11.0, 9.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.666015625, -19.01953125, -18.373046875, -17.7265625, -17.080078125, -16.43359375, -15.787109375, -15.140625, -14.494140625, -13.84765625, -13.201171875, -12.5546875, -11.908203125, -11.26171875, -10.615234375, -9.96875, -9.322265625, -8.67578125, -8.029296875, -7.3828125, -6.736328125, -6.08984375, -5.443359375, -4.796875, -4.150390625, -3.50390625, -2.857421875, -2.2109375, -1.564453125, -0.91796875, -0.271484375, 0.375, 1.021484375, 1.66796875, 2.314453125, 2.9609375, 3.607421875, 4.25390625, 4.900390625, 5.546875, 6.193359375, 6.83984375, 7.486328125, 8.1328125, 8.779296875, 9.42578125, 10.072265625, 10.71875, 11.365234375, 12.01171875, 12.658203125, 13.3046875, 13.951171875, 14.59765625, 15.244140625, 15.890625, 16.537109375, 17.18359375, 17.830078125, 18.4765625, 19.123046875, 19.76953125, 20.416015625, 21.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 4.0, 6.0, 10.0, 20.0, 22.0, 28.0, 46.0, 54.0, 80.0, 126.0, 248.0, 540.0, 825.0, 785.0, 516.0, 314.0, 182.0, 83.0, 49.0, 41.0, 28.0, 11.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.28125, -15.8419189453125, -15.402587890625, -14.9632568359375, -14.52392578125, -14.0845947265625, -13.645263671875, -13.2059326171875, -12.7666015625, -12.3272705078125, -11.887939453125, -11.4486083984375, -11.00927734375, -10.5699462890625, -10.130615234375, -9.6912841796875, -9.251953125, -8.8126220703125, -8.373291015625, -7.9339599609375, -7.49462890625, -7.0552978515625, -6.615966796875, -6.1766357421875, -5.7373046875, -5.2979736328125, -4.858642578125, -4.4193115234375, -3.97998046875, -3.5406494140625, -3.101318359375, -2.6619873046875, -2.22265625, -1.7833251953125, -1.343994140625, -0.9046630859375, -0.46533203125, -0.0260009765625, 0.413330078125, 0.8526611328125, 1.2919921875, 1.7313232421875, 2.170654296875, 2.6099853515625, 3.04931640625, 3.4886474609375, 3.927978515625, 4.3673095703125, 4.806640625, 5.2459716796875, 5.685302734375, 6.1246337890625, 6.56396484375, 7.0032958984375, 7.442626953125, 7.8819580078125, 8.3212890625, 8.7606201171875, 9.199951171875, 9.6392822265625, 10.07861328125, 10.5179443359375, 10.957275390625, 11.3966064453125, 11.8359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 26.0, 162.0, 483.0, 264.0, 38.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-495.57635498046875, -485.1648864746094, -474.75341796875, -464.3419494628906, -453.93048095703125, -443.51898193359375, -433.1075134277344, -422.696044921875, -412.2845764160156, -401.87310791015625, -391.4616394042969, -381.0501708984375, -370.638671875, -360.2272033691406, -349.81573486328125, -339.4042663574219, -328.9927978515625, -318.5813293457031, -308.16986083984375, -297.7583923339844, -287.346923828125, -276.9354248046875, -266.5239562988281, -256.11248779296875, -245.70101928710938, -235.28955078125, -224.87808227539062, -214.4665985107422, -204.0551300048828, -193.64366149902344, -183.232177734375, -172.82070922851562, -162.40921020507812, -151.99774169921875, -141.58627319335938, -131.17478942871094, -120.76332092285156, -110.35185241699219, -99.94037628173828, -89.52890014648438, -79.117431640625, -68.70596313476562, -58.29448699951172, -47.88301467895508, -37.47154235839844, -27.060070037841797, -16.648597717285156, -6.23712158203125, 4.174346923828125, 14.585819244384766, 24.997291564941406, 35.40876388549805, 45.82023620605469, 56.23170852661133, 66.64318084716797, 77.05465698242188, 87.46612548828125, 97.87759399414062, 108.28907012939453, 118.70054626464844, 129.1120147705078, 139.5234832763672, 149.93496704101562, 160.346435546875, 170.75790405273438]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 7.0, 9.0, 8.0, 16.0, 13.0, 19.0, 14.0, 21.0, 21.0, 40.0, 27.0, 34.0, 37.0, 44.0, 40.0, 54.0, 46.0, 50.0, 53.0, 44.0, 48.0, 45.0, 47.0, 41.0, 39.0, 30.0, 30.0, 23.0, 15.0, 15.0, 7.0, 7.0, 13.0, 8.0, 10.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.40056610107422, -55.601078033447266, -53.80158996582031, -52.002105712890625, -50.20261764526367, -48.40312957763672, -46.60364532470703, -44.80415725708008, -43.004669189453125, -41.20518112182617, -39.40569305419922, -37.60620880126953, -35.80672073364258, -34.007232666015625, -32.20774841308594, -30.408260345458984, -28.60877227783203, -26.809284210205078, -25.009798049926758, -23.210311889648438, -21.410823822021484, -19.61133575439453, -17.81184959411621, -16.01236343383789, -14.212875366210938, -12.4133882522583, -10.613901138305664, -8.814414024353027, -7.014926910400391, -5.215439796447754, -3.415952682495117, -1.6164655685424805, 0.18302536010742188, 1.9825124740600586, 3.7819995880126953, 5.581486701965332, 7.380973815917969, 9.180460929870605, 10.979948043823242, 12.779435157775879, 14.578922271728516, 16.37841033935547, 18.17789649963379, 19.97738265991211, 21.776870727539062, 23.576358795166016, 25.375844955444336, 27.175331115722656, 28.97481918334961, 30.774307250976562, 32.57379150390625, 34.3732795715332, 36.172767639160156, 37.97225570678711, 39.77174377441406, 41.57122802734375, 43.3707160949707, 45.170204162597656, 46.969688415527344, 48.7691764831543, 50.56866455078125, 52.3681526184082, 54.167640686035156, 55.967124938964844, 57.7666130065918]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 5.0, 8.0, 17.0, 26.0, 46.0, 60.0, 87.0, 151.0, 226.0, 376.0, 612.0, 913.0, 1486.0, 2592.0, 4726.0, 9362.0, 21739.0, 62747.0, 201527.0, 398198.0, 226959.0, 70546.0, 23902.0, 10081.0, 5055.0, 2806.0, 1638.0, 986.0, 603.0, 387.0, 234.0, 158.0, 101.0, 72.0, 40.0, 24.0, 22.0, 11.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.25390625, -6.0780029296875, -5.902099609375, -5.7261962890625, -5.55029296875, -5.3743896484375, -5.198486328125, -5.0225830078125, -4.8466796875, -4.6707763671875, -4.494873046875, -4.3189697265625, -4.14306640625, -3.9671630859375, -3.791259765625, -3.6153564453125, -3.439453125, -3.2635498046875, -3.087646484375, -2.9117431640625, -2.73583984375, -2.5599365234375, -2.384033203125, -2.2081298828125, -2.0322265625, -1.8563232421875, -1.680419921875, -1.5045166015625, -1.32861328125, -1.1527099609375, -0.976806640625, -0.8009033203125, -0.625, -0.4490966796875, -0.273193359375, -0.0972900390625, 0.07861328125, 0.2545166015625, 0.430419921875, 0.6063232421875, 0.7822265625, 0.9581298828125, 1.134033203125, 1.3099365234375, 1.48583984375, 1.6617431640625, 1.837646484375, 2.0135498046875, 2.189453125, 2.3653564453125, 2.541259765625, 2.7171630859375, 2.89306640625, 3.0689697265625, 3.244873046875, 3.4207763671875, 3.5966796875, 3.7725830078125, 3.948486328125, 4.1243896484375, 4.30029296875, 4.4761962890625, 4.652099609375, 4.8280029296875, 5.00390625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 8.0, 7.0, 11.0, 12.0, 22.0, 25.0, 24.0, 24.0, 30.0, 39.0, 56.0, 40.0, 53.0, 60.0, 62.0, 71.0, 69.0, 53.0, 61.0, 62.0, 51.0, 40.0, 32.0, 22.0, 16.0, 15.0, 7.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.10247802734375, -4.9197998046875, -4.73712158203125, -4.554443359375, -4.37176513671875, -4.1890869140625, -4.00640869140625, -3.82373046875, -3.64105224609375, -3.4583740234375, -3.27569580078125, -3.093017578125, -2.91033935546875, -2.7276611328125, -2.54498291015625, -2.3623046875, -2.17962646484375, -1.9969482421875, -1.81427001953125, -1.631591796875, -1.44891357421875, -1.2662353515625, -1.08355712890625, -0.90087890625, -0.71820068359375, -0.5355224609375, -0.35284423828125, -0.170166015625, 0.01251220703125, 0.1951904296875, 0.37786865234375, 0.560546875, 0.74322509765625, 0.9259033203125, 1.10858154296875, 1.291259765625, 1.47393798828125, 1.6566162109375, 1.83929443359375, 2.02197265625, 2.20465087890625, 2.3873291015625, 2.57000732421875, 2.752685546875, 2.93536376953125, 3.1180419921875, 3.30072021484375, 3.4833984375, 3.66607666015625, 3.8487548828125, 4.03143310546875, 4.214111328125, 4.39678955078125, 4.5794677734375, 4.76214599609375, 4.94482421875, 5.12750244140625, 5.3101806640625, 5.49285888671875, 5.675537109375, 5.85821533203125, 6.0408935546875, 6.22357177734375, 6.40625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 8.0, 8.0, 12.0, 9.0, 11.0, 15.0, 27.0, 49.0, 77.0, 133.0, 281.0, 657.0, 1811.0, 7225.0, 56456.0, 819612.0, 145694.0, 12041.0, 2815.0, 840.0, 342.0, 155.0, 94.0, 58.0, 39.0, 26.0, 18.0, 11.0, 10.0, 4.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.31298828125, -15.8134765625, -15.31396484375, -14.814453125, -14.31494140625, -13.8154296875, -13.31591796875, -12.81640625, -12.31689453125, -11.8173828125, -11.31787109375, -10.818359375, -10.31884765625, -9.8193359375, -9.31982421875, -8.8203125, -8.32080078125, -7.8212890625, -7.32177734375, -6.822265625, -6.32275390625, -5.8232421875, -5.32373046875, -4.82421875, -4.32470703125, -3.8251953125, -3.32568359375, -2.826171875, -2.32666015625, -1.8271484375, -1.32763671875, -0.828125, -0.32861328125, 0.1708984375, 0.67041015625, 1.169921875, 1.66943359375, 2.1689453125, 2.66845703125, 3.16796875, 3.66748046875, 4.1669921875, 4.66650390625, 5.166015625, 5.66552734375, 6.1650390625, 6.66455078125, 7.1640625, 7.66357421875, 8.1630859375, 8.66259765625, 9.162109375, 9.66162109375, 10.1611328125, 10.66064453125, 11.16015625, 11.65966796875, 12.1591796875, 12.65869140625, 13.158203125, 13.65771484375, 14.1572265625, 14.65673828125, 15.15625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 10.0, 13.0, 7.0, 12.0, 19.0, 22.0, 15.0, 30.0, 38.0, 45.0, 39.0, 46.0, 48.0, 54.0, 53.0, 47.0, 60.0, 50.0, 47.0, 45.0, 43.0, 41.0, 37.0, 39.0, 21.0, 19.0, 25.0, 17.0, 12.0, 5.0, 5.0, 5.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.34375, -19.741943359375, -19.14013671875, -18.538330078125, -17.9365234375, -17.334716796875, -16.73291015625, -16.131103515625, -15.529296875, -14.927490234375, -14.32568359375, -13.723876953125, -13.1220703125, -12.520263671875, -11.91845703125, -11.316650390625, -10.71484375, -10.113037109375, -9.51123046875, -8.909423828125, -8.3076171875, -7.705810546875, -7.10400390625, -6.502197265625, -5.900390625, -5.298583984375, -4.69677734375, -4.094970703125, -3.4931640625, -2.891357421875, -2.28955078125, -1.687744140625, -1.0859375, -0.484130859375, 0.11767578125, 0.719482421875, 1.3212890625, 1.923095703125, 2.52490234375, 3.126708984375, 3.728515625, 4.330322265625, 4.93212890625, 5.533935546875, 6.1357421875, 6.737548828125, 7.33935546875, 7.941162109375, 8.54296875, 9.144775390625, 9.74658203125, 10.348388671875, 10.9501953125, 11.552001953125, 12.15380859375, 12.755615234375, 13.357421875, 13.959228515625, 14.56103515625, 15.162841796875, 15.7646484375, 16.366455078125, 16.96826171875, 17.570068359375, 18.171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 3.0, 13.0, 16.0, 49.0, 77.0, 113.0, 271.0, 667.0, 1707.0, 5734.0, 26222.0, 208356.0, 715614.0, 72305.0, 12308.0, 3190.0, 1069.0, 407.0, 192.0, 101.0, 55.0, 34.0, 14.0, 13.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.918212890625, -4.73095703125, -4.543701171875, -4.3564453125, -4.169189453125, -3.98193359375, -3.794677734375, -3.607421875, -3.420166015625, -3.23291015625, -3.045654296875, -2.8583984375, -2.671142578125, -2.48388671875, -2.296630859375, -2.109375, -1.922119140625, -1.73486328125, -1.547607421875, -1.3603515625, -1.173095703125, -0.98583984375, -0.798583984375, -0.611328125, -0.424072265625, -0.23681640625, -0.049560546875, 0.1376953125, 0.324951171875, 0.51220703125, 0.699462890625, 0.88671875, 1.073974609375, 1.26123046875, 1.448486328125, 1.6357421875, 1.822998046875, 2.01025390625, 2.197509765625, 2.384765625, 2.572021484375, 2.75927734375, 2.946533203125, 3.1337890625, 3.321044921875, 3.50830078125, 3.695556640625, 3.8828125, 4.070068359375, 4.25732421875, 4.444580078125, 4.6318359375, 4.819091796875, 5.00634765625, 5.193603515625, 5.380859375, 5.568115234375, 5.75537109375, 5.942626953125, 6.1298828125, 6.317138671875, 6.50439453125, 6.691650390625, 6.87890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 16.0, 17.0, 18.0, 18.0, 31.0, 30.0, 42.0, 76.0, 81.0, 83.0, 96.0, 96.0, 80.0, 65.0, 55.0, 37.0, 27.0, 21.0, 21.0, 8.0, 10.0, 6.0, 5.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009455680847167969, -0.000914745032787323, -0.0008839219808578491, -0.0008530989289283752, -0.0008222758769989014, -0.0007914528250694275, -0.0007606297731399536, -0.0007298067212104797, -0.0006989836692810059, -0.000668160617351532, -0.0006373375654220581, -0.0006065145134925842, -0.0005756914615631104, -0.0005448684096336365, -0.0005140453577041626, -0.0004832223057746887, -0.00045239925384521484, -0.00042157620191574097, -0.0003907531499862671, -0.0003599300980567932, -0.00032910704612731934, -0.00029828399419784546, -0.0002674609422683716, -0.0002366378903388977, -0.00020581483840942383, -0.00017499178647994995, -0.00014416873455047607, -0.0001133456826210022, -8.252263069152832e-05, -5.169957876205444e-05, -2.0876526832580566e-05, 9.94652509689331e-06, 4.076957702636719e-05, 7.159262895584106e-05, 0.00010241568088531494, 0.00013323873281478882, 0.0001640617847442627, 0.00019488483667373657, 0.00022570788860321045, 0.0002565309405326843, 0.0002873539924621582, 0.0003181770443916321, 0.00034900009632110596, 0.00037982314825057983, 0.0004106462001800537, 0.0004414692521095276, 0.00047229230403900146, 0.0005031153559684753, 0.0005339384078979492, 0.0005647614598274231, 0.000595584511756897, 0.0006264075636863708, 0.0006572306156158447, 0.0006880536675453186, 0.0007188767194747925, 0.0007496997714042664, 0.0007805228233337402, 0.0008113458752632141, 0.000842168927192688, 0.0008729919791221619, 0.0009038150310516357, 0.0009346380829811096, 0.0009654611349105835, 0.0009962841868400574, 0.0010271072387695312]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 13.0, 15.0, 17.0, 45.0, 78.0, 144.0, 236.0, 510.0, 1364.0, 4737.0, 25671.0, 303118.0, 663228.0, 39716.0, 6557.0, 1727.0, 680.0, 284.0, 150.0, 99.0, 47.0, 36.0, 27.0, 13.0, 13.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.3177490234375, -8.080810546875, -7.8438720703125, -7.60693359375, -7.3699951171875, -7.133056640625, -6.8961181640625, -6.6591796875, -6.4222412109375, -6.185302734375, -5.9483642578125, -5.71142578125, -5.4744873046875, -5.237548828125, -5.0006103515625, -4.763671875, -4.5267333984375, -4.289794921875, -4.0528564453125, -3.81591796875, -3.5789794921875, -3.342041015625, -3.1051025390625, -2.8681640625, -2.6312255859375, -2.394287109375, -2.1573486328125, -1.92041015625, -1.6834716796875, -1.446533203125, -1.2095947265625, -0.97265625, -0.7357177734375, -0.498779296875, -0.2618408203125, -0.02490234375, 0.2120361328125, 0.448974609375, 0.6859130859375, 0.9228515625, 1.1597900390625, 1.396728515625, 1.6336669921875, 1.87060546875, 2.1075439453125, 2.344482421875, 2.5814208984375, 2.818359375, 3.0552978515625, 3.292236328125, 3.5291748046875, 3.76611328125, 4.0030517578125, 4.239990234375, 4.4769287109375, 4.7138671875, 4.9508056640625, 5.187744140625, 5.4246826171875, 5.66162109375, 5.8985595703125, 6.135498046875, 6.3724365234375, 6.609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 16.0, 15.0, 28.0, 39.0, 48.0, 87.0, 103.0, 128.0, 112.0, 111.0, 79.0, 70.0, 39.0, 28.0, 21.0, 17.0, 9.0, 13.0, 3.0, 6.0, 2.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.171875, -7.98223876953125, -7.7926025390625, -7.60296630859375, -7.413330078125, -7.22369384765625, -7.0340576171875, -6.84442138671875, -6.65478515625, -6.46514892578125, -6.2755126953125, -6.08587646484375, -5.896240234375, -5.70660400390625, -5.5169677734375, -5.32733154296875, -5.1376953125, -4.94805908203125, -4.7584228515625, -4.56878662109375, -4.379150390625, -4.18951416015625, -3.9998779296875, -3.81024169921875, -3.62060546875, -3.43096923828125, -3.2413330078125, -3.05169677734375, -2.862060546875, -2.67242431640625, -2.4827880859375, -2.29315185546875, -2.103515625, -1.91387939453125, -1.7242431640625, -1.53460693359375, -1.344970703125, -1.15533447265625, -0.9656982421875, -0.77606201171875, -0.58642578125, -0.39678955078125, -0.2071533203125, -0.01751708984375, 0.172119140625, 0.36175537109375, 0.5513916015625, 0.74102783203125, 0.9306640625, 1.12030029296875, 1.3099365234375, 1.49957275390625, 1.689208984375, 1.87884521484375, 2.0684814453125, 2.25811767578125, 2.44775390625, 2.63739013671875, 2.8270263671875, 3.01666259765625, 3.206298828125, 3.39593505859375, 3.5855712890625, 3.77520751953125, 3.96484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 18.0, 53.0, 147.0, 413.0, 238.0, 81.0, 22.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-330.9302978515625, -324.78338623046875, -318.6365051269531, -312.4895935058594, -306.3426818847656, -300.1957702636719, -294.04888916015625, -287.9019775390625, -281.75506591796875, -275.608154296875, -269.4612731933594, -263.3143615722656, -257.1674499511719, -251.0205535888672, -244.8736572265625, -238.72674560546875, -232.57984924316406, -226.43295288085938, -220.28604125976562, -214.13914489746094, -207.9922332763672, -201.8453369140625, -195.69842529296875, -189.55152893066406, -183.40463256835938, -177.2577362060547, -171.11082458496094, -164.96392822265625, -158.8170166015625, -152.6701202392578, -146.52322387695312, -140.37631225585938, -134.22940063476562, -128.08250427246094, -121.93559265136719, -115.7886962890625, -109.64178466796875, -103.49488830566406, -97.34798431396484, -91.20108032226562, -85.05416870117188, -78.90726470947266, -72.76036071777344, -66.61346435546875, -60.466556549072266, -54.31965255737305, -48.172752380371094, -42.025848388671875, -35.87894821166992, -29.732044219970703, -23.585142135620117, -17.43824005126953, -11.291336059570312, -5.144432067871094, 1.0024681091308594, 7.149372100830078, 13.296276092529297, 19.443180084228516, 25.5900821685791, 31.736984252929688, 37.883888244628906, 44.030792236328125, 50.17769241333008, 56.3245964050293, 62.471500396728516]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 5.0, 7.0, 8.0, 15.0, 24.0, 19.0, 27.0, 26.0, 35.0, 32.0, 31.0, 60.0, 75.0, 99.0, 89.0, 88.0, 48.0, 48.0, 43.0, 34.0, 31.0, 26.0, 23.0, 16.0, 15.0, 18.0, 10.0, 8.0, 15.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.79682922363281, -87.09203338623047, -84.38723754882812, -81.68244934082031, -78.97765350341797, -76.27285766601562, -73.56806945800781, -70.86327362060547, -68.15847778320312, -65.45368194580078, -62.7488899230957, -60.044097900390625, -57.33930206298828, -54.63450622558594, -51.92971420288086, -49.22492218017578, -46.52012634277344, -43.815330505371094, -41.110538482666016, -38.40574645996094, -35.700950622558594, -32.99615478515625, -30.291362762451172, -27.58656883239746, -24.88177490234375, -22.17698097229004, -19.472187042236328, -16.767393112182617, -14.062599182128906, -11.357805252075195, -8.653011322021484, -5.948217391967773, -3.2434158325195312, -0.5386219024658203, 2.1661720275878906, 4.870965957641602, 7.5757598876953125, 10.280553817749023, 12.985347747802734, 15.690141677856445, 18.394935607910156, 21.099729537963867, 23.804523468017578, 26.50931739807129, 29.214111328125, 31.91890525817871, 34.62369918823242, 37.3284912109375, 40.033287048339844, 42.73808288574219, 45.442874908447266, 48.147666931152344, 50.85246276855469, 53.55725860595703, 56.26205062866211, 58.96684265136719, 61.67163848876953, 64.37643432617188, 67.08122253417969, 69.78601837158203, 72.49081420898438, 75.19561004638672, 77.90040588378906, 80.60519409179688, 83.30998992919922]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 2.0, 5.0, 9.0, 17.0, 24.0, 32.0, 60.0, 60.0, 106.0, 141.0, 185.0, 259.0, 403.0, 655.0, 1044.0, 1864.0, 3462.0, 7083.0, 16425.0, 45162.0, 164611.0, 824286.0, 2254590.0, 660858.0, 141766.0, 40983.0, 15532.0, 6914.0, 3380.0, 1759.0, 979.0, 627.0, 370.0, 241.0, 113.0, 89.0, 77.0, 37.0, 16.0, 18.0, 10.0, 8.0, 2.0, 5.0, 4.0], "bins": [-5.9609375, -5.81707763671875, -5.6732177734375, -5.52935791015625, -5.385498046875, -5.24163818359375, -5.0977783203125, -4.95391845703125, -4.81005859375, -4.66619873046875, -4.5223388671875, -4.37847900390625, -4.234619140625, -4.09075927734375, -3.9468994140625, -3.80303955078125, -3.6591796875, -3.51531982421875, -3.3714599609375, -3.22760009765625, -3.083740234375, -2.93988037109375, -2.7960205078125, -2.65216064453125, -2.50830078125, -2.36444091796875, -2.2205810546875, -2.07672119140625, -1.932861328125, -1.78900146484375, -1.6451416015625, -1.50128173828125, -1.357421875, -1.21356201171875, -1.0697021484375, -0.92584228515625, -0.781982421875, -0.63812255859375, -0.4942626953125, -0.35040283203125, -0.20654296875, -0.06268310546875, 0.0811767578125, 0.22503662109375, 0.368896484375, 0.51275634765625, 0.6566162109375, 0.80047607421875, 0.9443359375, 1.08819580078125, 1.2320556640625, 1.37591552734375, 1.519775390625, 1.66363525390625, 1.8074951171875, 1.95135498046875, 2.09521484375, 2.23907470703125, 2.3829345703125, 2.52679443359375, 2.670654296875, 2.81451416015625, 2.9583740234375, 3.10223388671875, 3.24609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 11.0, 8.0, 8.0, 17.0, 22.0, 16.0, 28.0, 25.0, 40.0, 31.0, 54.0, 64.0, 48.0, 74.0, 56.0, 48.0, 51.0, 60.0, 47.0, 44.0, 36.0, 46.0, 38.0, 30.0, 19.0, 27.0, 13.0, 3.0, 4.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.31805419921875, -5.1517333984375, -4.98541259765625, -4.819091796875, -4.65277099609375, -4.4864501953125, -4.32012939453125, -4.15380859375, -3.98748779296875, -3.8211669921875, -3.65484619140625, -3.488525390625, -3.32220458984375, -3.1558837890625, -2.98956298828125, -2.8232421875, -2.65692138671875, -2.4906005859375, -2.32427978515625, -2.157958984375, -1.99163818359375, -1.8253173828125, -1.65899658203125, -1.49267578125, -1.32635498046875, -1.1600341796875, -0.99371337890625, -0.827392578125, -0.66107177734375, -0.4947509765625, -0.32843017578125, -0.162109375, 0.00421142578125, 0.1705322265625, 0.33685302734375, 0.503173828125, 0.66949462890625, 0.8358154296875, 1.00213623046875, 1.16845703125, 1.33477783203125, 1.5010986328125, 1.66741943359375, 1.833740234375, 2.00006103515625, 2.1663818359375, 2.33270263671875, 2.4990234375, 2.66534423828125, 2.8316650390625, 2.99798583984375, 3.164306640625, 3.33062744140625, 3.4969482421875, 3.66326904296875, 3.82958984375, 3.99591064453125, 4.1622314453125, 4.32855224609375, 4.494873046875, 4.66119384765625, 4.8275146484375, 4.99383544921875, 5.16015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 6.0, 13.0, 25.0, 47.0, 95.0, 165.0, 469.0, 1478.0, 8857.0, 155604.0, 3922289.0, 96084.0, 7022.0, 1313.0, 437.0, 153.0, 84.0, 46.0, 19.0, 19.0, 19.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.28125, -28.55712890625, -27.8330078125, -27.10888671875, -26.384765625, -25.66064453125, -24.9365234375, -24.21240234375, -23.48828125, -22.76416015625, -22.0400390625, -21.31591796875, -20.591796875, -19.86767578125, -19.1435546875, -18.41943359375, -17.6953125, -16.97119140625, -16.2470703125, -15.52294921875, -14.798828125, -14.07470703125, -13.3505859375, -12.62646484375, -11.90234375, -11.17822265625, -10.4541015625, -9.72998046875, -9.005859375, -8.28173828125, -7.5576171875, -6.83349609375, -6.109375, -5.38525390625, -4.6611328125, -3.93701171875, -3.212890625, -2.48876953125, -1.7646484375, -1.04052734375, -0.31640625, 0.40771484375, 1.1318359375, 1.85595703125, 2.580078125, 3.30419921875, 4.0283203125, 4.75244140625, 5.4765625, 6.20068359375, 6.9248046875, 7.64892578125, 8.373046875, 9.09716796875, 9.8212890625, 10.54541015625, 11.26953125, 11.99365234375, 12.7177734375, 13.44189453125, 14.166015625, 14.89013671875, 15.6142578125, 16.33837890625, 17.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 13.0, 11.0, 17.0, 28.0, 30.0, 53.0, 78.0, 147.0, 261.0, 451.0, 868.0, 852.0, 532.0, 301.0, 125.0, 88.0, 55.0, 37.0, 29.0, 19.0, 16.0, 13.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.7886962890625, -10.374267578125, -9.9598388671875, -9.54541015625, -9.1309814453125, -8.716552734375, -8.3021240234375, -7.8876953125, -7.4732666015625, -7.058837890625, -6.6444091796875, -6.22998046875, -5.8155517578125, -5.401123046875, -4.9866943359375, -4.572265625, -4.1578369140625, -3.743408203125, -3.3289794921875, -2.91455078125, -2.5001220703125, -2.085693359375, -1.6712646484375, -1.2568359375, -0.8424072265625, -0.427978515625, -0.0135498046875, 0.40087890625, 0.8153076171875, 1.229736328125, 1.6441650390625, 2.05859375, 2.4730224609375, 2.887451171875, 3.3018798828125, 3.71630859375, 4.1307373046875, 4.545166015625, 4.9595947265625, 5.3740234375, 5.7884521484375, 6.202880859375, 6.6173095703125, 7.03173828125, 7.4461669921875, 7.860595703125, 8.2750244140625, 8.689453125, 9.1038818359375, 9.518310546875, 9.9327392578125, 10.34716796875, 10.7615966796875, 11.176025390625, 11.5904541015625, 12.0048828125, 12.4193115234375, 12.833740234375, 13.2481689453125, 13.66259765625, 14.0770263671875, 14.491455078125, 14.9058837890625, 15.3203125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 7.0, 9.0, 20.0, 55.0, 98.0, 177.0, 213.0, 209.0, 104.0, 56.0, 23.0, 15.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.5263671875, -129.65699768066406, -125.78761291503906, -121.91824340820312, -118.04886627197266, -114.17948913574219, -110.31011199951172, -106.44073486328125, -102.57136535644531, -98.70198822021484, -94.83261108398438, -90.96324157714844, -87.09386444091797, -83.2244873046875, -79.35511016845703, -75.48573303222656, -71.6163558959961, -67.74697875976562, -63.87760543823242, -60.00822830200195, -56.13885498046875, -52.26947784423828, -48.40010070800781, -44.530723571777344, -40.66135025024414, -36.79197311401367, -32.92259979248047, -29.05322265625, -25.183847427368164, -21.314472198486328, -17.44509506225586, -13.575719833374023, -9.706352233886719, -5.836976528167725, -1.9676008224487305, 1.9017753601074219, 5.771150588989258, 9.640525817871094, 13.509902954101562, 17.3792781829834, 21.248653411865234, 25.11802864074707, 28.987403869628906, 32.856781005859375, 36.726158142089844, 40.59553146362305, 44.464908599853516, 48.33428192138672, 52.20365905761719, 56.073036193847656, 59.94240951538086, 63.81178665161133, 67.68115997314453, 71.550537109375, 75.41991424560547, 79.28929138183594, 83.15866088867188, 87.02803802490234, 90.89741516113281, 94.76678466796875, 98.63616180419922, 102.50553894042969, 106.37491607666016, 110.24429321289062, 114.1136703491211]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 12.0, 8.0, 11.0, 12.0, 23.0, 26.0, 30.0, 31.0, 29.0, 34.0, 47.0, 49.0, 58.0, 54.0, 46.0, 49.0, 61.0, 56.0, 55.0, 61.0, 44.0, 38.0, 26.0, 22.0, 34.0, 18.0, 22.0, 11.0, 14.0, 5.0, 5.0, 8.0, 5.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.52397918701172, -58.732112884521484, -56.94024658203125, -55.148380279541016, -53.35651397705078, -51.56464767456055, -49.77278137207031, -47.98091506958008, -46.189048767089844, -44.39718246459961, -42.605316162109375, -40.81344985961914, -39.021583557128906, -37.22971725463867, -35.43785095214844, -33.6459846496582, -31.8541202545166, -30.062253952026367, -28.270387649536133, -26.4785213470459, -24.686655044555664, -22.894790649414062, -21.102924346923828, -19.311058044433594, -17.51919174194336, -15.727325439453125, -13.93545913696289, -12.143592834472656, -10.351726531982422, -8.559861183166504, -6.7679948806762695, -4.976128578186035, -3.1842613220214844, -1.3923951387405396, 0.3994710445404053, 2.1913371086120605, 3.983203411102295, 5.775069236755371, 7.5669355392456055, 9.35880184173584, 11.150668144226074, 12.942534446716309, 14.734400749206543, 16.52626609802246, 18.318132400512695, 20.10999870300293, 21.901865005493164, 23.6937313079834, 25.485597610473633, 27.277463912963867, 29.0693302154541, 30.861196517944336, 32.65306091308594, 34.44492721557617, 36.236793518066406, 38.02865982055664, 39.820526123046875, 41.61239242553711, 43.404258728027344, 45.19612503051758, 46.98799133300781, 48.77985763549805, 50.57172393798828, 52.363590240478516, 54.15545654296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 14.0, 8.0, 14.0, 24.0, 32.0, 55.0, 90.0, 134.0, 291.0, 525.0, 977.0, 2240.0, 5521.0, 18988.0, 115535.0, 651722.0, 210703.0, 28870.0, 7336.0, 2822.0, 1258.0, 609.0, 320.0, 168.0, 102.0, 65.0, 51.0, 25.0, 15.0, 10.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.4739990234375, -12.151123046875, -11.8282470703125, -11.50537109375, -11.1824951171875, -10.859619140625, -10.5367431640625, -10.2138671875, -9.8909912109375, -9.568115234375, -9.2452392578125, -8.92236328125, -8.5994873046875, -8.276611328125, -7.9537353515625, -7.630859375, -7.3079833984375, -6.985107421875, -6.6622314453125, -6.33935546875, -6.0164794921875, -5.693603515625, -5.3707275390625, -5.0478515625, -4.7249755859375, -4.402099609375, -4.0792236328125, -3.75634765625, -3.4334716796875, -3.110595703125, -2.7877197265625, -2.46484375, -2.1419677734375, -1.819091796875, -1.4962158203125, -1.17333984375, -0.8504638671875, -0.527587890625, -0.2047119140625, 0.1181640625, 0.4410400390625, 0.763916015625, 1.0867919921875, 1.40966796875, 1.7325439453125, 2.055419921875, 2.3782958984375, 2.701171875, 3.0240478515625, 3.346923828125, 3.6697998046875, 3.99267578125, 4.3155517578125, 4.638427734375, 4.9613037109375, 5.2841796875, 5.6070556640625, 5.929931640625, 6.2528076171875, 6.57568359375, 6.8985595703125, 7.221435546875, 7.5443115234375, 7.8671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 11.0, 7.0, 5.0, 13.0, 14.0, 10.0, 11.0, 16.0, 19.0, 23.0, 17.0, 30.0, 35.0, 35.0, 33.0, 44.0, 36.0, 47.0, 41.0, 51.0, 43.0, 61.0, 37.0, 36.0, 40.0, 42.0, 35.0, 24.0, 33.0, 24.0, 29.0, 15.0, 15.0, 13.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.506439208984375, -4.37225341796875, -4.238067626953125, -4.1038818359375, -3.969696044921875, -3.83551025390625, -3.701324462890625, -3.567138671875, -3.432952880859375, -3.29876708984375, -3.164581298828125, -3.0303955078125, -2.896209716796875, -2.76202392578125, -2.627838134765625, -2.49365234375, -2.359466552734375, -2.22528076171875, -2.091094970703125, -1.9569091796875, -1.822723388671875, -1.68853759765625, -1.554351806640625, -1.420166015625, -1.285980224609375, -1.15179443359375, -1.017608642578125, -0.8834228515625, -0.749237060546875, -0.61505126953125, -0.480865478515625, -0.3466796875, -0.212493896484375, -0.07830810546875, 0.055877685546875, 0.1900634765625, 0.324249267578125, 0.45843505859375, 0.592620849609375, 0.726806640625, 0.860992431640625, 0.99517822265625, 1.129364013671875, 1.2635498046875, 1.397735595703125, 1.53192138671875, 1.666107177734375, 1.80029296875, 1.934478759765625, 2.06866455078125, 2.202850341796875, 2.3370361328125, 2.471221923828125, 2.60540771484375, 2.739593505859375, 2.873779296875, 3.007965087890625, 3.14215087890625, 3.276336669921875, 3.4105224609375, 3.544708251953125, 3.67889404296875, 3.813079833984375, 3.947265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 9.0, 4.0, 3.0, 11.0, 15.0, 19.0, 26.0, 29.0, 47.0, 67.0, 111.0, 143.0, 273.0, 499.0, 989.0, 2476.0, 8568.0, 52795.0, 730346.0, 221542.0, 22412.0, 4943.0, 1560.0, 666.0, 386.0, 199.0, 141.0, 84.0, 48.0, 34.0, 21.0, 25.0, 12.0, 13.0, 13.0, 6.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.90625, -12.5242919921875, -12.142333984375, -11.7603759765625, -11.37841796875, -10.9964599609375, -10.614501953125, -10.2325439453125, -9.8505859375, -9.4686279296875, -9.086669921875, -8.7047119140625, -8.32275390625, -7.9407958984375, -7.558837890625, -7.1768798828125, -6.794921875, -6.4129638671875, -6.031005859375, -5.6490478515625, -5.26708984375, -4.8851318359375, -4.503173828125, -4.1212158203125, -3.7392578125, -3.3572998046875, -2.975341796875, -2.5933837890625, -2.21142578125, -1.8294677734375, -1.447509765625, -1.0655517578125, -0.68359375, -0.3016357421875, 0.080322265625, 0.4622802734375, 0.84423828125, 1.2261962890625, 1.608154296875, 1.9901123046875, 2.3720703125, 2.7540283203125, 3.135986328125, 3.5179443359375, 3.89990234375, 4.2818603515625, 4.663818359375, 5.0457763671875, 5.427734375, 5.8096923828125, 6.191650390625, 6.5736083984375, 6.95556640625, 7.3375244140625, 7.719482421875, 8.1014404296875, 8.4833984375, 8.8653564453125, 9.247314453125, 9.6292724609375, 10.01123046875, 10.3931884765625, 10.775146484375, 11.1571044921875, 11.5390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 11.0, 9.0, 8.0, 15.0, 17.0, 16.0, 28.0, 13.0, 31.0, 33.0, 37.0, 38.0, 48.0, 44.0, 46.0, 49.0, 41.0, 53.0, 52.0, 45.0, 39.0, 36.0, 33.0, 33.0, 29.0, 29.0, 18.0, 16.0, 17.0, 22.0, 11.0, 7.0, 11.0, 6.0, 5.0, 8.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.65625, -17.1669921875, -16.677734375, -16.1884765625, -15.69921875, -15.2099609375, -14.720703125, -14.2314453125, -13.7421875, -13.2529296875, -12.763671875, -12.2744140625, -11.78515625, -11.2958984375, -10.806640625, -10.3173828125, -9.828125, -9.3388671875, -8.849609375, -8.3603515625, -7.87109375, -7.3818359375, -6.892578125, -6.4033203125, -5.9140625, -5.4248046875, -4.935546875, -4.4462890625, -3.95703125, -3.4677734375, -2.978515625, -2.4892578125, -2.0, -1.5107421875, -1.021484375, -0.5322265625, -0.04296875, 0.4462890625, 0.935546875, 1.4248046875, 1.9140625, 2.4033203125, 2.892578125, 3.3818359375, 3.87109375, 4.3603515625, 4.849609375, 5.3388671875, 5.828125, 6.3173828125, 6.806640625, 7.2958984375, 7.78515625, 8.2744140625, 8.763671875, 9.2529296875, 9.7421875, 10.2314453125, 10.720703125, 11.2099609375, 11.69921875, 12.1884765625, 12.677734375, 13.1669921875, 13.65625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 13.0, 18.0, 18.0, 28.0, 39.0, 61.0, 111.0, 170.0, 228.0, 355.0, 646.0, 1350.0, 2511.0, 5355.0, 12463.0, 34001.0, 115990.0, 629073.0, 171030.0, 46114.0, 15900.0, 6533.0, 2987.0, 1449.0, 810.0, 481.0, 266.0, 165.0, 109.0, 74.0, 43.0, 36.0, 25.0, 15.0, 8.0, 15.0, 8.0, 8.0, 6.0, 4.0, 1.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.0311279296875, -2.935302734375, -2.8394775390625, -2.74365234375, -2.6478271484375, -2.552001953125, -2.4561767578125, -2.3603515625, -2.2645263671875, -2.168701171875, -2.0728759765625, -1.97705078125, -1.8812255859375, -1.785400390625, -1.6895751953125, -1.59375, -1.4979248046875, -1.402099609375, -1.3062744140625, -1.21044921875, -1.1146240234375, -1.018798828125, -0.9229736328125, -0.8271484375, -0.7313232421875, -0.635498046875, -0.5396728515625, -0.44384765625, -0.3480224609375, -0.252197265625, -0.1563720703125, -0.060546875, 0.0352783203125, 0.131103515625, 0.2269287109375, 0.32275390625, 0.4185791015625, 0.514404296875, 0.6102294921875, 0.7060546875, 0.8018798828125, 0.897705078125, 0.9935302734375, 1.08935546875, 1.1851806640625, 1.281005859375, 1.3768310546875, 1.47265625, 1.5684814453125, 1.664306640625, 1.7601318359375, 1.85595703125, 1.9517822265625, 2.047607421875, 2.1434326171875, 2.2392578125, 2.3350830078125, 2.430908203125, 2.5267333984375, 2.62255859375, 2.7183837890625, 2.814208984375, 2.9100341796875, 3.005859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 12.0, 33.0, 63.0, 62.0, 120.0, 194.0, 178.0, 124.0, 76.0, 36.0, 21.0, 14.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018291473388671875, -0.0017780661582946777, -0.001726984977722168, -0.0016759037971496582, -0.0016248226165771484, -0.0015737414360046387, -0.001522660255432129, -0.0014715790748596191, -0.0014204978942871094, -0.0013694167137145996, -0.0013183355331420898, -0.00126725435256958, -0.0012161731719970703, -0.0011650919914245605, -0.0011140108108520508, -0.001062929630279541, -0.0010118484497070312, -0.0009607672691345215, -0.0009096860885620117, -0.000858604907989502, -0.0008075237274169922, -0.0007564425468444824, -0.0007053613662719727, -0.0006542801856994629, -0.0006031990051269531, -0.0005521178245544434, -0.0005010366439819336, -0.00044995546340942383, -0.00039887428283691406, -0.0003477931022644043, -0.00029671192169189453, -0.00024563074111938477, -0.000194549560546875, -0.00014346837997436523, -9.238719940185547e-05, -4.13060188293457e-05, 9.775161743164062e-06, 6.085634231567383e-05, 0.0001119375228881836, 0.00016301870346069336, 0.00021409988403320312, 0.0002651810646057129, 0.00031626224517822266, 0.0003673434257507324, 0.0004184246063232422, 0.00046950578689575195, 0.0005205869674682617, 0.0005716681480407715, 0.0006227493286132812, 0.000673830509185791, 0.0007249116897583008, 0.0007759928703308105, 0.0008270740509033203, 0.0008781552314758301, 0.0009292364120483398, 0.0009803175926208496, 0.0010313987731933594, 0.0010824799537658691, 0.001133561134338379, 0.0011846423149108887, 0.0012357234954833984, 0.0012868046760559082, 0.001337885856628418, 0.0013889670372009277, 0.0014400482177734375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 5.0, 19.0, 17.0, 15.0, 29.0, 49.0, 64.0, 118.0, 155.0, 266.0, 466.0, 794.0, 1681.0, 4129.0, 11809.0, 45970.0, 268442.0, 621496.0, 67483.0, 16137.0, 5179.0, 2021.0, 980.0, 453.0, 253.0, 177.0, 97.0, 65.0, 45.0, 35.0, 22.0, 23.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.19140625, -4.0609130859375, -3.930419921875, -3.7999267578125, -3.66943359375, -3.5389404296875, -3.408447265625, -3.2779541015625, -3.1474609375, -3.0169677734375, -2.886474609375, -2.7559814453125, -2.62548828125, -2.4949951171875, -2.364501953125, -2.2340087890625, -2.103515625, -1.9730224609375, -1.842529296875, -1.7120361328125, -1.58154296875, -1.4510498046875, -1.320556640625, -1.1900634765625, -1.0595703125, -0.9290771484375, -0.798583984375, -0.6680908203125, -0.53759765625, -0.4071044921875, -0.276611328125, -0.1461181640625, -0.015625, 0.1148681640625, 0.245361328125, 0.3758544921875, 0.50634765625, 0.6368408203125, 0.767333984375, 0.8978271484375, 1.0283203125, 1.1588134765625, 1.289306640625, 1.4197998046875, 1.55029296875, 1.6807861328125, 1.811279296875, 1.9417724609375, 2.072265625, 2.2027587890625, 2.333251953125, 2.4637451171875, 2.59423828125, 2.7247314453125, 2.855224609375, 2.9857177734375, 3.1162109375, 3.2467041015625, 3.377197265625, 3.5076904296875, 3.63818359375, 3.7686767578125, 3.899169921875, 4.0296630859375, 4.16015625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 12.0, 12.0, 11.0, 16.0, 30.0, 25.0, 35.0, 65.0, 53.0, 111.0, 104.0, 112.0, 95.0, 74.0, 49.0, 48.0, 28.0, 31.0, 17.0, 10.0, 13.0, 11.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.63671875, -4.508270263671875, -4.37982177734375, -4.251373291015625, -4.1229248046875, -3.994476318359375, -3.86602783203125, -3.737579345703125, -3.609130859375, -3.480682373046875, -3.35223388671875, -3.223785400390625, -3.0953369140625, -2.966888427734375, -2.83843994140625, -2.709991455078125, -2.58154296875, -2.453094482421875, -2.32464599609375, -2.196197509765625, -2.0677490234375, -1.939300537109375, -1.81085205078125, -1.682403564453125, -1.553955078125, -1.425506591796875, -1.29705810546875, -1.168609619140625, -1.0401611328125, -0.911712646484375, -0.78326416015625, -0.654815673828125, -0.5263671875, -0.397918701171875, -0.26947021484375, -0.141021728515625, -0.0125732421875, 0.115875244140625, 0.24432373046875, 0.372772216796875, 0.501220703125, 0.629669189453125, 0.75811767578125, 0.886566162109375, 1.0150146484375, 1.143463134765625, 1.27191162109375, 1.400360107421875, 1.52880859375, 1.657257080078125, 1.78570556640625, 1.914154052734375, 2.0426025390625, 2.171051025390625, 2.29949951171875, 2.427947998046875, 2.556396484375, 2.684844970703125, 2.81329345703125, 2.941741943359375, 3.0701904296875, 3.198638916015625, 3.32708740234375, 3.455535888671875, 3.583984375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 19.0, 35.0, 89.0, 174.0, 414.0, 161.0, 66.0, 13.0, 8.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-206.82421875, -202.1698760986328, -197.51553344726562, -192.8612060546875, -188.2068634033203, -183.55252075195312, -178.89817810058594, -174.24383544921875, -169.58950805664062, -164.93516540527344, -160.28082275390625, -155.62649536132812, -150.97215270996094, -146.31781005859375, -141.66346740722656, -137.00912475585938, -132.3547821044922, -127.700439453125, -123.04610443115234, -118.39176177978516, -113.7374267578125, -109.08308410644531, -104.42874145507812, -99.77439880371094, -95.12006378173828, -90.4657211303711, -85.81138610839844, -81.15704345703125, -76.50270080566406, -71.8483657836914, -67.19402313232422, -62.5396842956543, -57.88536071777344, -53.231021881103516, -48.576683044433594, -43.922340393066406, -39.268001556396484, -34.61366271972656, -29.959321975708008, -25.304981231689453, -20.65064239501953, -15.996302604675293, -11.341962814331055, -6.687623023986816, -2.033283233642578, 2.6210556030273438, 7.275396347045898, 11.929737091064453, 16.584075927734375, 21.238414764404297, 25.89275550842285, 30.547096252441406, 35.20143508911133, 39.85577392578125, 44.51011657714844, 49.16445541381836, 53.81879425048828, 58.4731330871582, 63.127471923828125, 67.78181457519531, 72.4361572265625, 77.09049224853516, 81.74483489990234, 86.399169921875, 91.05351257324219]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 5.0, 12.0, 8.0, 12.0, 28.0, 20.0, 33.0, 24.0, 34.0, 24.0, 31.0, 44.0, 70.0, 75.0, 100.0, 93.0, 56.0, 46.0, 34.0, 33.0, 26.0, 27.0, 29.0, 24.0, 16.0, 11.0, 14.0, 12.0, 12.0, 8.0, 2.0, 3.0, 6.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.32025146484375, -66.15970611572266, -63.9991569519043, -61.83860778808594, -59.67805862426758, -57.51750946044922, -55.356964111328125, -53.196414947509766, -51.035865783691406, -48.87531661987305, -46.71477127075195, -44.554222106933594, -42.393672943115234, -40.233123779296875, -38.07257843017578, -35.91202926635742, -33.75148391723633, -31.5909366607666, -29.430387496948242, -27.269840240478516, -25.109291076660156, -22.94874382019043, -20.788196563720703, -18.627647399902344, -16.467100143432617, -14.306551933288574, -12.146003723144531, -9.985456466674805, -7.824908256530762, -5.664360046386719, -3.503812789916992, -1.3432645797729492, 0.8172836303710938, 2.9778316020965576, 5.1383795738220215, 7.298927307128906, 9.45947551727295, 11.620023727416992, 13.780570983886719, 15.941119194030762, 18.101667404174805, 20.26221466064453, 22.42276382446289, 24.583311080932617, 26.743858337402344, 28.904407501220703, 31.06495475769043, 33.225502014160156, 35.386051177978516, 37.546600341796875, 39.70714569091797, 41.86769485473633, 44.02824401855469, 46.18878936767578, 48.34933853149414, 50.5098876953125, 52.670433044433594, 54.83098220825195, 56.99152755737305, 59.152076721191406, 61.312625885009766, 63.473175048828125, 65.63372039794922, 67.79426574707031, 69.95481872558594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 10.0, 17.0, 16.0, 25.0, 36.0, 55.0, 64.0, 86.0, 170.0, 243.0, 458.0, 882.0, 1885.0, 5099.0, 17394.0, 95731.0, 1051080.0, 2693157.0, 276802.0, 36691.0, 8766.0, 2962.0, 1245.0, 538.0, 312.0, 187.0, 97.0, 76.0, 63.0, 24.0, 27.0, 20.0, 12.0, 15.0, 10.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.0, -8.75164794921875, -8.5032958984375, -8.25494384765625, -8.006591796875, -7.75823974609375, -7.5098876953125, -7.26153564453125, -7.01318359375, -6.76483154296875, -6.5164794921875, -6.26812744140625, -6.019775390625, -5.77142333984375, -5.5230712890625, -5.27471923828125, -5.0263671875, -4.77801513671875, -4.5296630859375, -4.28131103515625, -4.032958984375, -3.78460693359375, -3.5362548828125, -3.28790283203125, -3.03955078125, -2.79119873046875, -2.5428466796875, -2.29449462890625, -2.046142578125, -1.79779052734375, -1.5494384765625, -1.30108642578125, -1.052734375, -0.80438232421875, -0.5560302734375, -0.30767822265625, -0.059326171875, 0.18902587890625, 0.4373779296875, 0.68572998046875, 0.93408203125, 1.18243408203125, 1.4307861328125, 1.67913818359375, 1.927490234375, 2.17584228515625, 2.4241943359375, 2.67254638671875, 2.9208984375, 3.16925048828125, 3.4176025390625, 3.66595458984375, 3.914306640625, 4.16265869140625, 4.4110107421875, 4.65936279296875, 4.90771484375, 5.15606689453125, 5.4044189453125, 5.65277099609375, 5.901123046875, 6.14947509765625, 6.3978271484375, 6.64617919921875, 6.89453125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 10.0, 8.0, 8.0, 11.0, 8.0, 14.0, 15.0, 23.0, 20.0, 23.0, 29.0, 27.0, 37.0, 40.0, 56.0, 53.0, 59.0, 50.0, 46.0, 47.0, 53.0, 45.0, 49.0, 44.0, 38.0, 29.0, 29.0, 24.0, 20.0, 21.0, 14.0, 18.0, 8.0, 7.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-5.91796875, -5.766998291015625, -5.61602783203125, -5.465057373046875, -5.3140869140625, -5.163116455078125, -5.01214599609375, -4.861175537109375, -4.710205078125, -4.559234619140625, -4.40826416015625, -4.257293701171875, -4.1063232421875, -3.955352783203125, -3.80438232421875, -3.653411865234375, -3.50244140625, -3.351470947265625, -3.20050048828125, -3.049530029296875, -2.8985595703125, -2.747589111328125, -2.59661865234375, -2.445648193359375, -2.294677734375, -2.143707275390625, -1.99273681640625, -1.841766357421875, -1.6907958984375, -1.539825439453125, -1.38885498046875, -1.237884521484375, -1.0869140625, -0.935943603515625, -0.78497314453125, -0.634002685546875, -0.4830322265625, -0.332061767578125, -0.18109130859375, -0.030120849609375, 0.120849609375, 0.271820068359375, 0.42279052734375, 0.573760986328125, 0.7247314453125, 0.875701904296875, 1.02667236328125, 1.177642822265625, 1.32861328125, 1.479583740234375, 1.63055419921875, 1.781524658203125, 1.9324951171875, 2.083465576171875, 2.23443603515625, 2.385406494140625, 2.536376953125, 2.687347412109375, 2.83831787109375, 2.989288330078125, 3.1402587890625, 3.291229248046875, 3.44219970703125, 3.593170166015625, 3.744140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 10.0, 11.0, 5.0, 8.0, 24.0, 25.0, 41.0, 77.0, 188.0, 417.0, 1185.0, 3960.0, 22686.0, 515888.0, 3545216.0, 92141.0, 8966.0, 2128.0, 727.0, 255.0, 137.0, 58.0, 37.0, 24.0, 17.0, 11.0, 14.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.078125, -17.5655517578125, -17.052978515625, -16.5404052734375, -16.02783203125, -15.5152587890625, -15.002685546875, -14.4901123046875, -13.9775390625, -13.4649658203125, -12.952392578125, -12.4398193359375, -11.92724609375, -11.4146728515625, -10.902099609375, -10.3895263671875, -9.876953125, -9.3643798828125, -8.851806640625, -8.3392333984375, -7.82666015625, -7.3140869140625, -6.801513671875, -6.2889404296875, -5.7763671875, -5.2637939453125, -4.751220703125, -4.2386474609375, -3.72607421875, -3.2135009765625, -2.700927734375, -2.1883544921875, -1.67578125, -1.1632080078125, -0.650634765625, -0.1380615234375, 0.37451171875, 0.8870849609375, 1.399658203125, 1.9122314453125, 2.4248046875, 2.9373779296875, 3.449951171875, 3.9625244140625, 4.47509765625, 4.9876708984375, 5.500244140625, 6.0128173828125, 6.525390625, 7.0379638671875, 7.550537109375, 8.0631103515625, 8.57568359375, 9.0882568359375, 9.600830078125, 10.1134033203125, 10.6259765625, 11.1385498046875, 11.651123046875, 12.1636962890625, 12.67626953125, 13.1888427734375, 13.701416015625, 14.2139892578125, 14.7265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 9.0, 13.0, 14.0, 29.0, 32.0, 38.0, 63.0, 89.0, 146.0, 191.0, 333.0, 545.0, 700.0, 679.0, 387.0, 248.0, 162.0, 111.0, 69.0, 65.0, 36.0, 28.0, 15.0, 7.0, 9.0, 7.0, 3.0, 11.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.724853515625, -8.41064453125, -8.096435546875, -7.7822265625, -7.468017578125, -7.15380859375, -6.839599609375, -6.525390625, -6.211181640625, -5.89697265625, -5.582763671875, -5.2685546875, -4.954345703125, -4.64013671875, -4.325927734375, -4.01171875, -3.697509765625, -3.38330078125, -3.069091796875, -2.7548828125, -2.440673828125, -2.12646484375, -1.812255859375, -1.498046875, -1.183837890625, -0.86962890625, -0.555419921875, -0.2412109375, 0.072998046875, 0.38720703125, 0.701416015625, 1.015625, 1.329833984375, 1.64404296875, 1.958251953125, 2.2724609375, 2.586669921875, 2.90087890625, 3.215087890625, 3.529296875, 3.843505859375, 4.15771484375, 4.471923828125, 4.7861328125, 5.100341796875, 5.41455078125, 5.728759765625, 6.04296875, 6.357177734375, 6.67138671875, 6.985595703125, 7.2998046875, 7.614013671875, 7.92822265625, 8.242431640625, 8.556640625, 8.870849609375, 9.18505859375, 9.499267578125, 9.8134765625, 10.127685546875, 10.44189453125, 10.756103515625, 11.0703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 11.0, 14.0, 14.0, 47.0, 91.0, 183.0, 213.0, 184.0, 113.0, 67.0, 25.0, 20.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.8641586303711, -99.6131362915039, -96.36210632324219, -93.111083984375, -89.86006164550781, -86.60903930664062, -83.35801696777344, -80.10698699951172, -76.85596466064453, -73.60494232177734, -70.35391235351562, -67.10289001464844, -63.85186767578125, -60.60084533691406, -57.34981918334961, -54.098793029785156, -50.84777069091797, -47.59674835205078, -44.34572219848633, -41.094696044921875, -37.84367370605469, -34.5926513671875, -31.341625213623047, -28.090600967407227, -24.839576721191406, -21.588552474975586, -18.337528228759766, -15.086503982543945, -11.835479736328125, -8.584455490112305, -5.333431243896484, -2.082406997680664, 1.168609619140625, 4.419633865356445, 7.670658111572266, 10.921682357788086, 14.172706604003906, 17.423730850219727, 20.674755096435547, 23.925779342651367, 27.176803588867188, 30.427827835083008, 33.67885208129883, 36.92987823486328, 40.18090057373047, 43.431922912597656, 46.68294906616211, 49.93397521972656, 53.18499755859375, 56.43601989746094, 59.68704605102539, 62.938072204589844, 66.18909454345703, 69.44011688232422, 72.69114685058594, 75.94216918945312, 79.19319152832031, 82.4442138671875, 85.69523620605469, 88.9462661743164, 92.1972885131836, 95.44831085205078, 98.6993408203125, 101.95036315917969, 105.20138549804688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 7.0, 1.0, 9.0, 7.0, 9.0, 13.0, 25.0, 12.0, 10.0, 17.0, 16.0, 18.0, 36.0, 24.0, 27.0, 31.0, 31.0, 34.0, 33.0, 34.0, 41.0, 45.0, 57.0, 54.0, 35.0, 39.0, 38.0, 35.0, 31.0, 23.0, 15.0, 24.0, 31.0, 23.0, 17.0, 20.0, 16.0, 8.0, 7.0, 10.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.54756164550781, -34.3658561706543, -33.18415069580078, -32.002445220947266, -30.820741653442383, -29.639036178588867, -28.457332611083984, -27.27562713623047, -26.093921661376953, -24.912216186523438, -23.730510711669922, -22.54880714416504, -21.367101669311523, -20.185396194458008, -19.003692626953125, -17.82198715209961, -16.640281677246094, -15.458576202392578, -14.276871681213379, -13.09516716003418, -11.913461685180664, -10.731756210327148, -9.55005168914795, -8.36834716796875, -7.186641693115234, -6.004936695098877, -4.8232316970825195, -3.641526699066162, -2.4598217010498047, -1.2781167030334473, -0.09641170501708984, 1.0852928161621094, 2.266998291015625, 3.4487032890319824, 4.63040828704834, 5.812113285064697, 6.993818283081055, 8.17552375793457, 9.35722827911377, 10.538932800292969, 11.720638275146484, 12.90234375, 14.0840482711792, 15.265752792358398, 16.447458267211914, 17.62916374206543, 18.810867309570312, 19.992572784423828, 21.174278259277344, 22.35598373413086, 23.537689208984375, 24.719392776489258, 25.901098251342773, 27.08280372619629, 28.264507293701172, 29.446212768554688, 30.627918243408203, 31.80962371826172, 32.991329193115234, 34.17303466796875, 35.354736328125, 36.536441802978516, 37.71814727783203, 38.89985275268555, 40.08155822753906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 11.0, 9.0, 10.0, 29.0, 32.0, 47.0, 58.0, 78.0, 106.0, 187.0, 256.0, 403.0, 644.0, 1030.0, 1910.0, 3589.0, 7243.0, 17004.0, 46831.0, 159796.0, 461533.0, 239463.0, 66152.0, 22841.0, 9311.0, 4358.0, 2168.0, 1298.0, 775.0, 458.0, 304.0, 176.0, 121.0, 78.0, 54.0, 46.0, 33.0, 28.0, 21.0, 19.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.4637451171875, -6.259521484375, -6.0552978515625, -5.85107421875, -5.6468505859375, -5.442626953125, -5.2384033203125, -5.0341796875, -4.8299560546875, -4.625732421875, -4.4215087890625, -4.21728515625, -4.0130615234375, -3.808837890625, -3.6046142578125, -3.400390625, -3.1961669921875, -2.991943359375, -2.7877197265625, -2.58349609375, -2.3792724609375, -2.175048828125, -1.9708251953125, -1.7666015625, -1.5623779296875, -1.358154296875, -1.1539306640625, -0.94970703125, -0.7454833984375, -0.541259765625, -0.3370361328125, -0.1328125, 0.0714111328125, 0.275634765625, 0.4798583984375, 0.68408203125, 0.8883056640625, 1.092529296875, 1.2967529296875, 1.5009765625, 1.7052001953125, 1.909423828125, 2.1136474609375, 2.31787109375, 2.5220947265625, 2.726318359375, 2.9305419921875, 3.134765625, 3.3389892578125, 3.543212890625, 3.7474365234375, 3.95166015625, 4.1558837890625, 4.360107421875, 4.5643310546875, 4.7685546875, 4.9727783203125, 5.177001953125, 5.3812255859375, 5.58544921875, 5.7896728515625, 5.993896484375, 6.1981201171875, 6.40234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 5.0, 15.0, 9.0, 14.0, 17.0, 15.0, 23.0, 34.0, 20.0, 29.0, 22.0, 29.0, 47.0, 36.0, 38.0, 50.0, 43.0, 57.0, 37.0, 44.0, 51.0, 35.0, 34.0, 31.0, 35.0, 34.0, 27.0, 26.0, 27.0, 18.0, 18.0, 11.0, 9.0, 11.0, 2.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.33984375, -4.1976318359375, -4.055419921875, -3.9132080078125, -3.77099609375, -3.6287841796875, -3.486572265625, -3.3443603515625, -3.2021484375, -3.0599365234375, -2.917724609375, -2.7755126953125, -2.63330078125, -2.4910888671875, -2.348876953125, -2.2066650390625, -2.064453125, -1.9222412109375, -1.780029296875, -1.6378173828125, -1.49560546875, -1.3533935546875, -1.211181640625, -1.0689697265625, -0.9267578125, -0.7845458984375, -0.642333984375, -0.5001220703125, -0.35791015625, -0.2156982421875, -0.073486328125, 0.0687255859375, 0.2109375, 0.3531494140625, 0.495361328125, 0.6375732421875, 0.77978515625, 0.9219970703125, 1.064208984375, 1.2064208984375, 1.3486328125, 1.4908447265625, 1.633056640625, 1.7752685546875, 1.91748046875, 2.0596923828125, 2.201904296875, 2.3441162109375, 2.486328125, 2.6285400390625, 2.770751953125, 2.9129638671875, 3.05517578125, 3.1973876953125, 3.339599609375, 3.4818115234375, 3.6240234375, 3.7662353515625, 3.908447265625, 4.0506591796875, 4.19287109375, 4.3350830078125, 4.477294921875, 4.6195068359375, 4.76171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 7.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 11.0, 25.0, 39.0, 58.0, 82.0, 128.0, 240.0, 488.0, 1056.0, 2689.0, 10275.0, 73621.0, 841695.0, 100200.0, 12336.0, 3236.0, 1161.0, 478.0, 255.0, 143.0, 103.0, 55.0, 37.0, 25.0, 19.0, 10.0, 9.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.25, -13.7984619140625, -13.346923828125, -12.8953857421875, -12.44384765625, -11.9923095703125, -11.540771484375, -11.0892333984375, -10.6376953125, -10.1861572265625, -9.734619140625, -9.2830810546875, -8.83154296875, -8.3800048828125, -7.928466796875, -7.4769287109375, -7.025390625, -6.5738525390625, -6.122314453125, -5.6707763671875, -5.21923828125, -4.7677001953125, -4.316162109375, -3.8646240234375, -3.4130859375, -2.9615478515625, -2.510009765625, -2.0584716796875, -1.60693359375, -1.1553955078125, -0.703857421875, -0.2523193359375, 0.19921875, 0.6507568359375, 1.102294921875, 1.5538330078125, 2.00537109375, 2.4569091796875, 2.908447265625, 3.3599853515625, 3.8115234375, 4.2630615234375, 4.714599609375, 5.1661376953125, 5.61767578125, 6.0692138671875, 6.520751953125, 6.9722900390625, 7.423828125, 7.8753662109375, 8.326904296875, 8.7784423828125, 9.22998046875, 9.6815185546875, 10.133056640625, 10.5845947265625, 11.0361328125, 11.4876708984375, 11.939208984375, 12.3907470703125, 12.84228515625, 13.2938232421875, 13.745361328125, 14.1968994140625, 14.6484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 8.0, 21.0, 16.0, 19.0, 25.0, 36.0, 43.0, 43.0, 58.0, 73.0, 73.0, 74.0, 82.0, 69.0, 57.0, 44.0, 42.0, 42.0, 29.0, 29.0, 25.0, 20.0, 15.0, 16.0, 12.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.061279296875, -17.27880859375, -16.496337890625, -15.7138671875, -14.931396484375, -14.14892578125, -13.366455078125, -12.583984375, -11.801513671875, -11.01904296875, -10.236572265625, -9.4541015625, -8.671630859375, -7.88916015625, -7.106689453125, -6.32421875, -5.541748046875, -4.75927734375, -3.976806640625, -3.1943359375, -2.411865234375, -1.62939453125, -0.846923828125, -0.064453125, 0.718017578125, 1.50048828125, 2.282958984375, 3.0654296875, 3.847900390625, 4.63037109375, 5.412841796875, 6.1953125, 6.977783203125, 7.76025390625, 8.542724609375, 9.3251953125, 10.107666015625, 10.89013671875, 11.672607421875, 12.455078125, 13.237548828125, 14.02001953125, 14.802490234375, 15.5849609375, 16.367431640625, 17.14990234375, 17.932373046875, 18.71484375, 19.497314453125, 20.27978515625, 21.062255859375, 21.8447265625, 22.627197265625, 23.40966796875, 24.192138671875, 24.974609375, 25.757080078125, 26.53955078125, 27.322021484375, 28.1044921875, 28.886962890625, 29.66943359375, 30.451904296875, 31.234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 12.0, 12.0, 20.0, 36.0, 48.0, 89.0, 131.0, 283.0, 513.0, 1038.0, 2381.0, 5673.0, 16694.0, 60453.0, 596063.0, 289054.0, 51746.0, 14715.0, 5410.0, 2141.0, 949.0, 499.0, 226.0, 145.0, 71.0, 48.0, 31.0, 18.0, 10.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.181640625, -3.087921142578125, -2.99420166015625, -2.900482177734375, -2.8067626953125, -2.713043212890625, -2.61932373046875, -2.525604248046875, -2.431884765625, -2.338165283203125, -2.24444580078125, -2.150726318359375, -2.0570068359375, -1.963287353515625, -1.86956787109375, -1.775848388671875, -1.68212890625, -1.588409423828125, -1.49468994140625, -1.400970458984375, -1.3072509765625, -1.213531494140625, -1.11981201171875, -1.026092529296875, -0.932373046875, -0.838653564453125, -0.74493408203125, -0.651214599609375, -0.5574951171875, -0.463775634765625, -0.37005615234375, -0.276336669921875, -0.1826171875, -0.088897705078125, 0.00482177734375, 0.098541259765625, 0.1922607421875, 0.285980224609375, 0.37969970703125, 0.473419189453125, 0.567138671875, 0.660858154296875, 0.75457763671875, 0.848297119140625, 0.9420166015625, 1.035736083984375, 1.12945556640625, 1.223175048828125, 1.31689453125, 1.410614013671875, 1.50433349609375, 1.598052978515625, 1.6917724609375, 1.785491943359375, 1.87921142578125, 1.972930908203125, 2.066650390625, 2.160369873046875, 2.25408935546875, 2.347808837890625, 2.4415283203125, 2.535247802734375, 2.62896728515625, 2.722686767578125, 2.81640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 5.0, 9.0, 9.0, 9.0, 20.0, 24.0, 41.0, 48.0, 57.0, 129.0, 142.0, 157.0, 114.0, 58.0, 47.0, 33.0, 26.0, 13.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0012664794921875, -0.0012313425540924072, -0.0011962056159973145, -0.0011610686779022217, -0.001125931739807129, -0.0010907948017120361, -0.0010556578636169434, -0.0010205209255218506, -0.0009853839874267578, -0.000950247049331665, -0.0009151101112365723, -0.0008799731731414795, -0.0008448362350463867, -0.0008096992969512939, -0.0007745623588562012, -0.0007394254207611084, -0.0007042884826660156, -0.0006691515445709229, -0.0006340146064758301, -0.0005988776683807373, -0.0005637407302856445, -0.0005286037921905518, -0.000493466854095459, -0.0004583299160003662, -0.00042319297790527344, -0.00038805603981018066, -0.0003529191017150879, -0.0003177821636199951, -0.00028264522552490234, -0.00024750828742980957, -0.0002123713493347168, -0.00017723441123962402, -0.00014209747314453125, -0.00010696053504943848, -7.18235969543457e-05, -3.668665885925293e-05, -1.5497207641601562e-06, 3.358721733093262e-05, 6.872415542602539e-05, 0.00010386109352111816, 0.00013899803161621094, 0.0001741349697113037, 0.00020927190780639648, 0.00024440884590148926, 0.00027954578399658203, 0.0003146827220916748, 0.0003498196601867676, 0.00038495659828186035, 0.0004200935363769531, 0.0004552304744720459, 0.0004903674125671387, 0.0005255043506622314, 0.0005606412887573242, 0.000595778226852417, 0.0006309151649475098, 0.0006660521030426025, 0.0007011890411376953, 0.0007363259792327881, 0.0007714629173278809, 0.0008065998554229736, 0.0008417367935180664, 0.0008768737316131592, 0.000912010669708252, 0.0009471476078033447, 0.0009822845458984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 7.0, 13.0, 13.0, 17.0, 10.0, 25.0, 27.0, 46.0, 60.0, 76.0, 133.0, 188.0, 354.0, 573.0, 1057.0, 2290.0, 5254.0, 14098.0, 44609.0, 177581.0, 650933.0, 104775.0, 29060.0, 9770.0, 3718.0, 1672.0, 859.0, 497.0, 279.0, 163.0, 108.0, 82.0, 57.0, 34.0, 23.0, 16.0, 14.0, 15.0, 11.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.75390625, -2.668701171875, -2.58349609375, -2.498291015625, -2.4130859375, -2.327880859375, -2.24267578125, -2.157470703125, -2.072265625, -1.987060546875, -1.90185546875, -1.816650390625, -1.7314453125, -1.646240234375, -1.56103515625, -1.475830078125, -1.390625, -1.305419921875, -1.22021484375, -1.135009765625, -1.0498046875, -0.964599609375, -0.87939453125, -0.794189453125, -0.708984375, -0.623779296875, -0.53857421875, -0.453369140625, -0.3681640625, -0.282958984375, -0.19775390625, -0.112548828125, -0.02734375, 0.057861328125, 0.14306640625, 0.228271484375, 0.3134765625, 0.398681640625, 0.48388671875, 0.569091796875, 0.654296875, 0.739501953125, 0.82470703125, 0.909912109375, 0.9951171875, 1.080322265625, 1.16552734375, 1.250732421875, 1.3359375, 1.421142578125, 1.50634765625, 1.591552734375, 1.6767578125, 1.761962890625, 1.84716796875, 1.932373046875, 2.017578125, 2.102783203125, 2.18798828125, 2.273193359375, 2.3583984375, 2.443603515625, 2.52880859375, 2.614013671875, 2.69921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 6.0, 6.0, 6.0, 7.0, 13.0, 11.0, 8.0, 22.0, 18.0, 15.0, 32.0, 28.0, 24.0, 41.0, 55.0, 61.0, 71.0, 77.0, 67.0, 77.0, 71.0, 54.0, 42.0, 28.0, 28.0, 24.0, 24.0, 12.0, 12.0, 11.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.74609375, -2.660247802734375, -2.57440185546875, -2.488555908203125, -2.4027099609375, -2.316864013671875, -2.23101806640625, -2.145172119140625, -2.059326171875, -1.973480224609375, -1.88763427734375, -1.801788330078125, -1.7159423828125, -1.630096435546875, -1.54425048828125, -1.458404541015625, -1.37255859375, -1.286712646484375, -1.20086669921875, -1.115020751953125, -1.0291748046875, -0.943328857421875, -0.85748291015625, -0.771636962890625, -0.685791015625, -0.599945068359375, -0.51409912109375, -0.428253173828125, -0.3424072265625, -0.256561279296875, -0.17071533203125, -0.084869384765625, 0.0009765625, 0.086822509765625, 0.17266845703125, 0.258514404296875, 0.3443603515625, 0.430206298828125, 0.51605224609375, 0.601898193359375, 0.687744140625, 0.773590087890625, 0.85943603515625, 0.945281982421875, 1.0311279296875, 1.116973876953125, 1.20281982421875, 1.288665771484375, 1.37451171875, 1.460357666015625, 1.54620361328125, 1.632049560546875, 1.7178955078125, 1.803741455078125, 1.88958740234375, 1.975433349609375, 2.061279296875, 2.147125244140625, 2.23297119140625, 2.318817138671875, 2.4046630859375, 2.490509033203125, 2.57635498046875, 2.662200927734375, 2.748046875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 24.0, 71.0, 234.0, 434.0, 130.0, 54.0, 29.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-160.96388244628906, -155.81455993652344, -150.66525268554688, -145.51593017578125, -140.3666229248047, -135.21730041503906, -130.0679931640625, -124.91867065429688, -119.76934814453125, -114.62003326416016, -109.47071838378906, -104.32139587402344, -99.17208099365234, -94.02276611328125, -88.87345123291016, -83.72413635253906, -78.57482147216797, -73.42550659179688, -68.27619171142578, -63.12687301635742, -57.97755432128906, -52.82823944091797, -47.678924560546875, -42.529605865478516, -37.38029098510742, -32.23097610473633, -27.08165740966797, -21.932342529296875, -16.78302574157715, -11.633708953857422, -6.484394073486328, -1.3350753784179688, 3.814239501953125, 8.963556289672852, 14.112872123718262, 19.262187957763672, 24.4115047454834, 29.560821533203125, 34.71013641357422, 39.85945510864258, 45.00876998901367, 50.158084869384766, 55.307403564453125, 60.45671844482422, 65.60603332519531, 70.75535583496094, 75.9046630859375, 81.05398559570312, 86.20330047607422, 91.35261535644531, 96.5019302368164, 101.6512451171875, 106.80056762695312, 111.94988250732422, 117.09919738769531, 122.24851989746094, 127.3978271484375, 132.54714965820312, 137.6964569091797, 142.8457794189453, 147.99508666992188, 153.1444091796875, 158.29373168945312, 163.4430389404297, 168.5923614501953]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 2.0, 4.0, 1.0, 6.0, 5.0, 5.0, 10.0, 8.0, 8.0, 24.0, 17.0, 15.0, 21.0, 20.0, 22.0, 29.0, 29.0, 32.0, 38.0, 60.0, 68.0, 79.0, 90.0, 69.0, 51.0, 30.0, 40.0, 26.0, 24.0, 27.0, 21.0, 21.0, 13.0, 14.0, 14.0, 8.0, 11.0, 13.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-74.34905242919922, -72.20501708984375, -70.06098937988281, -67.91695404052734, -65.77291870117188, -63.628883361816406, -61.4848518371582, -59.3408203125, -57.19678497314453, -55.05274963378906, -52.90871810913086, -50.764686584472656, -48.62065124511719, -46.47661590576172, -44.332584381103516, -42.18855285644531, -40.044517517089844, -37.900482177734375, -35.75645065307617, -33.61241912841797, -31.4683837890625, -29.324350357055664, -27.180316925048828, -25.036283493041992, -22.892250061035156, -20.74821662902832, -18.604183197021484, -16.46014976501465, -14.316116333007812, -12.172082901000977, -10.02804946899414, -7.884016036987305, -5.739982604980469, -3.595949172973633, -1.4519157409667969, 0.6921176910400391, 2.836151123046875, 4.980184555053711, 7.124217987060547, 9.268251419067383, 11.412284851074219, 13.556318283081055, 15.70035171508789, 17.844385147094727, 19.988418579101562, 22.1324520111084, 24.276485443115234, 26.42051887512207, 28.564552307128906, 30.708585739135742, 32.85261917114258, 34.99665069580078, 37.14068603515625, 39.28472137451172, 41.42875289916992, 43.572784423828125, 45.716819763183594, 47.86085510253906, 50.004886627197266, 52.14891815185547, 54.29295349121094, 56.436988830566406, 58.58102035522461, 60.72505187988281, 62.86908721923828]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 5.0, 10.0, 18.0, 24.0, 50.0, 67.0, 74.0, 136.0, 195.0, 374.0, 631.0, 1151.0, 2486.0, 5726.0, 15197.0, 47923.0, 193835.0, 890053.0, 2045975.0, 756997.0, 166595.0, 42954.0, 13734.0, 5236.0, 2254.0, 1065.0, 637.0, 340.0, 191.0, 119.0, 91.0, 38.0, 37.0, 20.0, 11.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.953125, -7.7001953125, -7.447265625, -7.1943359375, -6.94140625, -6.6884765625, -6.435546875, -6.1826171875, -5.9296875, -5.6767578125, -5.423828125, -5.1708984375, -4.91796875, -4.6650390625, -4.412109375, -4.1591796875, -3.90625, -3.6533203125, -3.400390625, -3.1474609375, -2.89453125, -2.6416015625, -2.388671875, -2.1357421875, -1.8828125, -1.6298828125, -1.376953125, -1.1240234375, -0.87109375, -0.6181640625, -0.365234375, -0.1123046875, 0.140625, 0.3935546875, 0.646484375, 0.8994140625, 1.15234375, 1.4052734375, 1.658203125, 1.9111328125, 2.1640625, 2.4169921875, 2.669921875, 2.9228515625, 3.17578125, 3.4287109375, 3.681640625, 3.9345703125, 4.1875, 4.4404296875, 4.693359375, 4.9462890625, 5.19921875, 5.4521484375, 5.705078125, 5.9580078125, 6.2109375, 6.4638671875, 6.716796875, 6.9697265625, 7.22265625, 7.4755859375, 7.728515625, 7.9814453125, 8.234375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 4.0, 14.0, 15.0, 20.0, 16.0, 24.0, 18.0, 23.0, 38.0, 45.0, 47.0, 43.0, 46.0, 53.0, 58.0, 54.0, 42.0, 49.0, 53.0, 47.0, 39.0, 38.0, 29.0, 27.0, 30.0, 18.0, 25.0, 18.0, 14.0, 15.0, 5.0, 11.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.68701171875, -4.5224609375, -4.35791015625, -4.193359375, -4.02880859375, -3.8642578125, -3.69970703125, -3.53515625, -3.37060546875, -3.2060546875, -3.04150390625, -2.876953125, -2.71240234375, -2.5478515625, -2.38330078125, -2.21875, -2.05419921875, -1.8896484375, -1.72509765625, -1.560546875, -1.39599609375, -1.2314453125, -1.06689453125, -0.90234375, -0.73779296875, -0.5732421875, -0.40869140625, -0.244140625, -0.07958984375, 0.0849609375, 0.24951171875, 0.4140625, 0.57861328125, 0.7431640625, 0.90771484375, 1.072265625, 1.23681640625, 1.4013671875, 1.56591796875, 1.73046875, 1.89501953125, 2.0595703125, 2.22412109375, 2.388671875, 2.55322265625, 2.7177734375, 2.88232421875, 3.046875, 3.21142578125, 3.3759765625, 3.54052734375, 3.705078125, 3.86962890625, 4.0341796875, 4.19873046875, 4.36328125, 4.52783203125, 4.6923828125, 4.85693359375, 5.021484375, 5.18603515625, 5.3505859375, 5.51513671875, 5.6796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 12.0, 11.0, 21.0, 36.0, 46.0, 92.0, 164.0, 389.0, 1116.0, 5586.0, 324932.0, 3844292.0, 14651.0, 1858.0, 573.0, 242.0, 108.0, 70.0, 28.0, 15.0, 7.0, 6.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.60205078125, -33.1103515625, -31.61865234375, -30.126953125, -28.63525390625, -27.1435546875, -25.65185546875, -24.16015625, -22.66845703125, -21.1767578125, -19.68505859375, -18.193359375, -16.70166015625, -15.2099609375, -13.71826171875, -12.2265625, -10.73486328125, -9.2431640625, -7.75146484375, -6.259765625, -4.76806640625, -3.2763671875, -1.78466796875, -0.29296875, 1.19873046875, 2.6904296875, 4.18212890625, 5.673828125, 7.16552734375, 8.6572265625, 10.14892578125, 11.640625, 13.13232421875, 14.6240234375, 16.11572265625, 17.607421875, 19.09912109375, 20.5908203125, 22.08251953125, 23.57421875, 25.06591796875, 26.5576171875, 28.04931640625, 29.541015625, 31.03271484375, 32.5244140625, 34.01611328125, 35.5078125, 36.99951171875, 38.4912109375, 39.98291015625, 41.474609375, 42.96630859375, 44.4580078125, 45.94970703125, 47.44140625, 48.93310546875, 50.4248046875, 51.91650390625, 53.408203125, 54.89990234375, 56.3916015625, 57.88330078125, 59.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 7.0, 14.0, 15.0, 23.0, 38.0, 56.0, 76.0, 95.0, 140.0, 180.0, 292.0, 388.0, 507.0, 564.0, 493.0, 373.0, 268.0, 170.0, 106.0, 89.0, 57.0, 31.0, 30.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.609375, -18.0841064453125, -17.558837890625, -17.0335693359375, -16.50830078125, -15.9830322265625, -15.457763671875, -14.9324951171875, -14.4072265625, -13.8819580078125, -13.356689453125, -12.8314208984375, -12.30615234375, -11.7808837890625, -11.255615234375, -10.7303466796875, -10.205078125, -9.6798095703125, -9.154541015625, -8.6292724609375, -8.10400390625, -7.5787353515625, -7.053466796875, -6.5281982421875, -6.0029296875, -5.4776611328125, -4.952392578125, -4.4271240234375, -3.90185546875, -3.3765869140625, -2.851318359375, -2.3260498046875, -1.80078125, -1.2755126953125, -0.750244140625, -0.2249755859375, 0.30029296875, 0.8255615234375, 1.350830078125, 1.8760986328125, 2.4013671875, 2.9266357421875, 3.451904296875, 3.9771728515625, 4.50244140625, 5.0277099609375, 5.552978515625, 6.0782470703125, 6.603515625, 7.1287841796875, 7.654052734375, 8.1793212890625, 8.70458984375, 9.2298583984375, 9.755126953125, 10.2803955078125, 10.8056640625, 11.3309326171875, 11.856201171875, 12.3814697265625, 12.90673828125, 13.4320068359375, 13.957275390625, 14.4825439453125, 15.0078125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 21.0, 37.0, 100.0, 192.0, 242.0, 208.0, 107.0, 41.0, 13.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.9296875, -263.7324523925781, -254.5352020263672, -245.3379669189453, -236.14073181152344, -226.9434814453125, -217.74624633789062, -208.54901123046875, -199.35177612304688, -190.154541015625, -180.95729064941406, -171.7600555419922, -162.5628204345703, -153.36557006835938, -144.1683349609375, -134.97109985351562, -125.77384948730469, -116.57660675048828, -107.3793716430664, -98.18212890625, -88.98489379882812, -79.78765106201172, -70.59040832519531, -61.39317321777344, -52.19593048095703, -42.99869155883789, -33.80145263671875, -24.604209899902344, -15.406970977783203, -6.2097320556640625, 2.9875106811523438, 12.184745788574219, 21.381988525390625, 30.579227447509766, 39.776466369628906, 48.97370910644531, 58.17094802856445, 67.3681869506836, 76.5654296875, 85.76266479492188, 94.95990753173828, 104.15715026855469, 113.35438537597656, 122.55162811279297, 131.74887084960938, 140.94610595703125, 150.14334106445312, 159.340576171875, 168.53782653808594, 177.7350616455078, 186.93231201171875, 196.12954711914062, 205.3267822265625, 214.52401733398438, 223.7212677001953, 232.9185028076172, 242.11575317382812, 251.31298828125, 260.5102233886719, 269.70745849609375, 278.90472412109375, 288.1019592285156, 297.2991943359375, 306.4964294433594, 315.69366455078125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 10.0, 19.0, 19.0, 25.0, 16.0, 27.0, 33.0, 32.0, 32.0, 46.0, 51.0, 49.0, 49.0, 64.0, 55.0, 46.0, 38.0, 51.0, 29.0, 40.0, 26.0, 30.0, 37.0, 21.0, 21.0, 16.0, 10.0, 7.0, 8.0, 10.0, 3.0, 5.0, 9.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.403629302978516, -58.99705505371094, -56.590476989746094, -54.183902740478516, -51.77732849121094, -49.37075424194336, -46.96417999267578, -44.55760192871094, -42.15102767944336, -39.74445343017578, -37.33787536621094, -34.93130111694336, -32.52472686767578, -30.118152618408203, -27.711576461791992, -25.30500030517578, -22.898426055908203, -20.491851806640625, -18.085275650024414, -15.67870044708252, -13.272125244140625, -10.86555004119873, -8.458974838256836, -6.052398681640625, -3.645824432373047, -1.2392492294311523, 1.1673259735107422, 3.5739011764526367, 5.980476379394531, 8.387051582336426, 10.79362678527832, 13.200202941894531, 15.606773376464844, 18.013347625732422, 20.419923782348633, 22.826499938964844, 25.233074188232422, 27.6396484375, 30.04622459411621, 32.45280075073242, 34.859375, 37.26594924926758, 39.672523498535156, 42.0791015625, 44.48567581176758, 46.892250061035156, 49.298828125, 51.70540237426758, 54.111976623535156, 56.518550872802734, 58.92512512207031, 61.331703186035156, 63.738277435302734, 66.14485168457031, 68.55142974853516, 70.9580078125, 73.36457824707031, 75.77115631103516, 78.17772674560547, 80.58430480957031, 82.99087524414062, 85.39745330810547, 87.80403137207031, 90.21060180664062, 92.61717987060547]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 6.0, 18.0, 16.0, 29.0, 28.0, 58.0, 78.0, 135.0, 204.0, 359.0, 667.0, 1314.0, 2511.0, 5482.0, 13046.0, 35253.0, 114738.0, 527066.0, 247381.0, 62976.0, 21072.0, 8485.0, 3675.0, 1753.0, 885.0, 515.0, 298.0, 169.0, 101.0, 66.0, 48.0, 24.0, 27.0, 19.0, 11.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.65625, -6.43255615234375, -6.2088623046875, -5.98516845703125, -5.761474609375, -5.53778076171875, -5.3140869140625, -5.09039306640625, -4.86669921875, -4.64300537109375, -4.4193115234375, -4.19561767578125, -3.971923828125, -3.74822998046875, -3.5245361328125, -3.30084228515625, -3.0771484375, -2.85345458984375, -2.6297607421875, -2.40606689453125, -2.182373046875, -1.95867919921875, -1.7349853515625, -1.51129150390625, -1.28759765625, -1.06390380859375, -0.8402099609375, -0.61651611328125, -0.392822265625, -0.16912841796875, 0.0545654296875, 0.27825927734375, 0.501953125, 0.72564697265625, 0.9493408203125, 1.17303466796875, 1.396728515625, 1.62042236328125, 1.8441162109375, 2.06781005859375, 2.29150390625, 2.51519775390625, 2.7388916015625, 2.96258544921875, 3.186279296875, 3.40997314453125, 3.6336669921875, 3.85736083984375, 4.0810546875, 4.30474853515625, 4.5284423828125, 4.75213623046875, 4.975830078125, 5.19952392578125, 5.4232177734375, 5.64691162109375, 5.87060546875, 6.09429931640625, 6.3179931640625, 6.54168701171875, 6.765380859375, 6.98907470703125, 7.2127685546875, 7.43646240234375, 7.66015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 15.0, 5.0, 27.0, 19.0, 24.0, 22.0, 33.0, 42.0, 39.0, 34.0, 50.0, 70.0, 71.0, 59.0, 57.0, 59.0, 47.0, 48.0, 48.0, 30.0, 34.0, 28.0, 37.0, 23.0, 13.0, 8.0, 9.0, 6.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.91009521484375, -6.6600341796875, -6.40997314453125, -6.159912109375, -5.90985107421875, -5.6597900390625, -5.40972900390625, -5.15966796875, -4.90960693359375, -4.6595458984375, -4.40948486328125, -4.159423828125, -3.90936279296875, -3.6593017578125, -3.40924072265625, -3.1591796875, -2.90911865234375, -2.6590576171875, -2.40899658203125, -2.158935546875, -1.90887451171875, -1.6588134765625, -1.40875244140625, -1.15869140625, -0.90863037109375, -0.6585693359375, -0.40850830078125, -0.158447265625, 0.09161376953125, 0.3416748046875, 0.59173583984375, 0.841796875, 1.09185791015625, 1.3419189453125, 1.59197998046875, 1.842041015625, 2.09210205078125, 2.3421630859375, 2.59222412109375, 2.84228515625, 3.09234619140625, 3.3424072265625, 3.59246826171875, 3.842529296875, 4.09259033203125, 4.3426513671875, 4.59271240234375, 4.8427734375, 5.09283447265625, 5.3428955078125, 5.59295654296875, 5.843017578125, 6.09307861328125, 6.3431396484375, 6.59320068359375, 6.84326171875, 7.09332275390625, 7.3433837890625, 7.59344482421875, 7.843505859375, 8.09356689453125, 8.3436279296875, 8.59368896484375, 8.84375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 17.0, 26.0, 34.0, 45.0, 75.0, 137.0, 223.0, 478.0, 1133.0, 3974.0, 22104.0, 770837.0, 227364.0, 17043.0, 3072.0, 1017.0, 446.0, 216.0, 107.0, 63.0, 45.0, 22.0, 27.0, 17.0, 9.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5703125, -13.1453857421875, -12.720458984375, -12.2955322265625, -11.87060546875, -11.4456787109375, -11.020751953125, -10.5958251953125, -10.1708984375, -9.7459716796875, -9.321044921875, -8.8961181640625, -8.47119140625, -8.0462646484375, -7.621337890625, -7.1964111328125, -6.771484375, -6.3465576171875, -5.921630859375, -5.4967041015625, -5.07177734375, -4.6468505859375, -4.221923828125, -3.7969970703125, -3.3720703125, -2.9471435546875, -2.522216796875, -2.0972900390625, -1.67236328125, -1.2474365234375, -0.822509765625, -0.3975830078125, 0.02734375, 0.4522705078125, 0.877197265625, 1.3021240234375, 1.72705078125, 2.1519775390625, 2.576904296875, 3.0018310546875, 3.4267578125, 3.8516845703125, 4.276611328125, 4.7015380859375, 5.12646484375, 5.5513916015625, 5.976318359375, 6.4012451171875, 6.826171875, 7.2510986328125, 7.676025390625, 8.1009521484375, 8.52587890625, 8.9508056640625, 9.375732421875, 9.8006591796875, 10.2255859375, 10.6505126953125, 11.075439453125, 11.5003662109375, 11.92529296875, 12.3502197265625, 12.775146484375, 13.2000732421875, 13.625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 6.0, 13.0, 15.0, 15.0, 9.0, 23.0, 26.0, 35.0, 34.0, 32.0, 50.0, 70.0, 69.0, 93.0, 73.0, 71.0, 63.0, 57.0, 49.0, 42.0, 18.0, 17.0, 24.0, 21.0, 16.0, 11.0, 11.0, 7.0, 9.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.3125, -26.434814453125, -25.55712890625, -24.679443359375, -23.8017578125, -22.924072265625, -22.04638671875, -21.168701171875, -20.291015625, -19.413330078125, -18.53564453125, -17.657958984375, -16.7802734375, -15.902587890625, -15.02490234375, -14.147216796875, -13.26953125, -12.391845703125, -11.51416015625, -10.636474609375, -9.7587890625, -8.881103515625, -8.00341796875, -7.125732421875, -6.248046875, -5.370361328125, -4.49267578125, -3.614990234375, -2.7373046875, -1.859619140625, -0.98193359375, -0.104248046875, 0.7734375, 1.651123046875, 2.52880859375, 3.406494140625, 4.2841796875, 5.161865234375, 6.03955078125, 6.917236328125, 7.794921875, 8.672607421875, 9.55029296875, 10.427978515625, 11.3056640625, 12.183349609375, 13.06103515625, 13.938720703125, 14.81640625, 15.694091796875, 16.57177734375, 17.449462890625, 18.3271484375, 19.204833984375, 20.08251953125, 20.960205078125, 21.837890625, 22.715576171875, 23.59326171875, 24.470947265625, 25.3486328125, 26.226318359375, 27.10400390625, 27.981689453125, 28.859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 1.0, 6.0, 8.0, 10.0, 8.0, 16.0, 26.0, 35.0, 60.0, 72.0, 99.0, 125.0, 234.0, 372.0, 670.0, 1223.0, 2480.0, 5296.0, 13273.0, 37207.0, 165597.0, 728211.0, 60086.0, 18745.0, 7516.0, 3368.0, 1609.0, 885.0, 440.0, 288.0, 156.0, 120.0, 78.0, 54.0, 55.0, 29.0, 27.0, 15.0, 15.0, 11.0, 7.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4765625, -1.43206787109375, -1.3875732421875, -1.34307861328125, -1.298583984375, -1.25408935546875, -1.2095947265625, -1.16510009765625, -1.12060546875, -1.07611083984375, -1.0316162109375, -0.98712158203125, -0.942626953125, -0.89813232421875, -0.8536376953125, -0.80914306640625, -0.7646484375, -0.72015380859375, -0.6756591796875, -0.63116455078125, -0.586669921875, -0.54217529296875, -0.4976806640625, -0.45318603515625, -0.40869140625, -0.36419677734375, -0.3197021484375, -0.27520751953125, -0.230712890625, -0.18621826171875, -0.1417236328125, -0.09722900390625, -0.052734375, -0.00823974609375, 0.0362548828125, 0.08074951171875, 0.125244140625, 0.16973876953125, 0.2142333984375, 0.25872802734375, 0.30322265625, 0.34771728515625, 0.3922119140625, 0.43670654296875, 0.481201171875, 0.52569580078125, 0.5701904296875, 0.61468505859375, 0.6591796875, 0.70367431640625, 0.7481689453125, 0.79266357421875, 0.837158203125, 0.88165283203125, 0.9261474609375, 0.97064208984375, 1.01513671875, 1.05963134765625, 1.1041259765625, 1.14862060546875, 1.193115234375, 1.23760986328125, 1.2821044921875, 1.32659912109375, 1.37109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 2.0, 6.0, 5.0, 12.0, 14.0, 14.0, 32.0, 35.0, 56.0, 88.0, 154.0, 186.0, 149.0, 74.0, 54.0, 34.0, 16.0, 6.0, 19.0, 8.0, 5.0, 3.0, 6.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006451606750488281, -0.0006232038140296936, -0.0006012469530105591, -0.0005792900919914246, -0.00055733323097229, -0.0005353763699531555, -0.000513419508934021, -0.0004914626479148865, -0.00046950578689575195, -0.00044754892587661743, -0.0004255920648574829, -0.0004036352038383484, -0.00038167834281921387, -0.00035972148180007935, -0.0003377646207809448, -0.0003158077597618103, -0.0002938508987426758, -0.00027189403772354126, -0.00024993717670440674, -0.00022798031568527222, -0.0002060234546661377, -0.00018406659364700317, -0.00016210973262786865, -0.00014015287160873413, -0.00011819601058959961, -9.623914957046509e-05, -7.428228855133057e-05, -5.2325427532196045e-05, -3.0368566513061523e-05, -8.411705493927002e-06, 1.354515552520752e-05, 3.550201654434204e-05, 5.745887756347656e-05, 7.941573858261108e-05, 0.0001013725996017456, 0.00012332946062088013, 0.00014528632164001465, 0.00016724318265914917, 0.0001892000436782837, 0.0002111569046974182, 0.00023311376571655273, 0.00025507062673568726, 0.0002770274877548218, 0.0002989843487739563, 0.0003209412097930908, 0.00034289807081222534, 0.00036485493183135986, 0.0003868117928504944, 0.0004087686538696289, 0.00043072551488876343, 0.00045268237590789795, 0.00047463923692703247, 0.000496596097946167, 0.0005185529589653015, 0.000540509819984436, 0.0005624666810035706, 0.0005844235420227051, 0.0006063804030418396, 0.0006283372640609741, 0.0006502941250801086, 0.0006722509860992432, 0.0006942078471183777, 0.0007161647081375122, 0.0007381215691566467, 0.0007600784301757812]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 16.0, 16.0, 24.0, 38.0, 44.0, 84.0, 110.0, 207.0, 344.0, 600.0, 1272.0, 2814.0, 6892.0, 19365.0, 75892.0, 806085.0, 97802.0, 22853.0, 7929.0, 3138.0, 1415.0, 669.0, 352.0, 181.0, 134.0, 88.0, 49.0, 29.0, 22.0, 23.0, 12.0, 13.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.17828369140625, -2.1046142578125, -2.03094482421875, -1.957275390625, -1.88360595703125, -1.8099365234375, -1.73626708984375, -1.66259765625, -1.58892822265625, -1.5152587890625, -1.44158935546875, -1.367919921875, -1.29425048828125, -1.2205810546875, -1.14691162109375, -1.0732421875, -0.99957275390625, -0.9259033203125, -0.85223388671875, -0.778564453125, -0.70489501953125, -0.6312255859375, -0.55755615234375, -0.48388671875, -0.41021728515625, -0.3365478515625, -0.26287841796875, -0.189208984375, -0.11553955078125, -0.0418701171875, 0.03179931640625, 0.10546875, 0.17913818359375, 0.2528076171875, 0.32647705078125, 0.400146484375, 0.47381591796875, 0.5474853515625, 0.62115478515625, 0.69482421875, 0.76849365234375, 0.8421630859375, 0.91583251953125, 0.989501953125, 1.06317138671875, 1.1368408203125, 1.21051025390625, 1.2841796875, 1.35784912109375, 1.4315185546875, 1.50518798828125, 1.578857421875, 1.65252685546875, 1.7261962890625, 1.79986572265625, 1.87353515625, 1.94720458984375, 2.0208740234375, 2.09454345703125, 2.168212890625, 2.24188232421875, 2.3155517578125, 2.38922119140625, 2.462890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 6.0, 7.0, 8.0, 9.0, 14.0, 17.0, 13.0, 17.0, 24.0, 47.0, 42.0, 65.0, 102.0, 122.0, 112.0, 107.0, 55.0, 54.0, 39.0, 26.0, 26.0, 16.0, 10.0, 14.0, 10.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.320404052734375, -2.25213623046875, -2.183868408203125, -2.1156005859375, -2.047332763671875, -1.97906494140625, -1.910797119140625, -1.842529296875, -1.774261474609375, -1.70599365234375, -1.637725830078125, -1.5694580078125, -1.501190185546875, -1.43292236328125, -1.364654541015625, -1.29638671875, -1.228118896484375, -1.15985107421875, -1.091583251953125, -1.0233154296875, -0.955047607421875, -0.88677978515625, -0.818511962890625, -0.750244140625, -0.681976318359375, -0.61370849609375, -0.545440673828125, -0.4771728515625, -0.408905029296875, -0.34063720703125, -0.272369384765625, -0.2041015625, -0.135833740234375, -0.06756591796875, 0.000701904296875, 0.0689697265625, 0.137237548828125, 0.20550537109375, 0.273773193359375, 0.342041015625, 0.410308837890625, 0.47857666015625, 0.546844482421875, 0.6151123046875, 0.683380126953125, 0.75164794921875, 0.819915771484375, 0.88818359375, 0.956451416015625, 1.02471923828125, 1.092987060546875, 1.1612548828125, 1.229522705078125, 1.29779052734375, 1.366058349609375, 1.434326171875, 1.502593994140625, 1.57086181640625, 1.639129638671875, 1.7073974609375, 1.775665283203125, 1.84393310546875, 1.912200927734375, 1.98046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 27.0, 32.0, 68.0, 193.0, 419.0, 127.0, 61.0, 28.0, 15.0, 9.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.74527740478516, -116.0442123413086, -112.34315490722656, -108.64208984375, -104.94103240966797, -101.2399673461914, -97.53890991210938, -93.83784484863281, -90.13678741455078, -86.43572235107422, -82.73466491699219, -79.03359985351562, -75.3325424194336, -71.63147735595703, -67.930419921875, -64.22935485839844, -60.52829360961914, -56.827232360839844, -53.12617111206055, -49.42510986328125, -45.72404861450195, -42.022987365722656, -38.321922302246094, -34.62086486816406, -30.919801712036133, -27.218740463256836, -23.51767921447754, -19.81661605834961, -16.115554809570312, -12.414493560791016, -8.713432312011719, -5.012371063232422, -1.311309814453125, 2.389751672744751, 6.090813159942627, 9.791874885559082, 13.492936134338379, 17.193998336791992, 20.89505958557129, 24.596120834350586, 28.297182083129883, 31.99824333190918, 35.69930648803711, 39.400367736816406, 43.1014289855957, 46.802490234375, 50.5035514831543, 54.204612731933594, 57.90567398071289, 61.60673522949219, 65.30780029296875, 69.00885772705078, 72.70992279052734, 76.41098022460938, 80.11204528808594, 83.81310272216797, 87.51416778564453, 91.2152328491211, 94.91629028320312, 98.61735534667969, 102.31841278076172, 106.01947784423828, 109.72053527832031, 113.42160034179688, 117.1226577758789]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 8.0, 7.0, 15.0, 22.0, 15.0, 22.0, 18.0, 22.0, 30.0, 44.0, 79.0, 99.0, 100.0, 112.0, 100.0, 72.0, 38.0, 14.0, 20.0, 23.0, 19.0, 14.0, 17.0, 15.0, 12.0, 8.0, 11.0, 1.0, 5.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-81.29576110839844, -79.1492691040039, -77.00277709960938, -74.85628509521484, -72.70979309082031, -70.56330871582031, -68.41681671142578, -66.27032470703125, -64.12383270263672, -61.97734069824219, -59.830848693847656, -57.68436050415039, -55.53786849975586, -53.39137649536133, -51.24488830566406, -49.09839630126953, -46.951904296875, -44.80541229248047, -42.65892028808594, -40.51243209838867, -38.36594009399414, -36.21944808959961, -34.072959899902344, -31.926467895507812, -29.77997589111328, -27.63348388671875, -25.48699378967285, -23.340503692626953, -21.194011688232422, -19.04751968383789, -16.901029586791992, -14.754538536071777, -12.608051300048828, -10.461560249328613, -8.315069198608398, -6.168578147888184, -4.022087097167969, -1.875596046447754, 0.27089500427246094, 2.417386054992676, 4.563877105712891, 6.7103681564331055, 8.85685920715332, 11.003350257873535, 13.14984130859375, 15.296332359313965, 17.44282341003418, 19.589313507080078, 21.73580551147461, 23.88229751586914, 26.02878761291504, 28.175277709960938, 30.32176971435547, 32.46826171875, 34.61475372314453, 36.7612419128418, 38.90773391723633, 41.05422592163086, 43.200714111328125, 45.347206115722656, 47.49369812011719, 49.64019012451172, 51.78668212890625, 53.933170318603516, 56.07966232299805]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 9.0, 10.0, 12.0, 18.0, 21.0, 20.0, 30.0, 22.0, 26.0, 41.0, 61.0, 78.0, 172.0, 105.0, 59.0, 28.0, 31.0, 32.0, 23.0, 25.0, 22.0, 22.0, 18.0, 8.0, 12.0, 12.0, 12.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.88671875, -5.6810302734375, -5.475341796875, -5.2696533203125, -5.06396484375, -4.8582763671875, -4.652587890625, -4.4468994140625, -4.2412109375, -4.0355224609375, -3.829833984375, -3.6241455078125, -3.41845703125, -3.2127685546875, -3.007080078125, -2.8013916015625, -2.595703125, -2.3900146484375, -2.184326171875, -1.9786376953125, -1.77294921875, -1.5672607421875, -1.361572265625, -1.1558837890625, -0.9501953125, -0.7445068359375, -0.538818359375, -0.3331298828125, -0.12744140625, 0.0782470703125, 0.283935546875, 0.4896240234375, 0.6953125, 0.9010009765625, 1.106689453125, 1.3123779296875, 1.51806640625, 1.7237548828125, 1.929443359375, 2.1351318359375, 2.3408203125, 2.5465087890625, 2.752197265625, 2.9578857421875, 3.16357421875, 3.3692626953125, 3.574951171875, 3.7806396484375, 3.986328125, 4.1920166015625, 4.397705078125, 4.6033935546875, 4.80908203125, 5.0147705078125, 5.220458984375, 5.4261474609375, 5.6318359375, 5.8375244140625, 6.043212890625, 6.2489013671875, 6.45458984375, 6.6602783203125, 6.865966796875, 7.0716552734375, 7.27734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 1.0, 1.0, 11.0, 9.0, 11.0, 17.0, 21.0, 27.0, 23.0, 47.0, 84.0, 248.0, 613.0, 1922.0, 7562.0, 329895.0, 8035202.0, 9407.0, 2208.0, 678.0, 258.0, 119.0, 70.0, 33.0, 25.0, 24.0, 14.0, 9.0, 10.0, 8.0, 2.0, 1.0, 5.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0], "bins": [-55.632381439208984, -54.20823669433594, -52.784088134765625, -51.35994338989258, -49.93579864501953, -48.51165008544922, -47.08750534057617, -45.663360595703125, -44.23921203613281, -42.815067291259766, -41.39091873168945, -39.966773986816406, -38.54262924194336, -37.11848449707031, -35.6943359375, -34.27019119262695, -32.846046447753906, -31.421899795532227, -29.99775505065918, -28.5736083984375, -27.149463653564453, -25.725317001342773, -24.301170349121094, -22.877025604248047, -21.452878952026367, -20.028732299804688, -18.60458755493164, -17.18044090270996, -15.756295204162598, -14.332149505615234, -12.908002853393555, -11.483857154846191, -10.059711456298828, -8.635565757751465, -7.211419582366943, -5.787273406982422, -4.363127708435059, -2.9389820098876953, -1.5148353576660156, -0.09068965911865234, 1.333456039428711, 2.7576019763946533, 4.181747913360596, 5.605894088745117, 7.0300397872924805, 8.454185485839844, 9.878332138061523, 11.302477836608887, 12.72662353515625, 14.150769233703613, 15.574914932250977, 16.999061584472656, 18.423206329345703, 19.847352981567383, 21.271499633789062, 22.69564437866211, 24.11979103088379, 25.54393768310547, 26.968082427978516, 28.392229080200195, 29.816375732421875, 31.240520477294922, 32.66466522216797, 34.08881378173828, 35.51295852661133]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 5.0, 5.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 7.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-64.3568344116211, -62.140445709228516, -59.92405700683594, -57.70766830444336, -55.49127960205078, -53.27488708496094, -51.05849838256836, -48.84210968017578, -46.6257209777832, -44.409332275390625, -42.19294357299805, -39.97655487060547, -37.760162353515625, -35.54377746582031, -33.32738494873047, -31.11099624633789, -28.894607543945312, -26.678218841552734, -24.461830139160156, -22.245439529418945, -20.029050827026367, -17.81266212463379, -15.596272468566895, -13.3798828125, -11.163494110107422, -8.947105407714844, -6.730715751647949, -4.514326572418213, -2.2979373931884766, -0.08154869079589844, 2.134840965270996, 4.351230621337891, 6.5676116943359375, 8.784000396728516, 11.00039005279541, 13.216779708862305, 15.433168411254883, 17.64955711364746, 19.865947723388672, 22.08233642578125, 24.298725128173828, 26.515113830566406, 28.731502532958984, 30.947893142700195, 33.164283752441406, 35.38066864013672, 37.59706115722656, 39.81344985961914, 42.02983856201172, 44.2462272644043, 46.462615966796875, 48.67900466918945, 50.89539337158203, 53.111785888671875, 55.32817459106445, 57.54456329345703, 59.76095199584961, 61.97734069824219, 64.19373321533203, 66.41011810302734, 68.62651062011719, 70.8428955078125, 73.05928802490234, 75.27568054199219, 77.4920654296875]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 8.0, 9.0, 17.0, 21.0, 15.0, 21.0, 30.0, 33.0, 35.0, 45.0, 44.0, 48.0, 55.0, 52.0, 58.0, 55.0, 64.0, 55.0, 52.0, 38.0, 35.0, 33.0, 27.0, 27.0, 18.0, 13.0, 12.0, 13.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.776611328125, -5.58447265625, -5.392333984375, -5.2001953125, -5.008056640625, -4.81591796875, -4.623779296875, -4.431640625, -4.239501953125, -4.04736328125, -3.855224609375, -3.6630859375, -3.470947265625, -3.27880859375, -3.086669921875, -2.89453125, -2.702392578125, -2.51025390625, -2.318115234375, -2.1259765625, -1.933837890625, -1.74169921875, -1.549560546875, -1.357421875, -1.165283203125, -0.97314453125, -0.781005859375, -0.5888671875, -0.396728515625, -0.20458984375, -0.012451171875, 0.1796875, 0.371826171875, 0.56396484375, 0.756103515625, 0.9482421875, 1.140380859375, 1.33251953125, 1.524658203125, 1.716796875, 1.908935546875, 2.10107421875, 2.293212890625, 2.4853515625, 2.677490234375, 2.86962890625, 3.061767578125, 3.25390625, 3.446044921875, 3.63818359375, 3.830322265625, 4.0224609375, 4.214599609375, 4.40673828125, 4.598876953125, 4.791015625, 4.983154296875, 5.17529296875, 5.367431640625, 5.5595703125, 5.751708984375, 5.94384765625, 6.135986328125, 6.328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 17.0, 24.0, 54.0, 64.0, 68.0, 168.0, 293.0, 470.0, 1016.0, 2372.0, 5990.0, 15436.0, 44074.0, 125406.0, 191216.0, 88723.0, 30476.0, 10903.0, 4130.0, 1663.0, 770.0, 381.0, 210.0, 126.0, 71.0, 39.0, 30.0, 19.0, 14.0, 7.0, 10.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.9375, -43.66552734375, -42.3935546875, -41.12158203125, -39.849609375, -38.57763671875, -37.3056640625, -36.03369140625, -34.76171875, -33.48974609375, -32.2177734375, -30.94580078125, -29.673828125, -28.40185546875, -27.1298828125, -25.85791015625, -24.5859375, -23.31396484375, -22.0419921875, -20.77001953125, -19.498046875, -18.22607421875, -16.9541015625, -15.68212890625, -14.41015625, -13.13818359375, -11.8662109375, -10.59423828125, -9.322265625, -8.05029296875, -6.7783203125, -5.50634765625, -4.234375, -2.96240234375, -1.6904296875, -0.41845703125, 0.853515625, 2.12548828125, 3.3974609375, 4.66943359375, 5.94140625, 7.21337890625, 8.4853515625, 9.75732421875, 11.029296875, 12.30126953125, 13.5732421875, 14.84521484375, 16.1171875, 17.38916015625, 18.6611328125, 19.93310546875, 21.205078125, 22.47705078125, 23.7490234375, 25.02099609375, 26.29296875, 27.56494140625, 28.8369140625, 30.10888671875, 31.380859375, 32.65283203125, 33.9248046875, 35.19677734375, 36.46875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 8.0, 8.0, 13.0, 16.0, 31.0, 17.0, 25.0, 26.0, 20.0, 35.0, 54.0, 68.0, 51.0, 68.0, 50.0, 65.0, 73.0, 55.0, 55.0, 42.0, 46.0, 41.0, 26.0, 21.0, 22.0, 12.0, 8.0, 13.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.910400390625, -5.70751953125, -5.504638671875, -5.3017578125, -5.098876953125, -4.89599609375, -4.693115234375, -4.490234375, -4.287353515625, -4.08447265625, -3.881591796875, -3.6787109375, -3.475830078125, -3.27294921875, -3.070068359375, -2.8671875, -2.664306640625, -2.46142578125, -2.258544921875, -2.0556640625, -1.852783203125, -1.64990234375, -1.447021484375, -1.244140625, -1.041259765625, -0.83837890625, -0.635498046875, -0.4326171875, -0.229736328125, -0.02685546875, 0.176025390625, 0.37890625, 0.581787109375, 0.78466796875, 0.987548828125, 1.1904296875, 1.393310546875, 1.59619140625, 1.799072265625, 2.001953125, 2.204833984375, 2.40771484375, 2.610595703125, 2.8134765625, 3.016357421875, 3.21923828125, 3.422119140625, 3.625, 3.827880859375, 4.03076171875, 4.233642578125, 4.4365234375, 4.639404296875, 4.84228515625, 5.045166015625, 5.248046875, 5.450927734375, 5.65380859375, 5.856689453125, 6.0595703125, 6.262451171875, 6.46533203125, 6.668212890625, 6.87109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 11.0, 13.0, 38.0, 91.0, 143.0, 74.0, 40.0, 21.0, 6.0, 5.0, 14.0, 4.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.96226501464844, -66.92040252685547, -64.87854766845703, -62.83668518066406, -60.79482650756836, -58.752967834472656, -56.71110534667969, -54.669246673583984, -52.62738800048828, -50.58552932739258, -48.543670654296875, -46.501808166503906, -44.4599494934082, -42.4180908203125, -40.37622833251953, -38.33436965942383, -36.292510986328125, -34.25065231323242, -32.20879364013672, -30.16693115234375, -28.125072479248047, -26.083213806152344, -24.041353225708008, -21.999492645263672, -19.95763397216797, -17.915775299072266, -15.87391471862793, -13.83205509185791, -11.79019546508789, -9.748335838317871, -7.706476211547852, -5.664616584777832, -3.6227645874023438, -1.5809049606323242, 0.4609546661376953, 2.502814292907715, 4.544673919677734, 6.586533546447754, 8.628393173217773, 10.670252799987793, 12.712112426757812, 14.753972053527832, 16.79583168029785, 18.837692260742188, 20.87955093383789, 22.921409606933594, 24.96327018737793, 27.005130767822266, 29.04698944091797, 31.088848114013672, 33.130706787109375, 35.172569274902344, 37.21442794799805, 39.25628662109375, 41.29814910888672, 43.34000778198242, 45.381866455078125, 47.42372512817383, 49.46558380126953, 51.5074462890625, 53.5493049621582, 55.591163635253906, 57.633026123046875, 59.67488479614258, 61.71674346923828]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 28.0, 34.0, 57.0, 72.0, 67.0, 68.0, 45.0, 20.0, 11.0, 8.0, 4.0, 3.0, 6.0, 10.0, 4.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-53.238895416259766, -51.81538391113281, -50.391876220703125, -48.96836471557617, -47.544857025146484, -46.12134552001953, -44.697837829589844, -43.27432632446289, -41.85081481933594, -40.427303314208984, -39.0037956237793, -37.580284118652344, -36.156776428222656, -34.7332649230957, -33.30975341796875, -31.886245727539062, -30.462738037109375, -29.039228439331055, -27.615718841552734, -26.19220733642578, -24.768699645996094, -23.34518814086914, -21.92167854309082, -20.4981689453125, -19.07465934753418, -17.65114974975586, -16.22764015197754, -14.804129600524902, -13.380620002746582, -11.957110404968262, -10.533599853515625, -9.110090255737305, -7.68658447265625, -6.26307487487793, -4.839564800262451, -3.4160547256469727, -1.9925451278686523, -0.569035530090332, 0.8544750213623047, 2.277984619140625, 3.7014942169189453, 5.125003814697266, 6.548513889312744, 7.972023963928223, 9.395533561706543, 10.819043159484863, 12.2425537109375, 13.66606330871582, 15.08957290649414, 16.51308250427246, 17.93659210205078, 19.360103607177734, 20.783611297607422, 22.207122802734375, 23.630632400512695, 25.054141998291016, 26.477651596069336, 27.901161193847656, 29.324670791625977, 30.748180389404297, 32.17169189453125, 33.59519958496094, 35.01871109008789, 36.442222595214844, 37.86573028564453]}, "eval/loss": 1.85287344455719, "eval/wer": 0.9976993256644189, "eval/runtime": 896.1552, "eval/samples_per_second": 2.948, "eval/steps_per_second": 0.369} \ No newline at end of file +{"train/loss": 0.0608, "train/learning_rate": 4.156769596199525e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 114529, "_timestamp": 1647708406, "_step": 17847, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 6.0, 15.0, 19.0, 22.0, 48.0, 65.0, 61.0, 84.0, 114.0, 110.0, 103.0, 76.0, 77.0, 49.0, 35.0, 19.0, 15.0, 16.0, 9.0, 7.0, 10.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.100801467895508, -26.244380950927734, -25.38796043395996, -24.531539916992188, -23.675119400024414, -22.81869888305664, -21.9622802734375, -21.105859756469727, -20.249439239501953, -19.39301872253418, -18.536598205566406, -17.680177688598633, -16.82375717163086, -15.967337608337402, -15.110917091369629, -14.254497528076172, -13.398076057434082, -12.541655540466309, -11.685235023498535, -10.828815460205078, -9.972394943237305, -9.115974426269531, -8.259553909301758, -7.403133869171143, -6.546713352203369, -5.690292835235596, -4.8338727951049805, -3.977452278137207, -3.1210319995880127, -2.2646117210388184, -1.408191204071045, -0.5517711639404297, 0.30464935302734375, 1.161069631576538, 2.0174899101257324, 2.873910427093506, 3.7303307056427, 4.5867509841918945, 5.443171501159668, 6.299591541290283, 7.156012058258057, 8.012432098388672, 8.868852615356445, 9.725273132324219, 10.581693649291992, 11.438114166259766, 12.294534683227539, 13.150954246520996, 14.00737476348877, 14.863795280456543, 15.720215797424316, 16.576635360717773, 17.433055877685547, 18.28947639465332, 19.145896911621094, 20.002317428588867, 20.85873794555664, 21.715158462524414, 22.571578979492188, 23.42799949645996, 24.284420013427734, 25.140838623046875, 25.99726104736328, 26.853679656982422, 27.710100173950195]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 13.0, 14.0, 18.0, 24.0, 29.0, 38.0, 54.0, 58.0, 64.0, 54.0, 61.0, 62.0, 63.0, 63.0, 54.0, 68.0, 43.0, 42.0, 37.0, 36.0, 24.0, 15.0, 15.0, 10.0, 5.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.098886489868164, -20.288461685180664, -19.478036880493164, -18.66761016845703, -17.85718536376953, -17.04676055908203, -16.23633575439453, -15.425910949707031, -14.615485191345215, -13.805060386657715, -12.994634628295898, -12.184209823608398, -11.373785018920898, -10.563359260559082, -9.752934455871582, -8.942508697509766, -8.132083892822266, -7.321658611297607, -6.511233329772949, -5.700808525085449, -4.890383243560791, -4.079957962036133, -3.269533157348633, -2.4591078758239746, -1.6486825942993164, -0.8382574319839478, -0.0278322696685791, 0.7825927734375, 1.5930180549621582, 2.4034433364868164, 3.2138681411743164, 4.024293422698975, 4.834716796875, 5.645142078399658, 6.455567359924316, 7.265992164611816, 8.076417922973633, 8.886842727661133, 9.697267532348633, 10.507692337036133, 11.31811809539795, 12.12854290008545, 12.938968658447266, 13.749393463134766, 14.559818267822266, 15.370244026184082, 16.180667877197266, 16.9910945892334, 17.8015193939209, 18.6119441986084, 19.4223690032959, 20.23279571533203, 21.04322052001953, 21.85364532470703, 22.66407012939453, 23.47449493408203, 24.28491973876953, 25.09534454345703, 25.90576934814453, 26.71619415283203, 27.526620864868164, 28.337045669555664, 29.147470474243164, 29.957895278930664, 30.768321990966797]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 8.0, 9.0, 16.0, 16.0, 30.0, 23.0, 38.0, 41.0, 47.0, 67.0, 64.0, 59.0, 52.0, 64.0, 59.0, 64.0, 69.0, 52.0, 27.0, 43.0, 26.0, 33.0, 21.0, 15.0, 14.0, 3.0, 8.0, 8.0, 5.0, 4.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.3742828369140625, -1.317901611328125, -1.2615203857421875, -1.20513916015625, -1.1487579345703125, -1.092376708984375, -1.0359954833984375, -0.9796142578125, -0.9232330322265625, -0.866851806640625, -0.8104705810546875, -0.75408935546875, -0.6977081298828125, -0.641326904296875, -0.5849456787109375, -0.528564453125, -0.4721832275390625, -0.415802001953125, -0.3594207763671875, -0.30303955078125, -0.2466583251953125, -0.190277099609375, -0.1338958740234375, -0.0775146484375, -0.0211334228515625, 0.035247802734375, 0.0916290283203125, 0.14801025390625, 0.2043914794921875, 0.260772705078125, 0.3171539306640625, 0.37353515625, 0.4299163818359375, 0.486297607421875, 0.5426788330078125, 0.59906005859375, 0.6554412841796875, 0.711822509765625, 0.7682037353515625, 0.8245849609375, 0.8809661865234375, 0.937347412109375, 0.9937286376953125, 1.05010986328125, 1.1064910888671875, 1.162872314453125, 1.2192535400390625, 1.275634765625, 1.3320159912109375, 1.388397216796875, 1.4447784423828125, 1.50115966796875, 1.5575408935546875, 1.613922119140625, 1.6703033447265625, 1.7266845703125, 1.7830657958984375, 1.839447021484375, 1.8958282470703125, 1.95220947265625, 2.0085906982421875, 2.064971923828125, 2.1213531494140625, 2.177734375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 15.0, 16.0, 30.0, 34.0, 41.0, 80.0, 131.0, 151.0, 344.0, 714.0, 1926.0, 6215.0, 26205.0, 199978.0, 3804105.0, 125763.0, 19798.0, 5179.0, 1791.0, 763.0, 362.0, 202.0, 134.0, 92.0, 56.0, 38.0, 24.0, 22.0, 17.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.3924560546875, -11.839599609375, -11.2867431640625, -10.73388671875, -10.1810302734375, -9.628173828125, -9.0753173828125, -8.5224609375, -7.9696044921875, -7.416748046875, -6.8638916015625, -6.31103515625, -5.7581787109375, -5.205322265625, -4.6524658203125, -4.099609375, -3.5467529296875, -2.993896484375, -2.4410400390625, -1.88818359375, -1.3353271484375, -0.782470703125, -0.2296142578125, 0.3232421875, 0.8760986328125, 1.428955078125, 1.9818115234375, 2.53466796875, 3.0875244140625, 3.640380859375, 4.1932373046875, 4.74609375, 5.2989501953125, 5.851806640625, 6.4046630859375, 6.95751953125, 7.5103759765625, 8.063232421875, 8.6160888671875, 9.1689453125, 9.7218017578125, 10.274658203125, 10.8275146484375, 11.38037109375, 11.9332275390625, 12.486083984375, 13.0389404296875, 13.591796875, 14.1446533203125, 14.697509765625, 15.2503662109375, 15.80322265625, 16.3560791015625, 16.908935546875, 17.4617919921875, 18.0146484375, 18.5675048828125, 19.120361328125, 19.6732177734375, 20.22607421875, 20.7789306640625, 21.331787109375, 21.8846435546875, 22.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 6.0, 15.0, 35.0, 68.0, 88.0, 197.0, 534.0, 1911.0, 663.0, 258.0, 125.0, 63.0, 40.0, 25.0, 19.0, 8.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9921875, -13.5498046875, -13.107421875, -12.6650390625, -12.22265625, -11.7802734375, -11.337890625, -10.8955078125, -10.453125, -10.0107421875, -9.568359375, -9.1259765625, -8.68359375, -8.2412109375, -7.798828125, -7.3564453125, -6.9140625, -6.4716796875, -6.029296875, -5.5869140625, -5.14453125, -4.7021484375, -4.259765625, -3.8173828125, -3.375, -2.9326171875, -2.490234375, -2.0478515625, -1.60546875, -1.1630859375, -0.720703125, -0.2783203125, 0.1640625, 0.6064453125, 1.048828125, 1.4912109375, 1.93359375, 2.3759765625, 2.818359375, 3.2607421875, 3.703125, 4.1455078125, 4.587890625, 5.0302734375, 5.47265625, 5.9150390625, 6.357421875, 6.7998046875, 7.2421875, 7.6845703125, 8.126953125, 8.5693359375, 9.01171875, 9.4541015625, 9.896484375, 10.3388671875, 10.78125, 11.2236328125, 11.666015625, 12.1083984375, 12.55078125, 12.9931640625, 13.435546875, 13.8779296875, 14.3203125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 17.0, 38.0, 40.0, 66.0, 94.0, 142.0, 256.0, 571.0, 1528.0, 5103.0, 24760.0, 246907.0, 3771734.0, 120822.0, 16099.0, 3772.0, 1178.0, 476.0, 235.0, 141.0, 101.0, 70.0, 39.0, 30.0, 21.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.58349609375, -36.3857421875, -35.18798828125, -33.990234375, -32.79248046875, -31.5947265625, -30.39697265625, -29.19921875, -28.00146484375, -26.8037109375, -25.60595703125, -24.408203125, -23.21044921875, -22.0126953125, -20.81494140625, -19.6171875, -18.41943359375, -17.2216796875, -16.02392578125, -14.826171875, -13.62841796875, -12.4306640625, -11.23291015625, -10.03515625, -8.83740234375, -7.6396484375, -6.44189453125, -5.244140625, -4.04638671875, -2.8486328125, -1.65087890625, -0.453125, 0.74462890625, 1.9423828125, 3.14013671875, 4.337890625, 5.53564453125, 6.7333984375, 7.93115234375, 9.12890625, 10.32666015625, 11.5244140625, 12.72216796875, 13.919921875, 15.11767578125, 16.3154296875, 17.51318359375, 18.7109375, 19.90869140625, 21.1064453125, 22.30419921875, 23.501953125, 24.69970703125, 25.8974609375, 27.09521484375, 28.29296875, 29.49072265625, 30.6884765625, 31.88623046875, 33.083984375, 34.28173828125, 35.4794921875, 36.67724609375, 37.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 15.0, 11.0, 16.0, 36.0, 54.0, 90.0, 97.0, 144.0, 154.0, 118.0, 78.0, 61.0, 31.0, 30.0, 27.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.96833801269531, -54.66822052001953, -53.36810302734375, -52.06798553466797, -50.76786804199219, -49.467750549316406, -48.167633056640625, -46.867515563964844, -45.56739807128906, -44.26728057861328, -42.9671630859375, -41.66704559326172, -40.36692810058594, -39.066810607910156, -37.766693115234375, -36.466575622558594, -35.16645431518555, -33.866336822509766, -32.566219329833984, -31.266101837158203, -29.965984344482422, -28.66586685180664, -27.365747451782227, -26.065629959106445, -24.765512466430664, -23.465394973754883, -22.1652774810791, -20.86515998840332, -19.565040588378906, -18.264923095703125, -16.964805603027344, -15.664688110351562, -14.364574432373047, -13.064456939697266, -11.764339447021484, -10.464221000671387, -9.164103507995605, -7.863986015319824, -6.563868045806885, -5.263750076293945, -3.963632583618164, -2.6635148525238037, -1.3633971214294434, -0.06327939033508301, 1.2368383407592773, 2.5369558334350586, 3.837073802947998, 5.1371917724609375, 6.437309265136719, 7.7374267578125, 9.037544250488281, 10.337662696838379, 11.63778018951416, 12.937897682189941, 14.238016128540039, 15.53813362121582, 16.8382511138916, 18.138368606567383, 19.438486099243164, 20.738603591918945, 22.03872299194336, 23.33884048461914, 24.638957977294922, 25.939075469970703, 27.239192962646484]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 16.0, 9.0, 18.0, 16.0, 14.0, 33.0, 21.0, 28.0, 30.0, 41.0, 50.0, 37.0, 39.0, 39.0, 40.0, 51.0, 35.0, 51.0, 41.0, 38.0, 31.0, 33.0, 35.0, 30.0, 27.0, 10.0, 18.0, 19.0, 26.0, 15.0, 12.0, 16.0, 10.0, 8.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.482481002807617, -20.81058120727539, -20.13867950439453, -19.466779708862305, -18.794879913330078, -18.12297821044922, -17.451078414916992, -16.779178619384766, -16.107276916503906, -15.435376167297363, -14.76347541809082, -14.091575622558594, -13.41967487335205, -12.747774124145508, -12.075874328613281, -11.403973579406738, -10.732072830200195, -10.060172080993652, -9.38827133178711, -8.716371536254883, -8.04447078704834, -7.372570037841797, -6.700669765472412, -6.028769493103027, -5.356868743896484, -4.684967994689941, -4.013067722320557, -3.3411672115325928, -2.669266700744629, -1.997366189956665, -1.3254656791687012, -0.6535654067993164, 0.018337249755859375, 0.6902377605438232, 1.362138271331787, 2.034038782119751, 2.705939292907715, 3.3778398036956787, 4.049740314483643, 4.721640586853027, 5.39354133605957, 6.065442085266113, 6.737342357635498, 7.409242630004883, 8.081143379211426, 8.753044128417969, 9.424943923950195, 10.096844673156738, 10.768745422363281, 11.440646171569824, 12.112546920776367, 12.784446716308594, 13.456347465515137, 14.12824821472168, 14.800148010253906, 15.47204875946045, 16.143949508666992, 16.81584930419922, 17.487751007080078, 18.159650802612305, 18.83155059814453, 19.50345230102539, 20.175352096557617, 20.847251892089844, 21.519153594970703]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 4.0, 8.0, 10.0, 14.0, 12.0, 22.0, 25.0, 30.0, 35.0, 35.0, 35.0, 40.0, 47.0, 60.0, 54.0, 61.0, 59.0, 52.0, 54.0, 56.0, 44.0, 32.0, 34.0, 38.0, 28.0, 29.0, 17.0, 14.0, 13.0, 7.0, 15.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7455596923828125, -1.691314697265625, -1.6370697021484375, -1.58282470703125, -1.5285797119140625, -1.474334716796875, -1.4200897216796875, -1.3658447265625, -1.3115997314453125, -1.257354736328125, -1.2031097412109375, -1.14886474609375, -1.0946197509765625, -1.040374755859375, -0.9861297607421875, -0.931884765625, -0.8776397705078125, -0.823394775390625, -0.7691497802734375, -0.71490478515625, -0.6606597900390625, -0.606414794921875, -0.5521697998046875, -0.4979248046875, -0.4436798095703125, -0.389434814453125, -0.3351898193359375, -0.28094482421875, -0.2266998291015625, -0.172454833984375, -0.1182098388671875, -0.06396484375, -0.0097198486328125, 0.044525146484375, 0.0987701416015625, 0.15301513671875, 0.2072601318359375, 0.261505126953125, 0.3157501220703125, 0.3699951171875, 0.4242401123046875, 0.478485107421875, 0.5327301025390625, 0.58697509765625, 0.6412200927734375, 0.695465087890625, 0.7497100830078125, 0.803955078125, 0.8582000732421875, 0.912445068359375, 0.9666900634765625, 1.02093505859375, 1.0751800537109375, 1.129425048828125, 1.1836700439453125, 1.2379150390625, 1.2921600341796875, 1.346405029296875, 1.4006500244140625, 1.45489501953125, 1.5091400146484375, 1.563385009765625, 1.6176300048828125, 1.671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 16.0, 13.0, 20.0, 20.0, 48.0, 60.0, 103.0, 149.0, 240.0, 362.0, 684.0, 1206.0, 2251.0, 4407.0, 9451.0, 22248.0, 66329.0, 679915.0, 191254.0, 40420.0, 15206.0, 6726.0, 3343.0, 1734.0, 923.0, 526.0, 301.0, 201.0, 140.0, 80.0, 45.0, 44.0, 26.0, 18.0, 15.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.43798828125, -8.1806640625, -7.92333984375, -7.666015625, -7.40869140625, -7.1513671875, -6.89404296875, -6.63671875, -6.37939453125, -6.1220703125, -5.86474609375, -5.607421875, -5.35009765625, -5.0927734375, -4.83544921875, -4.578125, -4.32080078125, -4.0634765625, -3.80615234375, -3.548828125, -3.29150390625, -3.0341796875, -2.77685546875, -2.51953125, -2.26220703125, -2.0048828125, -1.74755859375, -1.490234375, -1.23291015625, -0.9755859375, -0.71826171875, -0.4609375, -0.20361328125, 0.0537109375, 0.31103515625, 0.568359375, 0.82568359375, 1.0830078125, 1.34033203125, 1.59765625, 1.85498046875, 2.1123046875, 2.36962890625, 2.626953125, 2.88427734375, 3.1416015625, 3.39892578125, 3.65625, 3.91357421875, 4.1708984375, 4.42822265625, 4.685546875, 4.94287109375, 5.2001953125, 5.45751953125, 5.71484375, 5.97216796875, 6.2294921875, 6.48681640625, 6.744140625, 7.00146484375, 7.2587890625, 7.51611328125, 7.7734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 2.0, 10.0, 12.0, 13.0, 13.0, 18.0, 20.0, 25.0, 26.0, 36.0, 35.0, 39.0, 32.0, 45.0, 31.0, 43.0, 38.0, 39.0, 1057.0, 46.0, 44.0, 45.0, 42.0, 35.0, 32.0, 31.0, 26.0, 22.0, 19.0, 22.0, 17.0, 17.0, 9.0, 17.0, 14.0, 7.0, 10.0, 7.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.058868408203125, -1.02105712890625, -0.983245849609375, -0.9454345703125, -0.907623291015625, -0.86981201171875, -0.832000732421875, -0.794189453125, -0.756378173828125, -0.71856689453125, -0.680755615234375, -0.6429443359375, -0.605133056640625, -0.56732177734375, -0.529510498046875, -0.49169921875, -0.453887939453125, -0.41607666015625, -0.378265380859375, -0.3404541015625, -0.302642822265625, -0.26483154296875, -0.227020263671875, -0.189208984375, -0.151397705078125, -0.11358642578125, -0.075775146484375, -0.0379638671875, -0.000152587890625, 0.03765869140625, 0.075469970703125, 0.11328125, 0.151092529296875, 0.18890380859375, 0.226715087890625, 0.2645263671875, 0.302337646484375, 0.34014892578125, 0.377960205078125, 0.415771484375, 0.453582763671875, 0.49139404296875, 0.529205322265625, 0.5670166015625, 0.604827880859375, 0.64263916015625, 0.680450439453125, 0.71826171875, 0.756072998046875, 0.79388427734375, 0.831695556640625, 0.8695068359375, 0.907318115234375, 0.94512939453125, 0.982940673828125, 1.020751953125, 1.058563232421875, 1.09637451171875, 1.134185791015625, 1.1719970703125, 1.209808349609375, 1.24761962890625, 1.285430908203125, 1.3232421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 13.0, 12.0, 15.0, 22.0, 25.0, 34.0, 57.0, 75.0, 89.0, 131.0, 197.0, 290.0, 402.0, 590.0, 972.0, 1543.0, 2527.0, 4484.0, 8431.0, 19502.0, 60751.0, 1383133.0, 529715.0, 49483.0, 16652.0, 7581.0, 3949.0, 2268.0, 1377.0, 895.0, 585.0, 405.0, 263.0, 199.0, 109.0, 93.0, 60.0, 48.0, 40.0, 27.0, 19.0, 16.0, 15.0, 3.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.810546875, -2.71966552734375, -2.6287841796875, -2.53790283203125, -2.447021484375, -2.35614013671875, -2.2652587890625, -2.17437744140625, -2.08349609375, -1.99261474609375, -1.9017333984375, -1.81085205078125, -1.719970703125, -1.62908935546875, -1.5382080078125, -1.44732666015625, -1.3564453125, -1.26556396484375, -1.1746826171875, -1.08380126953125, -0.992919921875, -0.90203857421875, -0.8111572265625, -0.72027587890625, -0.62939453125, -0.53851318359375, -0.4476318359375, -0.35675048828125, -0.265869140625, -0.17498779296875, -0.0841064453125, 0.00677490234375, 0.09765625, 0.18853759765625, 0.2794189453125, 0.37030029296875, 0.461181640625, 0.55206298828125, 0.6429443359375, 0.73382568359375, 0.82470703125, 0.91558837890625, 1.0064697265625, 1.09735107421875, 1.188232421875, 1.27911376953125, 1.3699951171875, 1.46087646484375, 1.5517578125, 1.64263916015625, 1.7335205078125, 1.82440185546875, 1.915283203125, 2.00616455078125, 2.0970458984375, 2.18792724609375, 2.27880859375, 2.36968994140625, 2.4605712890625, 2.55145263671875, 2.642333984375, 2.73321533203125, 2.8240966796875, 2.91497802734375, 3.005859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 8.0, 19.0, 149.0, 709.0, 73.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.934814453125, -2.85400390625, -2.773193359375, -2.6923828125, -2.611572265625, -2.53076171875, -2.449951171875, -2.369140625, -2.288330078125, -2.20751953125, -2.126708984375, -2.0458984375, -1.965087890625, -1.88427734375, -1.803466796875, -1.72265625, -1.641845703125, -1.56103515625, -1.480224609375, -1.3994140625, -1.318603515625, -1.23779296875, -1.156982421875, -1.076171875, -0.995361328125, -0.91455078125, -0.833740234375, -0.7529296875, -0.672119140625, -0.59130859375, -0.510498046875, -0.4296875, -0.348876953125, -0.26806640625, -0.187255859375, -0.1064453125, -0.025634765625, 0.05517578125, 0.135986328125, 0.216796875, 0.297607421875, 0.37841796875, 0.459228515625, 0.5400390625, 0.620849609375, 0.70166015625, 0.782470703125, 0.86328125, 0.944091796875, 1.02490234375, 1.105712890625, 1.1865234375, 1.267333984375, 1.34814453125, 1.428955078125, 1.509765625, 1.590576171875, 1.67138671875, 1.752197265625, 1.8330078125, 1.913818359375, 1.99462890625, 2.075439453125, 2.15625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 3.0, 9.0, 12.0, 11.0, 17.0, 28.0, 87.0, 377.0, 3379.0, 1025580.0, 17285.0, 1361.0, 210.0, 74.0, 25.0, 17.0, 9.0, 9.0, 3.0, 4.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.7587890625, -36.673828125, -35.5888671875, -34.50390625, -33.4189453125, -32.333984375, -31.2490234375, -30.1640625, -29.0791015625, -27.994140625, -26.9091796875, -25.82421875, -24.7392578125, -23.654296875, -22.5693359375, -21.484375, -20.3994140625, -19.314453125, -18.2294921875, -17.14453125, -16.0595703125, -14.974609375, -13.8896484375, -12.8046875, -11.7197265625, -10.634765625, -9.5498046875, -8.46484375, -7.3798828125, -6.294921875, -5.2099609375, -4.125, -3.0400390625, -1.955078125, -0.8701171875, 0.21484375, 1.2998046875, 2.384765625, 3.4697265625, 4.5546875, 5.6396484375, 6.724609375, 7.8095703125, 8.89453125, 9.9794921875, 11.064453125, 12.1494140625, 13.234375, 14.3193359375, 15.404296875, 16.4892578125, 17.57421875, 18.6591796875, 19.744140625, 20.8291015625, 21.9140625, 22.9990234375, 24.083984375, 25.1689453125, 26.25390625, 27.3388671875, 28.423828125, 29.5087890625, 30.59375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 12.0, 65.0, 204.0, 488.0, 172.0, 41.0, 19.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.455366611480713, -7.2503156661987305, -7.045264720916748, -6.840213775634766, -6.635162830352783, -6.430111885070801, -6.225060939788818, -6.020009994506836, -5.8149590492248535, -5.609908103942871, -5.404857158660889, -5.199806213378906, -4.994755268096924, -4.789704322814941, -4.584653377532959, -4.379602432250977, -4.174551486968994, -3.9695005416870117, -3.7644495964050293, -3.559398651123047, -3.3543477058410645, -3.149296760559082, -2.9442458152770996, -2.739194869995117, -2.5341439247131348, -2.3290929794311523, -2.12404203414917, -1.9189910888671875, -1.713940143585205, -1.5088891983032227, -1.3038382530212402, -1.0987873077392578, -0.8937363624572754, -0.688685417175293, -0.48363447189331055, -0.2785835266113281, -0.0735325813293457, 0.13151836395263672, 0.33656930923461914, 0.5416202545166016, 0.746671199798584, 0.9517221450805664, 1.1567730903625488, 1.3618240356445312, 1.5668749809265137, 1.771925926208496, 1.9769768714904785, 2.182027816772461, 2.3870787620544434, 2.592129707336426, 2.797180652618408, 3.0022315979003906, 3.207282543182373, 3.4123334884643555, 3.617384433746338, 3.8224353790283203, 4.027486324310303, 4.232537269592285, 4.437588214874268, 4.64263916015625, 4.847690105438232, 5.052741050720215, 5.257791996002197, 5.46284294128418, 5.667893886566162]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 9.0, 5.0, 6.0, 15.0, 16.0, 23.0, 12.0, 25.0, 37.0, 25.0, 33.0, 27.0, 36.0, 37.0, 45.0, 40.0, 34.0, 35.0, 35.0, 34.0, 45.0, 33.0, 42.0, 38.0, 24.0, 30.0, 31.0, 23.0, 32.0, 30.0, 27.0, 16.0, 10.0, 16.0, 12.0, 12.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4209628105163574, -1.3770132064819336, -1.3330636024475098, -1.289113998413086, -1.245164394378662, -1.2012147903442383, -1.1572651863098145, -1.1133155822753906, -1.0693659782409668, -1.025416374206543, -0.9814667701721191, -0.9375171661376953, -0.8935675621032715, -0.8496179580688477, -0.8056683540344238, -0.76171875, -0.7177691459655762, -0.6738195419311523, -0.6298699378967285, -0.5859203338623047, -0.5419707298278809, -0.49802112579345703, -0.4540715217590332, -0.4101219177246094, -0.36617231369018555, -0.3222227096557617, -0.2782731056213379, -0.23432350158691406, -0.19037389755249023, -0.1464242935180664, -0.10247468948364258, -0.05852508544921875, -0.014575481414794922, 0.029374122619628906, 0.07332372665405273, 0.11727333068847656, 0.1612229347229004, 0.20517253875732422, 0.24912214279174805, 0.2930717468261719, 0.3370213508605957, 0.38097095489501953, 0.42492055892944336, 0.4688701629638672, 0.512819766998291, 0.5567693710327148, 0.6007189750671387, 0.6446685791015625, 0.6886181831359863, 0.7325677871704102, 0.776517391204834, 0.8204669952392578, 0.8644165992736816, 0.9083662033081055, 0.9523158073425293, 0.9962654113769531, 1.040215015411377, 1.0841646194458008, 1.1281142234802246, 1.1720638275146484, 1.2160134315490723, 1.259963035583496, 1.30391263961792, 1.3478622436523438, 1.3918118476867676]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 10.0, 19.0, 20.0, 17.0, 32.0, 41.0, 37.0, 45.0, 55.0, 62.0, 64.0, 74.0, 69.0, 61.0, 46.0, 50.0, 49.0, 40.0, 44.0, 34.0, 25.0, 24.0, 15.0, 12.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9296417236328125, -1.868072509765625, -1.8065032958984375, -1.74493408203125, -1.6833648681640625, -1.621795654296875, -1.5602264404296875, -1.4986572265625, -1.4370880126953125, -1.375518798828125, -1.3139495849609375, -1.25238037109375, -1.1908111572265625, -1.129241943359375, -1.0676727294921875, -1.006103515625, -0.9445343017578125, -0.882965087890625, -0.8213958740234375, -0.75982666015625, -0.6982574462890625, -0.636688232421875, -0.5751190185546875, -0.5135498046875, -0.4519805908203125, -0.390411376953125, -0.3288421630859375, -0.26727294921875, -0.2057037353515625, -0.144134521484375, -0.0825653076171875, -0.02099609375, 0.0405731201171875, 0.102142333984375, 0.1637115478515625, 0.22528076171875, 0.2868499755859375, 0.348419189453125, 0.4099884033203125, 0.4715576171875, 0.5331268310546875, 0.594696044921875, 0.6562652587890625, 0.71783447265625, 0.7794036865234375, 0.840972900390625, 0.9025421142578125, 0.964111328125, 1.0256805419921875, 1.087249755859375, 1.1488189697265625, 1.21038818359375, 1.2719573974609375, 1.333526611328125, 1.3950958251953125, 1.4566650390625, 1.5182342529296875, 1.579803466796875, 1.6413726806640625, 1.70294189453125, 1.7645111083984375, 1.826080322265625, 1.8876495361328125, 1.94921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 13.0, 26.0, 43.0, 71.0, 101.0, 159.0, 323.0, 636.0, 1258.0, 2356.0, 4870.0, 11814.0, 31549.0, 109248.0, 485832.0, 295952.0, 66730.0, 21353.0, 8443.0, 3852.0, 1804.0, 969.0, 512.0, 255.0, 156.0, 87.0, 42.0, 28.0, 17.0, 12.0, 6.0, 8.0, 6.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.55206298828125, -5.3775634765625, -5.20306396484375, -5.028564453125, -4.85406494140625, -4.6795654296875, -4.50506591796875, -4.33056640625, -4.15606689453125, -3.9815673828125, -3.80706787109375, -3.632568359375, -3.45806884765625, -3.2835693359375, -3.10906982421875, -2.9345703125, -2.76007080078125, -2.5855712890625, -2.41107177734375, -2.236572265625, -2.06207275390625, -1.8875732421875, -1.71307373046875, -1.53857421875, -1.36407470703125, -1.1895751953125, -1.01507568359375, -0.840576171875, -0.66607666015625, -0.4915771484375, -0.31707763671875, -0.142578125, 0.03192138671875, 0.2064208984375, 0.38092041015625, 0.555419921875, 0.72991943359375, 0.9044189453125, 1.07891845703125, 1.25341796875, 1.42791748046875, 1.6024169921875, 1.77691650390625, 1.951416015625, 2.12591552734375, 2.3004150390625, 2.47491455078125, 2.6494140625, 2.82391357421875, 2.9984130859375, 3.17291259765625, 3.347412109375, 3.52191162109375, 3.6964111328125, 3.87091064453125, 4.04541015625, 4.21990966796875, 4.3944091796875, 4.56890869140625, 4.743408203125, 4.91790771484375, 5.0924072265625, 5.26690673828125, 5.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 11.0, 12.0, 12.0, 16.0, 27.0, 29.0, 41.0, 51.0, 69.0, 104.0, 117.0, 249.0, 1515.0, 264.0, 134.0, 79.0, 66.0, 60.0, 43.0, 27.0, 16.0, 18.0, 19.0, 21.0, 5.0, 5.0, 8.0, 3.0, 9.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.78125, -8.547119140625, -8.31298828125, -8.078857421875, -7.8447265625, -7.610595703125, -7.37646484375, -7.142333984375, -6.908203125, -6.674072265625, -6.43994140625, -6.205810546875, -5.9716796875, -5.737548828125, -5.50341796875, -5.269287109375, -5.03515625, -4.801025390625, -4.56689453125, -4.332763671875, -4.0986328125, -3.864501953125, -3.63037109375, -3.396240234375, -3.162109375, -2.927978515625, -2.69384765625, -2.459716796875, -2.2255859375, -1.991455078125, -1.75732421875, -1.523193359375, -1.2890625, -1.054931640625, -0.82080078125, -0.586669921875, -0.3525390625, -0.118408203125, 0.11572265625, 0.349853515625, 0.583984375, 0.818115234375, 1.05224609375, 1.286376953125, 1.5205078125, 1.754638671875, 1.98876953125, 2.222900390625, 2.45703125, 2.691162109375, 2.92529296875, 3.159423828125, 3.3935546875, 3.627685546875, 3.86181640625, 4.095947265625, 4.330078125, 4.564208984375, 4.79833984375, 5.032470703125, 5.2666015625, 5.500732421875, 5.73486328125, 5.968994140625, 6.203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 12.0, 15.0, 11.0, 16.0, 24.0, 30.0, 37.0, 42.0, 86.0, 247.0, 3052.0, 528091.0, 2606748.0, 6641.0, 334.0, 81.0, 60.0, 35.0, 36.0, 21.0, 18.0, 11.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.21875, -27.177734375, -26.13671875, -25.095703125, -24.0546875, -23.013671875, -21.97265625, -20.931640625, -19.890625, -18.849609375, -17.80859375, -16.767578125, -15.7265625, -14.685546875, -13.64453125, -12.603515625, -11.5625, -10.521484375, -9.48046875, -8.439453125, -7.3984375, -6.357421875, -5.31640625, -4.275390625, -3.234375, -2.193359375, -1.15234375, -0.111328125, 0.9296875, 1.970703125, 3.01171875, 4.052734375, 5.09375, 6.134765625, 7.17578125, 8.216796875, 9.2578125, 10.298828125, 11.33984375, 12.380859375, 13.421875, 14.462890625, 15.50390625, 16.544921875, 17.5859375, 18.626953125, 19.66796875, 20.708984375, 21.75, 22.791015625, 23.83203125, 24.873046875, 25.9140625, 26.955078125, 27.99609375, 29.037109375, 30.078125, 31.119140625, 32.16015625, 33.201171875, 34.2421875, 35.283203125, 36.32421875, 37.365234375, 38.40625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 105.0, 311.0, 411.0, 143.0, 33.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.548988342285156, -15.81141471862793, -14.07384204864502, -12.33626937866211, -10.598695755004883, -8.861122131347656, -7.123549461364746, -5.385976791381836, -3.6484031677246094, -1.910830020904541, -0.17325687408447266, 1.5643162727355957, 3.301889419555664, 5.039463043212891, 6.777035713195801, 8.514608383178711, 10.252182006835938, 11.989755630493164, 13.727328300476074, 15.464900970458984, 17.20247459411621, 18.940048217773438, 20.67761993408203, 22.415193557739258, 24.152767181396484, 25.89034080505371, 27.627914428710938, 29.36548614501953, 31.103059768676758, 32.840633392333984, 34.57820510864258, 36.31578063964844, 38.05335235595703, 39.790924072265625, 41.528499603271484, 43.26607131958008, 45.00364685058594, 46.74121856689453, 48.478790283203125, 50.21636199951172, 51.95393753051758, 53.69150924682617, 55.42908477783203, 57.166656494140625, 58.90422821044922, 60.64180374145508, 62.37937545776367, 64.11695098876953, 65.85452270507812, 67.59209442138672, 69.32966613769531, 71.06724548339844, 72.80481719970703, 74.54238891601562, 76.27996063232422, 78.01753234863281, 79.75511169433594, 81.49268341064453, 83.23025512695312, 84.96783447265625, 86.70540618896484, 88.44297790527344, 90.18054962158203, 91.91812133789062, 93.65569305419922]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 2.0, 6.0, 10.0, 8.0, 17.0, 15.0, 25.0, 17.0, 22.0, 29.0, 28.0, 44.0, 30.0, 45.0, 46.0, 44.0, 45.0, 48.0, 57.0, 40.0, 38.0, 40.0, 42.0, 34.0, 29.0, 36.0, 31.0, 23.0, 19.0, 21.0, 21.0, 18.0, 16.0, 9.0, 11.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-18.908187866210938, -18.34250259399414, -17.776817321777344, -17.211132049560547, -16.64544677734375, -16.079761505126953, -15.514076232910156, -14.94839096069336, -14.382705688476562, -13.817020416259766, -13.251335144042969, -12.685649871826172, -12.119964599609375, -11.554279327392578, -10.988594055175781, -10.422908782958984, -9.857222557067871, -9.291537284851074, -8.725852012634277, -8.16016674041748, -7.594481468200684, -7.028796195983887, -6.463110446929932, -5.897425174713135, -5.331739902496338, -4.766054630279541, -4.200369358062744, -3.634683847427368, -3.0689985752105713, -2.5033133029937744, -1.9376277923583984, -1.3719425201416016, -0.8062572479248047, -0.24057191610336304, 0.3251134157180786, 0.890798807144165, 1.456484079360962, 2.022169351577759, 2.5878548622131348, 3.1535401344299316, 3.7192254066467285, 4.284910678863525, 4.850595951080322, 5.416281700134277, 5.981966972351074, 6.547652244567871, 7.113337516784668, 7.679022789001465, 8.244708061218262, 8.810393333435059, 9.376078605651855, 9.941763877868652, 10.50744915008545, 11.073134422302246, 11.63882064819336, 12.204505920410156, 12.770191192626953, 13.33587646484375, 13.901561737060547, 14.467247009277344, 15.03293228149414, 15.598617553710938, 16.164302825927734, 16.72998809814453, 17.295673370361328]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 9.0, 12.0, 16.0, 20.0, 31.0, 30.0, 36.0, 36.0, 43.0, 50.0, 51.0, 53.0, 55.0, 56.0, 49.0, 46.0, 53.0, 53.0, 36.0, 48.0, 34.0, 36.0, 23.0, 20.0, 16.0, 16.0, 17.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6923980712890625, -1.635772705078125, -1.5791473388671875, -1.52252197265625, -1.4658966064453125, -1.409271240234375, -1.3526458740234375, -1.2960205078125, -1.2393951416015625, -1.182769775390625, -1.1261444091796875, -1.06951904296875, -1.0128936767578125, -0.956268310546875, -0.8996429443359375, -0.843017578125, -0.7863922119140625, -0.729766845703125, -0.6731414794921875, -0.61651611328125, -0.5598907470703125, -0.503265380859375, -0.4466400146484375, -0.3900146484375, -0.3333892822265625, -0.276763916015625, -0.2201385498046875, -0.16351318359375, -0.1068878173828125, -0.050262451171875, 0.0063629150390625, 0.06298828125, 0.1196136474609375, 0.176239013671875, 0.2328643798828125, 0.28948974609375, 0.3461151123046875, 0.402740478515625, 0.4593658447265625, 0.5159912109375, 0.5726165771484375, 0.629241943359375, 0.6858673095703125, 0.74249267578125, 0.7991180419921875, 0.855743408203125, 0.9123687744140625, 0.968994140625, 1.0256195068359375, 1.082244873046875, 1.1388702392578125, 1.19549560546875, 1.2521209716796875, 1.308746337890625, 1.3653717041015625, 1.4219970703125, 1.4786224365234375, 1.535247802734375, 1.5918731689453125, 1.64849853515625, 1.7051239013671875, 1.761749267578125, 1.8183746337890625, 1.875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 16.0, 19.0, 23.0, 39.0, 63.0, 99.0, 161.0, 247.0, 440.0, 763.0, 1389.0, 2432.0, 4509.0, 9173.0, 19044.0, 45304.0, 142590.0, 2512468.0, 1276869.0, 108832.0, 37382.0, 16242.0, 7622.0, 3742.0, 2093.0, 1023.0, 634.0, 368.0, 247.0, 133.0, 93.0, 72.0, 32.0, 27.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.2421875, -7.98388671875, -7.7255859375, -7.46728515625, -7.208984375, -6.95068359375, -6.6923828125, -6.43408203125, -6.17578125, -5.91748046875, -5.6591796875, -5.40087890625, -5.142578125, -4.88427734375, -4.6259765625, -4.36767578125, -4.109375, -3.85107421875, -3.5927734375, -3.33447265625, -3.076171875, -2.81787109375, -2.5595703125, -2.30126953125, -2.04296875, -1.78466796875, -1.5263671875, -1.26806640625, -1.009765625, -0.75146484375, -0.4931640625, -0.23486328125, 0.0234375, 0.28173828125, 0.5400390625, 0.79833984375, 1.056640625, 1.31494140625, 1.5732421875, 1.83154296875, 2.08984375, 2.34814453125, 2.6064453125, 2.86474609375, 3.123046875, 3.38134765625, 3.6396484375, 3.89794921875, 4.15625, 4.41455078125, 4.6728515625, 4.93115234375, 5.189453125, 5.44775390625, 5.7060546875, 5.96435546875, 6.22265625, 6.48095703125, 6.7392578125, 6.99755859375, 7.255859375, 7.51416015625, 7.7724609375, 8.03076171875, 8.2890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 11.0, 17.0, 23.0, 35.0, 54.0, 47.0, 78.0, 110.0, 160.0, 243.0, 453.0, 862.0, 817.0, 435.0, 243.0, 136.0, 97.0, 68.0, 38.0, 39.0, 22.0, 15.0, 13.0, 10.0, 10.0, 8.0, 5.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.63653564453125, -8.3824462890625, -8.12835693359375, -7.874267578125, -7.62017822265625, -7.3660888671875, -7.11199951171875, -6.85791015625, -6.60382080078125, -6.3497314453125, -6.09564208984375, -5.841552734375, -5.58746337890625, -5.3333740234375, -5.07928466796875, -4.8251953125, -4.57110595703125, -4.3170166015625, -4.06292724609375, -3.808837890625, -3.55474853515625, -3.3006591796875, -3.04656982421875, -2.79248046875, -2.53839111328125, -2.2843017578125, -2.03021240234375, -1.776123046875, -1.52203369140625, -1.2679443359375, -1.01385498046875, -0.759765625, -0.50567626953125, -0.2515869140625, 0.00250244140625, 0.256591796875, 0.51068115234375, 0.7647705078125, 1.01885986328125, 1.27294921875, 1.52703857421875, 1.7811279296875, 2.03521728515625, 2.289306640625, 2.54339599609375, 2.7974853515625, 3.05157470703125, 3.3056640625, 3.55975341796875, 3.8138427734375, 4.06793212890625, 4.322021484375, 4.57611083984375, 4.8302001953125, 5.08428955078125, 5.33837890625, 5.59246826171875, 5.8465576171875, 6.10064697265625, 6.354736328125, 6.60882568359375, 6.8629150390625, 7.11700439453125, 7.37109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 6.0, 16.0, 33.0, 45.0, 83.0, 133.0, 211.0, 333.0, 617.0, 1089.0, 2109.0, 4169.0, 8404.0, 18610.0, 47134.0, 151846.0, 1340661.0, 2332577.0, 189572.0, 56206.0, 21460.0, 9447.0, 4509.0, 2160.0, 1175.0, 659.0, 404.0, 192.0, 148.0, 90.0, 45.0, 40.0, 23.0, 18.0, 18.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.39208984375, -14.9404296875, -14.48876953125, -14.037109375, -13.58544921875, -13.1337890625, -12.68212890625, -12.23046875, -11.77880859375, -11.3271484375, -10.87548828125, -10.423828125, -9.97216796875, -9.5205078125, -9.06884765625, -8.6171875, -8.16552734375, -7.7138671875, -7.26220703125, -6.810546875, -6.35888671875, -5.9072265625, -5.45556640625, -5.00390625, -4.55224609375, -4.1005859375, -3.64892578125, -3.197265625, -2.74560546875, -2.2939453125, -1.84228515625, -1.390625, -0.93896484375, -0.4873046875, -0.03564453125, 0.416015625, 0.86767578125, 1.3193359375, 1.77099609375, 2.22265625, 2.67431640625, 3.1259765625, 3.57763671875, 4.029296875, 4.48095703125, 4.9326171875, 5.38427734375, 5.8359375, 6.28759765625, 6.7392578125, 7.19091796875, 7.642578125, 8.09423828125, 8.5458984375, 8.99755859375, 9.44921875, 9.90087890625, 10.3525390625, 10.80419921875, 11.255859375, 11.70751953125, 12.1591796875, 12.61083984375, 13.0625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 17.0, 30.0, 35.0, 72.0, 139.0, 220.0, 203.0, 116.0, 72.0, 30.0, 33.0, 14.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.809171676635742, -23.043285369873047, -21.27739906311035, -19.511512756347656, -17.745624542236328, -15.97973918914795, -14.213851928710938, -12.447965621948242, -10.682079315185547, -8.916193008422852, -7.150306224822998, -5.3844194412231445, -3.618533134460449, -1.852646827697754, -0.08675956726074219, 1.6791267395019531, 3.4450130462646484, 5.210899353027344, 6.976786136627197, 8.74267292022705, 10.508559226989746, 12.274445533752441, 14.040332794189453, 15.806219100952148, 17.572105407714844, 19.33799171447754, 21.103878021240234, 22.869766235351562, 24.635650634765625, 26.401538848876953, 28.16742515563965, 29.933311462402344, 31.699195861816406, 33.465084075927734, 35.2309684753418, 36.996856689453125, 38.76274108886719, 40.528629302978516, 42.294517517089844, 44.060401916503906, 45.82628631591797, 47.5921745300293, 49.35805892944336, 51.12394714355469, 52.88983154296875, 54.65571975708008, 56.421607971191406, 58.18749237060547, 59.9533805847168, 61.719268798828125, 63.48515319824219, 65.25103759765625, 67.01692962646484, 68.7828140258789, 70.54869842529297, 72.31459045410156, 74.08047485351562, 75.84635925292969, 77.61225128173828, 79.37813568115234, 81.1440200805664, 82.90990447998047, 84.67579650878906, 86.44168090820312, 88.20756530761719]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 8.0, 13.0, 17.0, 15.0, 21.0, 16.0, 21.0, 25.0, 23.0, 26.0, 26.0, 28.0, 35.0, 42.0, 34.0, 34.0, 30.0, 32.0, 43.0, 42.0, 37.0, 24.0, 32.0, 27.0, 30.0, 22.0, 26.0, 21.0, 39.0, 20.0, 20.0, 23.0, 23.0, 20.0, 14.0, 14.0, 8.0, 10.0, 11.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.984928131103516, -18.428075790405273, -17.87122344970703, -17.31437110900879, -16.757518768310547, -16.200666427612305, -15.643814086914062, -15.08696174621582, -14.530109405517578, -13.973257064819336, -13.416404724121094, -12.859552383422852, -12.30270004272461, -11.745847702026367, -11.188995361328125, -10.632143020629883, -10.075289726257324, -9.518437385559082, -8.96158504486084, -8.404732704162598, -7.8478803634643555, -7.291028022766113, -6.734175205230713, -6.177322864532471, -5.6204705238342285, -5.063618183135986, -4.506765842437744, -3.949913263320923, -3.3930609226226807, -2.8362085819244385, -2.279356002807617, -1.722503662109375, -1.1656513214111328, -0.6087989211082458, -0.05194652080535889, 0.5049059391021729, 1.061758279800415, 1.6186106204986572, 2.1754631996154785, 2.7323155403137207, 3.289167881011963, 3.846020221710205, 4.402872562408447, 4.959725379943848, 5.51657772064209, 6.073430061340332, 6.630282402038574, 7.187134742736816, 7.743987083435059, 8.3008394241333, 8.857691764831543, 9.414544105529785, 9.971396446228027, 10.52824878692627, 11.085102081298828, 11.64195442199707, 12.198806762695312, 12.755659103393555, 13.312511444091797, 13.869363784790039, 14.426216125488281, 14.983068466186523, 15.539920806884766, 16.096773147583008, 16.65362548828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 7.0, 7.0, 9.0, 13.0, 13.0, 18.0, 20.0, 25.0, 23.0, 36.0, 28.0, 28.0, 30.0, 47.0, 49.0, 49.0, 50.0, 48.0, 59.0, 60.0, 54.0, 36.0, 38.0, 44.0, 25.0, 21.0, 25.0, 24.0, 27.0, 13.0, 15.0, 12.0, 9.0, 12.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6366424560546875, -1.584808349609375, -1.5329742431640625, -1.48114013671875, -1.4293060302734375, -1.377471923828125, -1.3256378173828125, -1.2738037109375, -1.2219696044921875, -1.170135498046875, -1.1183013916015625, -1.06646728515625, -1.0146331787109375, -0.962799072265625, -0.9109649658203125, -0.859130859375, -0.8072967529296875, -0.755462646484375, -0.7036285400390625, -0.65179443359375, -0.5999603271484375, -0.548126220703125, -0.4962921142578125, -0.4444580078125, -0.3926239013671875, -0.340789794921875, -0.2889556884765625, -0.23712158203125, -0.1852874755859375, -0.133453369140625, -0.0816192626953125, -0.02978515625, 0.0220489501953125, 0.073883056640625, 0.1257171630859375, 0.17755126953125, 0.2293853759765625, 0.281219482421875, 0.3330535888671875, 0.3848876953125, 0.4367218017578125, 0.488555908203125, 0.5403900146484375, 0.59222412109375, 0.6440582275390625, 0.695892333984375, 0.7477264404296875, 0.799560546875, 0.8513946533203125, 0.903228759765625, 0.9550628662109375, 1.00689697265625, 1.0587310791015625, 1.110565185546875, 1.1623992919921875, 1.2142333984375, 1.2660675048828125, 1.317901611328125, 1.3697357177734375, 1.42156982421875, 1.4734039306640625, 1.525238037109375, 1.5770721435546875, 1.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 7.0, 6.0, 9.0, 20.0, 22.0, 45.0, 59.0, 82.0, 120.0, 191.0, 326.0, 494.0, 722.0, 1188.0, 1899.0, 3161.0, 5391.0, 9684.0, 18303.0, 39062.0, 104645.0, 453598.0, 271888.0, 73123.0, 30123.0, 14815.0, 7935.0, 4505.0, 2621.0, 1626.0, 1074.0, 609.0, 421.0, 263.0, 157.0, 95.0, 90.0, 43.0, 29.0, 25.0, 17.0, 13.0, 15.0, 9.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-8.6640625, -8.41534423828125, -8.1666259765625, -7.91790771484375, -7.669189453125, -7.42047119140625, -7.1717529296875, -6.92303466796875, -6.67431640625, -6.42559814453125, -6.1768798828125, -5.92816162109375, -5.679443359375, -5.43072509765625, -5.1820068359375, -4.93328857421875, -4.6845703125, -4.43585205078125, -4.1871337890625, -3.93841552734375, -3.689697265625, -3.44097900390625, -3.1922607421875, -2.94354248046875, -2.69482421875, -2.44610595703125, -2.1973876953125, -1.94866943359375, -1.699951171875, -1.45123291015625, -1.2025146484375, -0.95379638671875, -0.705078125, -0.45635986328125, -0.2076416015625, 0.04107666015625, 0.289794921875, 0.53851318359375, 0.7872314453125, 1.03594970703125, 1.28466796875, 1.53338623046875, 1.7821044921875, 2.03082275390625, 2.279541015625, 2.52825927734375, 2.7769775390625, 3.02569580078125, 3.2744140625, 3.52313232421875, 3.7718505859375, 4.02056884765625, 4.269287109375, 4.51800537109375, 4.7667236328125, 5.01544189453125, 5.26416015625, 5.51287841796875, 5.7615966796875, 6.01031494140625, 6.259033203125, 6.50775146484375, 6.7564697265625, 7.00518798828125, 7.25390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 2.0, 10.0, 12.0, 8.0, 10.0, 16.0, 9.0, 20.0, 33.0, 41.0, 40.0, 41.0, 35.0, 30.0, 51.0, 50.0, 35.0, 1065.0, 46.0, 40.0, 38.0, 48.0, 47.0, 42.0, 34.0, 33.0, 29.0, 35.0, 20.0, 16.0, 21.0, 7.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2813262939453125, -1.239410400390625, -1.1974945068359375, -1.15557861328125, -1.1136627197265625, -1.071746826171875, -1.0298309326171875, -0.9879150390625, -0.9459991455078125, -0.904083251953125, -0.8621673583984375, -0.82025146484375, -0.7783355712890625, -0.736419677734375, -0.6945037841796875, -0.652587890625, -0.6106719970703125, -0.568756103515625, -0.5268402099609375, -0.48492431640625, -0.4430084228515625, -0.401092529296875, -0.3591766357421875, -0.3172607421875, -0.2753448486328125, -0.233428955078125, -0.1915130615234375, -0.14959716796875, -0.1076812744140625, -0.065765380859375, -0.0238494873046875, 0.01806640625, 0.0599822998046875, 0.101898193359375, 0.1438140869140625, 0.18572998046875, 0.2276458740234375, 0.269561767578125, 0.3114776611328125, 0.3533935546875, 0.3953094482421875, 0.437225341796875, 0.4791412353515625, 0.52105712890625, 0.5629730224609375, 0.604888916015625, 0.6468048095703125, 0.688720703125, 0.7306365966796875, 0.772552490234375, 0.8144683837890625, 0.85638427734375, 0.8983001708984375, 0.940216064453125, 0.9821319580078125, 1.0240478515625, 1.0659637451171875, 1.107879638671875, 1.1497955322265625, 1.19171142578125, 1.2336273193359375, 1.275543212890625, 1.3174591064453125, 1.359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 8.0, 16.0, 19.0, 24.0, 43.0, 49.0, 70.0, 83.0, 142.0, 213.0, 274.0, 400.0, 624.0, 880.0, 1410.0, 2124.0, 3360.0, 5928.0, 11335.0, 26321.0, 84356.0, 1206892.0, 629569.0, 73494.0, 24076.0, 10481.0, 5511.0, 3260.0, 2039.0, 1249.0, 861.0, 576.0, 403.0, 279.0, 217.0, 131.0, 98.0, 64.0, 64.0, 43.0, 34.0, 19.0, 17.0, 9.0, 17.0, 3.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.83203125, -5.64361572265625, -5.4552001953125, -5.26678466796875, -5.078369140625, -4.88995361328125, -4.7015380859375, -4.51312255859375, -4.32470703125, -4.13629150390625, -3.9478759765625, -3.75946044921875, -3.571044921875, -3.38262939453125, -3.1942138671875, -3.00579833984375, -2.8173828125, -2.62896728515625, -2.4405517578125, -2.25213623046875, -2.063720703125, -1.87530517578125, -1.6868896484375, -1.49847412109375, -1.31005859375, -1.12164306640625, -0.9332275390625, -0.74481201171875, -0.556396484375, -0.36798095703125, -0.1795654296875, 0.00885009765625, 0.197265625, 0.38568115234375, 0.5740966796875, 0.76251220703125, 0.950927734375, 1.13934326171875, 1.3277587890625, 1.51617431640625, 1.70458984375, 1.89300537109375, 2.0814208984375, 2.26983642578125, 2.458251953125, 2.64666748046875, 2.8350830078125, 3.02349853515625, 3.2119140625, 3.40032958984375, 3.5887451171875, 3.77716064453125, 3.965576171875, 4.15399169921875, 4.3424072265625, 4.53082275390625, 4.71923828125, 4.90765380859375, 5.0960693359375, 5.28448486328125, 5.472900390625, 5.66131591796875, 5.8497314453125, 6.03814697265625, 6.2265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 14.0, 49.0, 182.0, 521.0, 80.0, 27.0, 14.0, 11.0, 10.0, 7.0, 5.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.212493896484375, -3.09881591796875, -2.985137939453125, -2.8714599609375, -2.757781982421875, -2.64410400390625, -2.530426025390625, -2.416748046875, -2.303070068359375, -2.18939208984375, -2.075714111328125, -1.9620361328125, -1.848358154296875, -1.73468017578125, -1.621002197265625, -1.50732421875, -1.393646240234375, -1.27996826171875, -1.166290283203125, -1.0526123046875, -0.938934326171875, -0.82525634765625, -0.711578369140625, -0.597900390625, -0.484222412109375, -0.37054443359375, -0.256866455078125, -0.1431884765625, -0.029510498046875, 0.08416748046875, 0.197845458984375, 0.3115234375, 0.425201416015625, 0.53887939453125, 0.652557373046875, 0.7662353515625, 0.879913330078125, 0.99359130859375, 1.107269287109375, 1.220947265625, 1.334625244140625, 1.44830322265625, 1.561981201171875, 1.6756591796875, 1.789337158203125, 1.90301513671875, 2.016693115234375, 2.13037109375, 2.244049072265625, 2.35772705078125, 2.471405029296875, 2.5850830078125, 2.698760986328125, 2.81243896484375, 2.926116943359375, 3.039794921875, 3.153472900390625, 3.26715087890625, 3.380828857421875, 3.4945068359375, 3.608184814453125, 3.72186279296875, 3.835540771484375, 3.94921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 11.0, 19.0, 22.0, 37.0, 48.0, 103.0, 309.0, 1315.0, 9255.0, 1002341.0, 31241.0, 2921.0, 543.0, 171.0, 65.0, 46.0, 26.0, 20.0, 8.0, 4.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.8125, -53.23388671875, -51.6552734375, -50.07666015625, -48.498046875, -46.91943359375, -45.3408203125, -43.76220703125, -42.18359375, -40.60498046875, -39.0263671875, -37.44775390625, -35.869140625, -34.29052734375, -32.7119140625, -31.13330078125, -29.5546875, -27.97607421875, -26.3974609375, -24.81884765625, -23.240234375, -21.66162109375, -20.0830078125, -18.50439453125, -16.92578125, -15.34716796875, -13.7685546875, -12.18994140625, -10.611328125, -9.03271484375, -7.4541015625, -5.87548828125, -4.296875, -2.71826171875, -1.1396484375, 0.43896484375, 2.017578125, 3.59619140625, 5.1748046875, 6.75341796875, 8.33203125, 9.91064453125, 11.4892578125, 13.06787109375, 14.646484375, 16.22509765625, 17.8037109375, 19.38232421875, 20.9609375, 22.53955078125, 24.1181640625, 25.69677734375, 27.275390625, 28.85400390625, 30.4326171875, 32.01123046875, 33.58984375, 35.16845703125, 36.7470703125, 38.32568359375, 39.904296875, 41.48291015625, 43.0615234375, 44.64013671875, 46.21875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 8.0, 5.0, 17.0, 27.0, 16.0, 46.0, 66.0, 71.0, 139.0, 140.0, 114.0, 94.0, 57.0, 36.0, 29.0, 25.0, 14.0, 17.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6988325119018555, -2.601017475128174, -2.503202438354492, -2.4053874015808105, -2.307572364807129, -2.2097573280334473, -2.1119422912597656, -2.014127492904663, -1.9163124561309814, -1.8184974193572998, -1.7206823825836182, -1.6228673458099365, -1.5250524282455444, -1.4272373914718628, -1.3294223546981812, -1.231607437133789, -1.1337922811508179, -1.0359772443771362, -0.9381622672080994, -0.8403472304344177, -0.7425322532653809, -0.6447172164916992, -0.5469021797180176, -0.4490872025489807, -0.3512721657752991, -0.2534571588039398, -0.15564213693141937, -0.057827115058898926, 0.03998789191246033, 0.13780289888381958, 0.23561793565750122, 0.3334329128265381, 0.4312479496002197, 0.5290629863739014, 0.6268779635429382, 0.7246930003166199, 0.8225079774856567, 0.9203230142593384, 1.01813805103302, 1.115952968597412, 1.2137680053710938, 1.3115830421447754, 1.409398078918457, 1.5072131156921387, 1.6050280332565308, 1.7028430700302124, 1.800658106803894, 1.8984730243682861, 1.9962881803512573, 2.0941030979156494, 2.191918134689331, 2.2897331714630127, 2.3875482082366943, 2.485363245010376, 2.5831782817840576, 2.6809933185577393, 2.778808355331421, 2.8766233921051025, 2.974438428878784, 3.072253465652466, 3.1700685024261475, 3.26788330078125, 3.3656983375549316, 3.4635133743286133, 3.561328411102295]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 10.0, 14.0, 11.0, 13.0, 7.0, 22.0, 28.0, 21.0, 29.0, 31.0, 29.0, 45.0, 46.0, 30.0, 48.0, 40.0, 59.0, 50.0, 44.0, 45.0, 47.0, 36.0, 37.0, 36.0, 25.0, 29.0, 31.0, 28.0, 21.0, 11.0, 14.0, 12.0, 14.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5662386417388916, -2.489405632019043, -2.4125723838806152, -2.3357393741607666, -2.258906364440918, -2.1820731163024902, -2.1052401065826416, -2.028407096862793, -1.9515738487243652, -1.874740719795227, -1.7979077100753784, -1.7210745811462402, -1.644241452217102, -1.5674083232879639, -1.4905753135681152, -1.413742184638977, -1.3369091749191284, -1.2600760459899902, -1.1832430362701416, -1.1064099073410034, -1.0295767784118652, -0.9527437090873718, -0.8759106397628784, -0.7990775108337402, -0.7222444415092468, -0.6454113721847534, -0.5685782432556152, -0.4917451739311218, -0.41491207480430603, -0.33807897567749023, -0.2612459063529968, -0.18441277742385864, -0.10757970809936523, -0.030746616423130035, 0.046086475253105164, 0.12291955947875977, 0.19975265860557556, 0.27658575773239136, 0.35341882705688477, 0.43025195598602295, 0.5070850253105164, 0.5839180946350098, 0.660751223564148, 0.7375842928886414, 0.8144173622131348, 0.891250491142273, 0.9680835604667664, 1.0449166297912598, 1.121749758720398, 1.1985828876495361, 1.2754158973693848, 1.352249026298523, 1.4290821552276611, 1.5059151649475098, 1.582748293876648, 1.6595814228057861, 1.7364144325256348, 1.813247561454773, 1.8900805711746216, 1.9669137001037598, 2.0437467098236084, 2.120579957962036, 2.1974129676818848, 2.2742462158203125, 2.351079225540161]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 10.0, 4.0, 10.0, 15.0, 17.0, 13.0, 19.0, 24.0, 22.0, 27.0, 36.0, 30.0, 35.0, 46.0, 52.0, 38.0, 50.0, 58.0, 52.0, 53.0, 50.0, 42.0, 48.0, 40.0, 29.0, 23.0, 25.0, 22.0, 21.0, 12.0, 16.0, 9.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4736785888671875, -1.421966552734375, -1.3702545166015625, -1.31854248046875, -1.2668304443359375, -1.215118408203125, -1.1634063720703125, -1.1116943359375, -1.0599822998046875, -1.008270263671875, -0.9565582275390625, -0.90484619140625, -0.8531341552734375, -0.801422119140625, -0.7497100830078125, -0.697998046875, -0.6462860107421875, -0.594573974609375, -0.5428619384765625, -0.49114990234375, -0.4394378662109375, -0.387725830078125, -0.3360137939453125, -0.2843017578125, -0.2325897216796875, -0.180877685546875, -0.1291656494140625, -0.07745361328125, -0.0257415771484375, 0.025970458984375, 0.0776824951171875, 0.12939453125, 0.1811065673828125, 0.232818603515625, 0.2845306396484375, 0.33624267578125, 0.3879547119140625, 0.439666748046875, 0.4913787841796875, 0.5430908203125, 0.5948028564453125, 0.646514892578125, 0.6982269287109375, 0.74993896484375, 0.8016510009765625, 0.853363037109375, 0.9050750732421875, 0.956787109375, 1.0084991455078125, 1.060211181640625, 1.1119232177734375, 1.16363525390625, 1.2153472900390625, 1.267059326171875, 1.3187713623046875, 1.3704833984375, 1.4221954345703125, 1.473907470703125, 1.5256195068359375, 1.57733154296875, 1.6290435791015625, 1.680755615234375, 1.7324676513671875, 1.7841796875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 20.0, 21.0, 48.0, 63.0, 101.0, 146.0, 252.0, 426.0, 799.0, 1555.0, 3268.0, 7324.0, 19001.0, 64964.0, 405593.0, 440507.0, 69748.0, 20190.0, 7629.0, 3264.0, 1549.0, 864.0, 469.0, 267.0, 165.0, 108.0, 61.0, 40.0, 32.0, 11.0, 9.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9349365234375, -5.760498046875, -5.5860595703125, -5.41162109375, -5.2371826171875, -5.062744140625, -4.8883056640625, -4.7138671875, -4.5394287109375, -4.364990234375, -4.1905517578125, -4.01611328125, -3.8416748046875, -3.667236328125, -3.4927978515625, -3.318359375, -3.1439208984375, -2.969482421875, -2.7950439453125, -2.62060546875, -2.4461669921875, -2.271728515625, -2.0972900390625, -1.9228515625, -1.7484130859375, -1.573974609375, -1.3995361328125, -1.22509765625, -1.0506591796875, -0.876220703125, -0.7017822265625, -0.52734375, -0.3529052734375, -0.178466796875, -0.0040283203125, 0.17041015625, 0.3448486328125, 0.519287109375, 0.6937255859375, 0.8681640625, 1.0426025390625, 1.217041015625, 1.3914794921875, 1.56591796875, 1.7403564453125, 1.914794921875, 2.0892333984375, 2.263671875, 2.4381103515625, 2.612548828125, 2.7869873046875, 2.96142578125, 3.1358642578125, 3.310302734375, 3.4847412109375, 3.6591796875, 3.8336181640625, 4.008056640625, 4.1824951171875, 4.35693359375, 4.5313720703125, 4.705810546875, 4.8802490234375, 5.0546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 13.0, 10.0, 7.0, 14.0, 14.0, 18.0, 19.0, 23.0, 32.0, 28.0, 31.0, 32.0, 38.0, 57.0, 67.0, 78.0, 131.0, 293.0, 1410.0, 158.0, 88.0, 80.0, 60.0, 39.0, 40.0, 37.0, 37.0, 28.0, 22.0, 22.0, 21.0, 15.0, 14.0, 10.0, 12.0, 7.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.64453125, -6.45556640625, -6.2666015625, -6.07763671875, -5.888671875, -5.69970703125, -5.5107421875, -5.32177734375, -5.1328125, -4.94384765625, -4.7548828125, -4.56591796875, -4.376953125, -4.18798828125, -3.9990234375, -3.81005859375, -3.62109375, -3.43212890625, -3.2431640625, -3.05419921875, -2.865234375, -2.67626953125, -2.4873046875, -2.29833984375, -2.109375, -1.92041015625, -1.7314453125, -1.54248046875, -1.353515625, -1.16455078125, -0.9755859375, -0.78662109375, -0.59765625, -0.40869140625, -0.2197265625, -0.03076171875, 0.158203125, 0.34716796875, 0.5361328125, 0.72509765625, 0.9140625, 1.10302734375, 1.2919921875, 1.48095703125, 1.669921875, 1.85888671875, 2.0478515625, 2.23681640625, 2.42578125, 2.61474609375, 2.8037109375, 2.99267578125, 3.181640625, 3.37060546875, 3.5595703125, 3.74853515625, 3.9375, 4.12646484375, 4.3154296875, 4.50439453125, 4.693359375, 4.88232421875, 5.0712890625, 5.26025390625, 5.44921875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 5.0, 11.0, 19.0, 17.0, 23.0, 31.0, 47.0, 76.0, 105.0, 203.0, 369.0, 755.0, 1600.0, 3776.0, 9398.0, 26711.0, 104771.0, 938916.0, 1853056.0, 150674.0, 35031.0, 11654.0, 4638.0, 1823.0, 874.0, 468.0, 226.0, 148.0, 85.0, 51.0, 29.0, 26.0, 20.0, 9.0, 11.0, 9.0, 8.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.521484375, -7.25390625, -6.986328125, -6.71875, -6.451171875, -6.18359375, -5.916015625, -5.6484375, -5.380859375, -5.11328125, -4.845703125, -4.578125, -4.310546875, -4.04296875, -3.775390625, -3.5078125, -3.240234375, -2.97265625, -2.705078125, -2.4375, -2.169921875, -1.90234375, -1.634765625, -1.3671875, -1.099609375, -0.83203125, -0.564453125, -0.296875, -0.029296875, 0.23828125, 0.505859375, 0.7734375, 1.041015625, 1.30859375, 1.576171875, 1.84375, 2.111328125, 2.37890625, 2.646484375, 2.9140625, 3.181640625, 3.44921875, 3.716796875, 3.984375, 4.251953125, 4.51953125, 4.787109375, 5.0546875, 5.322265625, 5.58984375, 5.857421875, 6.125, 6.392578125, 6.66015625, 6.927734375, 7.1953125, 7.462890625, 7.73046875, 7.998046875, 8.265625, 8.533203125, 8.80078125, 9.068359375, 9.3359375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 10.0, 78.0, 349.0, 436.0, 121.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.652995109558105, -13.462892532348633, -11.272789001464844, -9.082686424255371, -6.892583847045898, -4.702481269836426, -2.5123777389526367, -0.32227516174316406, 1.8678274154663086, 4.057929992675781, 6.248033046722412, 8.438136100769043, 10.628238677978516, 12.818341255187988, 15.008444786071777, 17.19854736328125, 19.388648986816406, 21.578752517700195, 23.76885414123535, 25.95895767211914, 28.149059295654297, 30.339162826538086, 32.529266357421875, 34.71936798095703, 36.90947341918945, 39.09957504272461, 41.28968048095703, 43.47978210449219, 45.669883728027344, 47.8599853515625, 50.05009078979492, 52.24019241333008, 54.43029022216797, 56.620391845703125, 58.81049728393555, 61.0005989074707, 63.19070053100586, 65.38080596923828, 67.57090759277344, 69.7610092163086, 71.95111083984375, 74.1412124633789, 76.33131408691406, 78.52142333984375, 80.7115249633789, 82.90162658691406, 85.09172821044922, 87.28182983398438, 89.47193908691406, 91.66204071044922, 93.85214233398438, 96.04225158691406, 98.23235321044922, 100.42245483398438, 102.61255645751953, 104.80265808105469, 106.99275970458984, 109.182861328125, 111.37296295166016, 113.56306457519531, 115.753173828125, 117.94327545166016, 120.13337707519531, 122.32347869873047, 124.51358032226562]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 15.0, 11.0, 21.0, 12.0, 14.0, 19.0, 24.0, 24.0, 36.0, 36.0, 36.0, 29.0, 35.0, 46.0, 69.0, 31.0, 39.0, 43.0, 43.0, 46.0, 40.0, 45.0, 47.0, 26.0, 17.0, 32.0, 20.0, 25.0, 21.0, 9.0, 11.0, 13.0, 4.0, 10.0, 4.0, 2.0, 6.0, 7.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.92365074157715, -21.245601654052734, -20.56755256652832, -19.889503479003906, -19.21145248413086, -18.533403396606445, -17.85535430908203, -17.177305221557617, -16.499256134033203, -15.821207046508789, -15.143157005310059, -14.465107917785645, -13.787057876586914, -13.1090087890625, -12.430959701538086, -11.752910614013672, -11.074859619140625, -10.396810531616211, -9.71876049041748, -9.040711402893066, -8.362661361694336, -7.684612274169922, -7.006563186645508, -6.3285136222839355, -5.650464057922363, -4.972414493560791, -4.294364929199219, -3.6163158416748047, -2.9382662773132324, -2.26021671295166, -1.582167625427246, -0.9041180610656738, -0.22606849670410156, 0.45198094844818115, 1.1300303936004639, 1.808079719543457, 2.4861292839050293, 3.1641788482666016, 3.8422279357910156, 4.520277500152588, 5.19832706451416, 5.876376628875732, 6.554426193237305, 7.232475280761719, 7.910524845123291, 8.588574409484863, 9.266623497009277, 9.944673538208008, 10.622722625732422, 11.300771713256836, 11.978821754455566, 12.65687084197998, 13.334920883178711, 14.012969970703125, 14.691019058227539, 15.369068145751953, 16.047119140625, 16.725168228149414, 17.403217315673828, 18.081268310546875, 18.75931739807129, 19.437366485595703, 20.115415573120117, 20.79346466064453, 21.471513748168945]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 12.0, 20.0, 18.0, 24.0, 24.0, 27.0, 29.0, 38.0, 28.0, 38.0, 46.0, 52.0, 55.0, 49.0, 55.0, 60.0, 42.0, 41.0, 50.0, 47.0, 49.0, 37.0, 24.0, 18.0, 21.0, 21.0, 9.0, 14.0, 8.0, 5.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.798919677734375, -1.73944091796875, -1.679962158203125, -1.6204833984375, -1.561004638671875, -1.50152587890625, -1.442047119140625, -1.382568359375, -1.323089599609375, -1.26361083984375, -1.204132080078125, -1.1446533203125, -1.085174560546875, -1.02569580078125, -0.966217041015625, -0.90673828125, -0.847259521484375, -0.78778076171875, -0.728302001953125, -0.6688232421875, -0.609344482421875, -0.54986572265625, -0.490386962890625, -0.430908203125, -0.371429443359375, -0.31195068359375, -0.252471923828125, -0.1929931640625, -0.133514404296875, -0.07403564453125, -0.014556884765625, 0.044921875, 0.104400634765625, 0.16387939453125, 0.223358154296875, 0.2828369140625, 0.342315673828125, 0.40179443359375, 0.461273193359375, 0.520751953125, 0.580230712890625, 0.63970947265625, 0.699188232421875, 0.7586669921875, 0.818145751953125, 0.87762451171875, 0.937103271484375, 0.99658203125, 1.056060791015625, 1.11553955078125, 1.175018310546875, 1.2344970703125, 1.293975830078125, 1.35345458984375, 1.412933349609375, 1.472412109375, 1.531890869140625, 1.59136962890625, 1.650848388671875, 1.7103271484375, 1.769805908203125, 1.82928466796875, 1.888763427734375, 1.9482421875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 16.0, 23.0, 23.0, 36.0, 63.0, 129.0, 198.0, 399.0, 863.0, 2439.0, 8102.0, 31760.0, 256106.0, 3760769.0, 106491.0, 18688.0, 5237.0, 1573.0, 620.0, 285.0, 175.0, 103.0, 56.0, 40.0, 17.0, 17.0, 17.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.17431640625, -12.6923828125, -12.21044921875, -11.728515625, -11.24658203125, -10.7646484375, -10.28271484375, -9.80078125, -9.31884765625, -8.8369140625, -8.35498046875, -7.873046875, -7.39111328125, -6.9091796875, -6.42724609375, -5.9453125, -5.46337890625, -4.9814453125, -4.49951171875, -4.017578125, -3.53564453125, -3.0537109375, -2.57177734375, -2.08984375, -1.60791015625, -1.1259765625, -0.64404296875, -0.162109375, 0.31982421875, 0.8017578125, 1.28369140625, 1.765625, 2.24755859375, 2.7294921875, 3.21142578125, 3.693359375, 4.17529296875, 4.6572265625, 5.13916015625, 5.62109375, 6.10302734375, 6.5849609375, 7.06689453125, 7.548828125, 8.03076171875, 8.5126953125, 8.99462890625, 9.4765625, 9.95849609375, 10.4404296875, 10.92236328125, 11.404296875, 11.88623046875, 12.3681640625, 12.85009765625, 13.33203125, 13.81396484375, 14.2958984375, 14.77783203125, 15.259765625, 15.74169921875, 16.2236328125, 16.70556640625, 17.1875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 2.0, 14.0, 16.0, 27.0, 37.0, 43.0, 69.0, 94.0, 142.0, 290.0, 600.0, 1024.0, 822.0, 329.0, 198.0, 104.0, 75.0, 63.0, 28.0, 29.0, 18.0, 11.0, 5.0, 9.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.364013671875, -10.05615234375, -9.748291015625, -9.4404296875, -9.132568359375, -8.82470703125, -8.516845703125, -8.208984375, -7.901123046875, -7.59326171875, -7.285400390625, -6.9775390625, -6.669677734375, -6.36181640625, -6.053955078125, -5.74609375, -5.438232421875, -5.13037109375, -4.822509765625, -4.5146484375, -4.206787109375, -3.89892578125, -3.591064453125, -3.283203125, -2.975341796875, -2.66748046875, -2.359619140625, -2.0517578125, -1.743896484375, -1.43603515625, -1.128173828125, -0.8203125, -0.512451171875, -0.20458984375, 0.103271484375, 0.4111328125, 0.718994140625, 1.02685546875, 1.334716796875, 1.642578125, 1.950439453125, 2.25830078125, 2.566162109375, 2.8740234375, 3.181884765625, 3.48974609375, 3.797607421875, 4.10546875, 4.413330078125, 4.72119140625, 5.029052734375, 5.3369140625, 5.644775390625, 5.95263671875, 6.260498046875, 6.568359375, 6.876220703125, 7.18408203125, 7.491943359375, 7.7998046875, 8.107666015625, 8.41552734375, 8.723388671875, 9.03125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 4.0, 13.0, 12.0, 18.0, 18.0, 32.0, 61.0, 68.0, 129.0, 203.0, 343.0, 579.0, 1065.0, 2054.0, 4148.0, 8872.0, 21268.0, 57608.0, 197488.0, 2362900.0, 1305131.0, 151496.0, 47402.0, 18012.0, 7658.0, 3720.0, 1752.0, 931.0, 496.0, 291.0, 188.0, 105.0, 75.0, 32.0, 25.0, 15.0, 22.0, 10.0, 10.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.2838134765625, -12.880126953125, -12.4764404296875, -12.07275390625, -11.6690673828125, -11.265380859375, -10.8616943359375, -10.4580078125, -10.0543212890625, -9.650634765625, -9.2469482421875, -8.84326171875, -8.4395751953125, -8.035888671875, -7.6322021484375, -7.228515625, -6.8248291015625, -6.421142578125, -6.0174560546875, -5.61376953125, -5.2100830078125, -4.806396484375, -4.4027099609375, -3.9990234375, -3.5953369140625, -3.191650390625, -2.7879638671875, -2.38427734375, -1.9805908203125, -1.576904296875, -1.1732177734375, -0.76953125, -0.3658447265625, 0.037841796875, 0.4415283203125, 0.84521484375, 1.2489013671875, 1.652587890625, 2.0562744140625, 2.4599609375, 2.8636474609375, 3.267333984375, 3.6710205078125, 4.07470703125, 4.4783935546875, 4.882080078125, 5.2857666015625, 5.689453125, 6.0931396484375, 6.496826171875, 6.9005126953125, 7.30419921875, 7.7078857421875, 8.111572265625, 8.5152587890625, 8.9189453125, 9.3226318359375, 9.726318359375, 10.1300048828125, 10.53369140625, 10.9373779296875, 11.341064453125, 11.7447509765625, 12.1484375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 14.0, 32.0, 46.0, 63.0, 100.0, 134.0, 131.0, 141.0, 84.0, 66.0, 52.0, 36.0, 19.0, 14.0, 12.0, 10.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.166698455810547, -28.94232749938965, -27.71795654296875, -26.493587493896484, -25.269216537475586, -24.044845581054688, -22.820476531982422, -21.596105575561523, -20.371734619140625, -19.147363662719727, -17.922992706298828, -16.698623657226562, -15.474252700805664, -14.249881744384766, -13.025511741638184, -11.801141738891602, -10.576770782470703, -9.352399826049805, -8.128029823303223, -6.903659343719482, -5.679288864135742, -4.454918384552002, -3.2305479049682617, -2.0061779022216797, -0.7818069458007812, 0.442563533782959, 1.6669340133666992, 2.8913044929504395, 4.11567497253418, 5.34004545211792, 6.56441593170166, 7.788785934448242, 9.01315689086914, 10.237527847290039, 11.461897850036621, 12.686267852783203, 13.910638809204102, 15.135009765625, 16.359378814697266, 17.583749771118164, 18.808120727539062, 20.03249168395996, 21.25686264038086, 22.481231689453125, 23.705602645874023, 24.929973602294922, 26.154342651367188, 27.378713607788086, 28.603084564208984, 29.827455520629883, 31.05182647705078, 32.27619552612305, 33.50056457519531, 34.724937438964844, 35.94930648803711, 37.173675537109375, 38.398048400878906, 39.62241744995117, 40.8467903137207, 42.07115936279297, 43.2955322265625, 44.519901275634766, 45.74427032470703, 46.96864318847656, 48.19301223754883]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 6.0, 4.0, 17.0, 11.0, 19.0, 19.0, 22.0, 28.0, 21.0, 32.0, 35.0, 35.0, 38.0, 35.0, 51.0, 51.0, 46.0, 49.0, 42.0, 43.0, 43.0, 35.0, 49.0, 30.0, 37.0, 46.0, 34.0, 20.0, 22.0, 10.0, 10.0, 11.0, 11.0, 2.0, 7.0, 4.0, 5.0, 0.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.810224533081055, -19.05238151550293, -18.294538497924805, -17.536697387695312, -16.778854370117188, -16.021011352539062, -15.263168334960938, -14.505325317382812, -13.747483253479004, -12.989640235900879, -12.23179817199707, -11.473955154418945, -10.71611213684082, -9.958270072937012, -9.200427055358887, -8.442584991455078, -7.684741973876953, -6.926899433135986, -6.1690568923950195, -5.4112138748168945, -4.653371334075928, -3.895528793334961, -3.137685775756836, -2.379843235015869, -1.6220006942749023, -0.864158034324646, -0.10631537437438965, 0.6515274047851562, 1.409369945526123, 2.16721248626709, 2.925055503845215, 3.6828980445861816, 4.440740585327148, 5.198583126068115, 5.956425666809082, 6.714268684387207, 7.472111225128174, 8.22995376586914, 8.987796783447266, 9.74563980102539, 10.5034818649292, 11.261324882507324, 12.019166946411133, 12.777009963989258, 13.534852981567383, 14.292695045471191, 15.050538063049316, 15.808380126953125, 16.56622314453125, 17.324066162109375, 18.0819091796875, 18.839752197265625, 19.597593307495117, 20.355436325073242, 21.113279342651367, 21.871122360229492, 22.628963470458984, 23.38680648803711, 24.144649505615234, 24.90249252319336, 25.66033363342285, 26.418176651000977, 27.1760196685791, 27.933862686157227, 28.69170570373535]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 13.0, 6.0, 8.0, 18.0, 17.0, 24.0, 26.0, 26.0, 22.0, 30.0, 30.0, 31.0, 39.0, 43.0, 46.0, 30.0, 58.0, 49.0, 44.0, 41.0, 55.0, 41.0, 44.0, 34.0, 28.0, 28.0, 32.0, 16.0, 21.0, 17.0, 15.0, 12.0, 12.0, 9.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8505859375, -1.7976531982421875, -1.744720458984375, -1.6917877197265625, -1.63885498046875, -1.5859222412109375, -1.532989501953125, -1.4800567626953125, -1.4271240234375, -1.3741912841796875, -1.321258544921875, -1.2683258056640625, -1.21539306640625, -1.1624603271484375, -1.109527587890625, -1.0565948486328125, -1.003662109375, -0.9507293701171875, -0.897796630859375, -0.8448638916015625, -0.79193115234375, -0.7389984130859375, -0.686065673828125, -0.6331329345703125, -0.5802001953125, -0.5272674560546875, -0.474334716796875, -0.4214019775390625, -0.36846923828125, -0.3155364990234375, -0.262603759765625, -0.2096710205078125, -0.15673828125, -0.1038055419921875, -0.050872802734375, 0.0020599365234375, 0.05499267578125, 0.1079254150390625, 0.160858154296875, 0.2137908935546875, 0.2667236328125, 0.3196563720703125, 0.372589111328125, 0.4255218505859375, 0.47845458984375, 0.5313873291015625, 0.584320068359375, 0.6372528076171875, 0.690185546875, 0.7431182861328125, 0.796051025390625, 0.8489837646484375, 0.90191650390625, 0.9548492431640625, 1.007781982421875, 1.0607147216796875, 1.1136474609375, 1.1665802001953125, 1.219512939453125, 1.2724456787109375, 1.32537841796875, 1.3783111572265625, 1.431243896484375, 1.4841766357421875, 1.537109375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 3.0, 6.0, 11.0, 15.0, 29.0, 44.0, 71.0, 88.0, 150.0, 221.0, 446.0, 738.0, 1334.0, 2427.0, 4721.0, 9796.0, 21573.0, 48253.0, 117982.0, 291562.0, 318361.0, 131426.0, 53521.0, 23522.0, 11069.0, 5136.0, 2687.0, 1446.0, 809.0, 416.0, 249.0, 151.0, 87.0, 63.0, 45.0, 39.0, 17.0, 11.0, 10.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.1915283203125, -8.875244140625, -8.5589599609375, -8.24267578125, -7.9263916015625, -7.610107421875, -7.2938232421875, -6.9775390625, -6.6612548828125, -6.344970703125, -6.0286865234375, -5.71240234375, -5.3961181640625, -5.079833984375, -4.7635498046875, -4.447265625, -4.1309814453125, -3.814697265625, -3.4984130859375, -3.18212890625, -2.8658447265625, -2.549560546875, -2.2332763671875, -1.9169921875, -1.6007080078125, -1.284423828125, -0.9681396484375, -0.65185546875, -0.3355712890625, -0.019287109375, 0.2969970703125, 0.61328125, 0.9295654296875, 1.245849609375, 1.5621337890625, 1.87841796875, 2.1947021484375, 2.510986328125, 2.8272705078125, 3.1435546875, 3.4598388671875, 3.776123046875, 4.0924072265625, 4.40869140625, 4.7249755859375, 5.041259765625, 5.3575439453125, 5.673828125, 5.9901123046875, 6.306396484375, 6.6226806640625, 6.93896484375, 7.2552490234375, 7.571533203125, 7.8878173828125, 8.2041015625, 8.5203857421875, 8.836669921875, 9.1529541015625, 9.46923828125, 9.7855224609375, 10.101806640625, 10.4180908203125, 10.734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 7.0, 13.0, 15.0, 13.0, 18.0, 16.0, 17.0, 16.0, 26.0, 32.0, 29.0, 39.0, 43.0, 35.0, 34.0, 48.0, 1063.0, 47.0, 44.0, 38.0, 53.0, 46.0, 29.0, 42.0, 36.0, 33.0, 26.0, 20.0, 33.0, 13.0, 17.0, 9.0, 10.0, 6.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4404296875, -1.3959197998046875, -1.351409912109375, -1.3069000244140625, -1.26239013671875, -1.2178802490234375, -1.173370361328125, -1.1288604736328125, -1.0843505859375, -1.0398406982421875, -0.995330810546875, -0.9508209228515625, -0.90631103515625, -0.8618011474609375, -0.817291259765625, -0.7727813720703125, -0.728271484375, -0.6837615966796875, -0.639251708984375, -0.5947418212890625, -0.55023193359375, -0.5057220458984375, -0.461212158203125, -0.4167022705078125, -0.3721923828125, -0.3276824951171875, -0.283172607421875, -0.2386627197265625, -0.19415283203125, -0.1496429443359375, -0.105133056640625, -0.0606231689453125, -0.01611328125, 0.0283966064453125, 0.072906494140625, 0.1174163818359375, 0.16192626953125, 0.2064361572265625, 0.250946044921875, 0.2954559326171875, 0.3399658203125, 0.3844757080078125, 0.428985595703125, 0.4734954833984375, 0.51800537109375, 0.5625152587890625, 0.607025146484375, 0.6515350341796875, 0.696044921875, 0.7405548095703125, 0.785064697265625, 0.8295745849609375, 0.87408447265625, 0.9185943603515625, 0.963104248046875, 1.0076141357421875, 1.0521240234375, 1.0966339111328125, 1.141143798828125, 1.1856536865234375, 1.23016357421875, 1.2746734619140625, 1.319183349609375, 1.3636932373046875, 1.408203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 7.0, 35.0, 34.0, 44.0, 89.0, 114.0, 227.0, 374.0, 550.0, 1078.0, 1815.0, 3912.0, 9233.0, 30366.0, 170941.0, 1609085.0, 214818.0, 35321.0, 10293.0, 4083.0, 2018.0, 1013.0, 605.0, 398.0, 216.0, 144.0, 82.0, 74.0, 45.0, 20.0, 16.0, 12.0, 19.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.6009521484375, -12.225341796875, -11.8497314453125, -11.47412109375, -11.0985107421875, -10.722900390625, -10.3472900390625, -9.9716796875, -9.5960693359375, -9.220458984375, -8.8448486328125, -8.46923828125, -8.0936279296875, -7.718017578125, -7.3424072265625, -6.966796875, -6.5911865234375, -6.215576171875, -5.8399658203125, -5.46435546875, -5.0887451171875, -4.713134765625, -4.3375244140625, -3.9619140625, -3.5863037109375, -3.210693359375, -2.8350830078125, -2.45947265625, -2.0838623046875, -1.708251953125, -1.3326416015625, -0.95703125, -0.5814208984375, -0.205810546875, 0.1697998046875, 0.54541015625, 0.9210205078125, 1.296630859375, 1.6722412109375, 2.0478515625, 2.4234619140625, 2.799072265625, 3.1746826171875, 3.55029296875, 3.9259033203125, 4.301513671875, 4.6771240234375, 5.052734375, 5.4283447265625, 5.803955078125, 6.1795654296875, 6.55517578125, 6.9307861328125, 7.306396484375, 7.6820068359375, 8.0576171875, 8.4332275390625, 8.808837890625, 9.1844482421875, 9.56005859375, 9.9356689453125, 10.311279296875, 10.6868896484375, 11.0625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 6.0, 3.0, 8.0, 3.0, 10.0, 8.0, 9.0, 23.0, 34.0, 74.0, 94.0, 163.0, 175.0, 155.0, 77.0, 36.0, 27.0, 26.0, 13.0, 9.0, 10.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.265625, -3.16156005859375, -3.0574951171875, -2.95343017578125, -2.849365234375, -2.74530029296875, -2.6412353515625, -2.53717041015625, -2.43310546875, -2.32904052734375, -2.2249755859375, -2.12091064453125, -2.016845703125, -1.91278076171875, -1.8087158203125, -1.70465087890625, -1.6005859375, -1.49652099609375, -1.3924560546875, -1.28839111328125, -1.184326171875, -1.08026123046875, -0.9761962890625, -0.87213134765625, -0.76806640625, -0.66400146484375, -0.5599365234375, -0.45587158203125, -0.351806640625, -0.24774169921875, -0.1436767578125, -0.03961181640625, 0.064453125, 0.16851806640625, 0.2725830078125, 0.37664794921875, 0.480712890625, 0.58477783203125, 0.6888427734375, 0.79290771484375, 0.89697265625, 1.00103759765625, 1.1051025390625, 1.20916748046875, 1.313232421875, 1.41729736328125, 1.5213623046875, 1.62542724609375, 1.7294921875, 1.83355712890625, 1.9376220703125, 2.04168701171875, 2.145751953125, 2.24981689453125, 2.3538818359375, 2.45794677734375, 2.56201171875, 2.66607666015625, 2.7701416015625, 2.87420654296875, 2.978271484375, 3.08233642578125, 3.1864013671875, 3.29046630859375, 3.39453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 4.0, 8.0, 9.0, 12.0, 22.0, 18.0, 45.0, 42.0, 79.0, 154.0, 454.0, 2122.0, 19717.0, 1004554.0, 18438.0, 1969.0, 470.0, 172.0, 77.0, 44.0, 36.0, 28.0, 15.0, 7.0, 9.0, 10.0, 1.0, 4.0, 7.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -49.09716796875, -47.5380859375, -45.97900390625, -44.419921875, -42.86083984375, -41.3017578125, -39.74267578125, -38.18359375, -36.62451171875, -35.0654296875, -33.50634765625, -31.947265625, -30.38818359375, -28.8291015625, -27.27001953125, -25.7109375, -24.15185546875, -22.5927734375, -21.03369140625, -19.474609375, -17.91552734375, -16.3564453125, -14.79736328125, -13.23828125, -11.67919921875, -10.1201171875, -8.56103515625, -7.001953125, -5.44287109375, -3.8837890625, -2.32470703125, -0.765625, 0.79345703125, 2.3525390625, 3.91162109375, 5.470703125, 7.02978515625, 8.5888671875, 10.14794921875, 11.70703125, 13.26611328125, 14.8251953125, 16.38427734375, 17.943359375, 19.50244140625, 21.0615234375, 22.62060546875, 24.1796875, 25.73876953125, 27.2978515625, 28.85693359375, 30.416015625, 31.97509765625, 33.5341796875, 35.09326171875, 36.65234375, 38.21142578125, 39.7705078125, 41.32958984375, 42.888671875, 44.44775390625, 46.0068359375, 47.56591796875, 49.125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 10.0, 44.0, 99.0, 249.0, 350.0, 150.0, 63.0, 25.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.100538730621338, -6.691324710845947, -6.282110691070557, -5.872896194458008, -5.463682174682617, -5.054468154907227, -4.645254135131836, -4.236040115356445, -3.8268260955810547, -3.417612075805664, -3.0083980560302734, -2.5991837978363037, -2.189969778060913, -1.7807557582855225, -1.3715415000915527, -0.9623274803161621, -0.5531134605407715, -0.14389938116073608, 0.2653146982192993, 0.6745288372039795, 1.0837428569793701, 1.4929568767547607, 1.9021711349487305, 2.311385154724121, 2.7205991744995117, 3.1298131942749023, 3.539027214050293, 3.9482414722442627, 4.357455253601074, 4.766669273376465, 5.175883769989014, 5.585097789764404, 5.994312286376953, 6.403526306152344, 6.812740325927734, 7.221954345703125, 7.631168365478516, 8.040382385253906, 8.449596405029297, 8.858810424804688, 9.268024444580078, 9.677238464355469, 10.08645248413086, 10.49566650390625, 10.90488052368164, 11.314094543457031, 11.723308563232422, 12.132522583007812, 12.54173755645752, 12.95095157623291, 13.3601655960083, 13.769379615783691, 14.178593635559082, 14.587807655334473, 14.99702262878418, 15.40623664855957, 15.815450668334961, 16.22466468811035, 16.633878707885742, 17.043092727661133, 17.452306747436523, 17.861520767211914, 18.270734786987305, 18.679948806762695, 19.089162826538086]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 7.0, 3.0, 11.0, 10.0, 9.0, 21.0, 23.0, 23.0, 24.0, 29.0, 25.0, 35.0, 34.0, 48.0, 46.0, 46.0, 43.0, 51.0, 39.0, 53.0, 56.0, 38.0, 43.0, 41.0, 42.0, 22.0, 27.0, 26.0, 18.0, 27.0, 19.0, 15.0, 6.0, 11.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.884923934936523, -4.75705099105835, -4.629178524017334, -4.50130558013916, -4.373432636260986, -4.2455596923828125, -4.117687225341797, -3.989814281463623, -3.8619415760040283, -3.7340688705444336, -3.6061959266662598, -3.478323221206665, -3.3504505157470703, -3.2225775718688965, -3.0947048664093018, -2.966832160949707, -2.838959217071533, -2.7110865116119385, -2.5832135677337646, -2.45534086227417, -2.327467918395996, -2.1995952129364014, -2.0717225074768066, -1.9438496828079224, -1.815976858139038, -1.6881040334701538, -1.5602312088012695, -1.4323585033416748, -1.3044856786727905, -1.1766128540039062, -1.0487401485443115, -0.9208673238754272, -0.7929940223693848, -0.6651211977005005, -0.537248432636261, -0.4093756377696991, -0.2815028429031372, -0.15363001823425293, -0.025757253170013428, 0.10211551189422607, 0.22998833656311035, 0.35786113142967224, 0.48573392629623413, 0.6136066913604736, 0.7414795160293579, 0.8693523406982422, 0.9972251057624817, 1.1250978708267212, 1.2529706954956055, 1.3808435201644897, 1.508716344833374, 1.6365890502929688, 1.764461874961853, 1.8923346996307373, 2.020207405090332, 2.148080348968506, 2.2759530544281006, 2.4038257598876953, 2.531698703765869, 2.659571409225464, 2.7874441146850586, 2.9153170585632324, 3.043189764022827, 3.171062469482422, 3.2989354133605957]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 15.0, 9.0, 9.0, 8.0, 13.0, 9.0, 20.0, 24.0, 25.0, 31.0, 33.0, 31.0, 33.0, 35.0, 40.0, 34.0, 45.0, 45.0, 46.0, 40.0, 46.0, 46.0, 43.0, 37.0, 42.0, 26.0, 39.0, 23.0, 20.0, 26.0, 30.0, 17.0, 19.0, 11.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7112274169921875, -1.657806396484375, -1.6043853759765625, -1.55096435546875, -1.4975433349609375, -1.444122314453125, -1.3907012939453125, -1.3372802734375, -1.2838592529296875, -1.230438232421875, -1.1770172119140625, -1.12359619140625, -1.0701751708984375, -1.016754150390625, -0.9633331298828125, -0.909912109375, -0.8564910888671875, -0.803070068359375, -0.7496490478515625, -0.69622802734375, -0.6428070068359375, -0.589385986328125, -0.5359649658203125, -0.4825439453125, -0.4291229248046875, -0.375701904296875, -0.3222808837890625, -0.26885986328125, -0.2154388427734375, -0.162017822265625, -0.1085968017578125, -0.05517578125, -0.0017547607421875, 0.051666259765625, 0.1050872802734375, 0.15850830078125, 0.2119293212890625, 0.265350341796875, 0.3187713623046875, 0.3721923828125, 0.4256134033203125, 0.479034423828125, 0.5324554443359375, 0.58587646484375, 0.6392974853515625, 0.692718505859375, 0.7461395263671875, 0.799560546875, 0.8529815673828125, 0.906402587890625, 0.9598236083984375, 1.01324462890625, 1.0666656494140625, 1.120086669921875, 1.1735076904296875, 1.2269287109375, 1.2803497314453125, 1.333770751953125, 1.3871917724609375, 1.44061279296875, 1.4940338134765625, 1.547454833984375, 1.6008758544921875, 1.654296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 16.0, 21.0, 27.0, 51.0, 82.0, 111.0, 148.0, 195.0, 341.0, 549.0, 800.0, 1296.0, 2206.0, 4000.0, 8629.0, 32631.0, 586669.0, 369272.0, 24918.0, 7450.0, 3595.0, 2014.0, 1243.0, 735.0, 505.0, 352.0, 205.0, 138.0, 96.0, 62.0, 48.0, 36.0, 27.0, 14.0, 13.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.84765625, -6.64581298828125, -6.4439697265625, -6.24212646484375, -6.040283203125, -5.83843994140625, -5.6365966796875, -5.43475341796875, -5.23291015625, -5.03106689453125, -4.8292236328125, -4.62738037109375, -4.425537109375, -4.22369384765625, -4.0218505859375, -3.82000732421875, -3.6181640625, -3.41632080078125, -3.2144775390625, -3.01263427734375, -2.810791015625, -2.60894775390625, -2.4071044921875, -2.20526123046875, -2.00341796875, -1.80157470703125, -1.5997314453125, -1.39788818359375, -1.196044921875, -0.99420166015625, -0.7923583984375, -0.59051513671875, -0.388671875, -0.18682861328125, 0.0150146484375, 0.21685791015625, 0.418701171875, 0.62054443359375, 0.8223876953125, 1.02423095703125, 1.22607421875, 1.42791748046875, 1.6297607421875, 1.83160400390625, 2.033447265625, 2.23529052734375, 2.4371337890625, 2.63897705078125, 2.8408203125, 3.04266357421875, 3.2445068359375, 3.44635009765625, 3.648193359375, 3.85003662109375, 4.0518798828125, 4.25372314453125, 4.45556640625, 4.65740966796875, 4.8592529296875, 5.06109619140625, 5.262939453125, 5.46478271484375, 5.6666259765625, 5.86846923828125, 6.0703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 4.0, 6.0, 10.0, 15.0, 17.0, 21.0, 13.0, 19.0, 27.0, 29.0, 24.0, 47.0, 27.0, 46.0, 63.0, 73.0, 79.0, 179.0, 1620.0, 158.0, 93.0, 91.0, 62.0, 50.0, 53.0, 31.0, 29.0, 31.0, 24.0, 20.0, 15.0, 12.0, 10.0, 6.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.9140625, -7.6907958984375, -7.467529296875, -7.2442626953125, -7.02099609375, -6.7977294921875, -6.574462890625, -6.3511962890625, -6.1279296875, -5.9046630859375, -5.681396484375, -5.4581298828125, -5.23486328125, -5.0115966796875, -4.788330078125, -4.5650634765625, -4.341796875, -4.1185302734375, -3.895263671875, -3.6719970703125, -3.44873046875, -3.2254638671875, -3.002197265625, -2.7789306640625, -2.5556640625, -2.3323974609375, -2.109130859375, -1.8858642578125, -1.66259765625, -1.4393310546875, -1.216064453125, -0.9927978515625, -0.76953125, -0.5462646484375, -0.322998046875, -0.0997314453125, 0.12353515625, 0.3468017578125, 0.570068359375, 0.7933349609375, 1.0166015625, 1.2398681640625, 1.463134765625, 1.6864013671875, 1.90966796875, 2.1329345703125, 2.356201171875, 2.5794677734375, 2.802734375, 3.0260009765625, 3.249267578125, 3.4725341796875, 3.69580078125, 3.9190673828125, 4.142333984375, 4.3656005859375, 4.5888671875, 4.8121337890625, 5.035400390625, 5.2586669921875, 5.48193359375, 5.7052001953125, 5.928466796875, 6.1517333984375, 6.375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 4.0, 13.0, 24.0, 26.0, 38.0, 50.0, 109.0, 130.0, 293.0, 526.0, 1124.0, 2801.0, 8692.0, 34005.0, 351680.0, 2653148.0, 70702.0, 14561.0, 4482.0, 1711.0, 706.0, 366.0, 188.0, 103.0, 69.0, 50.0, 31.0, 24.0, 16.0, 15.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.0718994140625, -11.628173828125, -11.1844482421875, -10.74072265625, -10.2969970703125, -9.853271484375, -9.4095458984375, -8.9658203125, -8.5220947265625, -8.078369140625, -7.6346435546875, -7.19091796875, -6.7471923828125, -6.303466796875, -5.8597412109375, -5.416015625, -4.9722900390625, -4.528564453125, -4.0848388671875, -3.64111328125, -3.1973876953125, -2.753662109375, -2.3099365234375, -1.8662109375, -1.4224853515625, -0.978759765625, -0.5350341796875, -0.09130859375, 0.3524169921875, 0.796142578125, 1.2398681640625, 1.68359375, 2.1273193359375, 2.571044921875, 3.0147705078125, 3.45849609375, 3.9022216796875, 4.345947265625, 4.7896728515625, 5.2333984375, 5.6771240234375, 6.120849609375, 6.5645751953125, 7.00830078125, 7.4520263671875, 7.895751953125, 8.3394775390625, 8.783203125, 9.2269287109375, 9.670654296875, 10.1143798828125, 10.55810546875, 11.0018310546875, 11.445556640625, 11.8892822265625, 12.3330078125, 12.7767333984375, 13.220458984375, 13.6641845703125, 14.10791015625, 14.5516357421875, 14.995361328125, 15.4390869140625, 15.8828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 76.0, 378.0, 425.0, 101.0, 18.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90983581542969, -50.507896423339844, -48.10595703125, -45.704017639160156, -43.30207824707031, -40.90013885498047, -38.49819564819336, -36.096256256103516, -33.69431686401367, -31.292377471923828, -28.890438079833984, -26.488496780395508, -24.086557388305664, -21.68461799621582, -19.282676696777344, -16.8807373046875, -14.478797912597656, -12.076858520507812, -9.674918174743652, -7.27297830581665, -4.871038436889648, -2.4690990447998047, -0.06715869903564453, 2.3347816467285156, 4.736721038818359, 7.138660907745361, 9.540600776672363, 11.942541122436523, 14.344480514526367, 16.74641990661621, 19.148361206054688, 21.55030059814453, 23.952232360839844, 26.354171752929688, 28.75611114501953, 31.158052444458008, 33.55998992919922, 35.96192932128906, 38.36387252807617, 40.765811920166016, 43.16775131225586, 45.5696907043457, 47.97163009643555, 50.37356948852539, 52.7755126953125, 55.177452087402344, 57.57939147949219, 59.98133087158203, 62.383270263671875, 64.78520965576172, 67.18714904785156, 69.5890884399414, 71.99102783203125, 74.3929672241211, 76.79490661621094, 79.19685363769531, 81.59878540039062, 84.00072479248047, 86.40266418457031, 88.80460357666016, 91.20654296875, 93.60848236083984, 96.01042175292969, 98.41236877441406, 100.8143081665039]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 2.0, 5.0, 13.0, 8.0, 9.0, 22.0, 14.0, 23.0, 17.0, 29.0, 25.0, 31.0, 32.0, 41.0, 38.0, 51.0, 46.0, 41.0, 32.0, 43.0, 51.0, 41.0, 43.0, 37.0, 41.0, 29.0, 30.0, 26.0, 15.0, 26.0, 23.0, 22.0, 17.0, 18.0, 10.0, 13.0, 7.0, 10.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.594375610351562, -19.866798400878906, -19.139219284057617, -18.41164207458496, -17.684064865112305, -16.956485748291016, -16.22890853881836, -15.501331329345703, -14.77375316619873, -14.046175003051758, -13.318597793579102, -12.591019630432129, -11.863441467285156, -11.1358642578125, -10.408286094665527, -9.680707931518555, -8.953130722045898, -8.225552558898926, -7.4979753494262695, -6.770397186279297, -6.042819499969482, -5.315241813659668, -4.587663650512695, -3.860085964202881, -3.1325082778930664, -2.404930591583252, -1.6773526668548584, -0.9497747421264648, -0.2221970558166504, 0.5053806304931641, 1.2329587936401367, 1.9605364799499512, 2.688112258911133, 3.4156899452209473, 4.143267631530762, 4.870845794677734, 5.598423480987549, 6.326001167297363, 7.053579330444336, 7.78115701675415, 8.508734703063965, 9.236312866210938, 9.963890075683594, 10.691468238830566, 11.419046401977539, 12.146623611450195, 12.874201774597168, 13.60177993774414, 14.329357147216797, 15.05693531036377, 15.784512519836426, 16.5120906829834, 17.239667892456055, 17.967247009277344, 18.69482421875, 19.422401428222656, 20.149978637695312, 20.87755584716797, 21.605134963989258, 22.332712173461914, 23.06028938293457, 23.78786849975586, 24.515445709228516, 25.243022918701172, 25.97060203552246]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 6.0, 11.0, 10.0, 11.0, 9.0, 21.0, 15.0, 21.0, 34.0, 20.0, 24.0, 25.0, 34.0, 48.0, 36.0, 34.0, 43.0, 54.0, 39.0, 47.0, 43.0, 49.0, 35.0, 41.0, 29.0, 35.0, 33.0, 21.0, 24.0, 23.0, 21.0, 15.0, 14.0, 8.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.794921875, -1.7416534423828125, -1.688385009765625, -1.6351165771484375, -1.58184814453125, -1.5285797119140625, -1.475311279296875, -1.4220428466796875, -1.3687744140625, -1.3155059814453125, -1.262237548828125, -1.2089691162109375, -1.15570068359375, -1.1024322509765625, -1.049163818359375, -0.9958953857421875, -0.942626953125, -0.8893585205078125, -0.836090087890625, -0.7828216552734375, -0.72955322265625, -0.6762847900390625, -0.623016357421875, -0.5697479248046875, -0.5164794921875, -0.4632110595703125, -0.409942626953125, -0.3566741943359375, -0.30340576171875, -0.2501373291015625, -0.196868896484375, -0.1436004638671875, -0.09033203125, -0.0370635986328125, 0.016204833984375, 0.0694732666015625, 0.12274169921875, 0.1760101318359375, 0.229278564453125, 0.2825469970703125, 0.3358154296875, 0.3890838623046875, 0.442352294921875, 0.4956207275390625, 0.54888916015625, 0.6021575927734375, 0.655426025390625, 0.7086944580078125, 0.761962890625, 0.8152313232421875, 0.868499755859375, 0.9217681884765625, 0.97503662109375, 1.0283050537109375, 1.081573486328125, 1.1348419189453125, 1.1881103515625, 1.2413787841796875, 1.294647216796875, 1.3479156494140625, 1.40118408203125, 1.4544525146484375, 1.507720947265625, 1.5609893798828125, 1.6142578125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 13.0, 11.0, 21.0, 19.0, 18.0, 37.0, 43.0, 84.0, 124.0, 215.0, 304.0, 509.0, 870.0, 1611.0, 2886.0, 5368.0, 11372.0, 25495.0, 68031.0, 295125.0, 3256945.0, 400281.0, 75026.0, 27016.0, 11402.0, 5284.0, 2779.0, 1451.0, 766.0, 437.0, 250.0, 165.0, 103.0, 74.0, 30.0, 37.0, 28.0, 15.0, 14.0, 9.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.27337646484375, -7.0428466796875, -6.81231689453125, -6.581787109375, -6.35125732421875, -6.1207275390625, -5.89019775390625, -5.65966796875, -5.42913818359375, -5.1986083984375, -4.96807861328125, -4.737548828125, -4.50701904296875, -4.2764892578125, -4.04595947265625, -3.8154296875, -3.58489990234375, -3.3543701171875, -3.12384033203125, -2.893310546875, -2.66278076171875, -2.4322509765625, -2.20172119140625, -1.97119140625, -1.74066162109375, -1.5101318359375, -1.27960205078125, -1.049072265625, -0.81854248046875, -0.5880126953125, -0.35748291015625, -0.126953125, 0.10357666015625, 0.3341064453125, 0.56463623046875, 0.795166015625, 1.02569580078125, 1.2562255859375, 1.48675537109375, 1.71728515625, 1.94781494140625, 2.1783447265625, 2.40887451171875, 2.639404296875, 2.86993408203125, 3.1004638671875, 3.33099365234375, 3.5615234375, 3.79205322265625, 4.0225830078125, 4.25311279296875, 4.483642578125, 4.71417236328125, 4.9447021484375, 5.17523193359375, 5.40576171875, 5.63629150390625, 5.8668212890625, 6.09735107421875, 6.327880859375, 6.55841064453125, 6.7889404296875, 7.01947021484375, 7.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 12.0, 16.0, 18.0, 30.0, 41.0, 64.0, 60.0, 95.0, 125.0, 253.0, 458.0, 1021.0, 838.0, 362.0, 207.0, 157.0, 76.0, 69.0, 48.0, 38.0, 23.0, 18.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.78179931640625, -6.4971923828125, -6.21258544921875, -5.927978515625, -5.64337158203125, -5.3587646484375, -5.07415771484375, -4.78955078125, -4.50494384765625, -4.2203369140625, -3.93572998046875, -3.651123046875, -3.36651611328125, -3.0819091796875, -2.79730224609375, -2.5126953125, -2.22808837890625, -1.9434814453125, -1.65887451171875, -1.374267578125, -1.08966064453125, -0.8050537109375, -0.52044677734375, -0.23583984375, 0.04876708984375, 0.3333740234375, 0.61798095703125, 0.902587890625, 1.18719482421875, 1.4718017578125, 1.75640869140625, 2.041015625, 2.32562255859375, 2.6102294921875, 2.89483642578125, 3.179443359375, 3.46405029296875, 3.7486572265625, 4.03326416015625, 4.31787109375, 4.60247802734375, 4.8870849609375, 5.17169189453125, 5.456298828125, 5.74090576171875, 6.0255126953125, 6.31011962890625, 6.5947265625, 6.87933349609375, 7.1639404296875, 7.44854736328125, 7.733154296875, 8.01776123046875, 8.3023681640625, 8.58697509765625, 8.87158203125, 9.15618896484375, 9.4407958984375, 9.72540283203125, 10.010009765625, 10.29461669921875, 10.5792236328125, 10.86383056640625, 11.1484375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 11.0, 12.0, 23.0, 21.0, 26.0, 44.0, 66.0, 122.0, 193.0, 340.0, 598.0, 1199.0, 2514.0, 6167.0, 16359.0, 50694.0, 200574.0, 2786965.0, 950454.0, 123257.0, 34204.0, 11727.0, 4599.0, 1914.0, 929.0, 530.0, 257.0, 156.0, 98.0, 61.0, 51.0, 33.0, 17.0, 13.0, 10.0, 10.0, 7.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.4921875, -15.0474853515625, -14.602783203125, -14.1580810546875, -13.71337890625, -13.2686767578125, -12.823974609375, -12.3792724609375, -11.9345703125, -11.4898681640625, -11.045166015625, -10.6004638671875, -10.15576171875, -9.7110595703125, -9.266357421875, -8.8216552734375, -8.376953125, -7.9322509765625, -7.487548828125, -7.0428466796875, -6.59814453125, -6.1534423828125, -5.708740234375, -5.2640380859375, -4.8193359375, -4.3746337890625, -3.929931640625, -3.4852294921875, -3.04052734375, -2.5958251953125, -2.151123046875, -1.7064208984375, -1.26171875, -0.8170166015625, -0.372314453125, 0.0723876953125, 0.51708984375, 0.9617919921875, 1.406494140625, 1.8511962890625, 2.2958984375, 2.7406005859375, 3.185302734375, 3.6300048828125, 4.07470703125, 4.5194091796875, 4.964111328125, 5.4088134765625, 5.853515625, 6.2982177734375, 6.742919921875, 7.1876220703125, 7.63232421875, 8.0770263671875, 8.521728515625, 8.9664306640625, 9.4111328125, 9.8558349609375, 10.300537109375, 10.7452392578125, 11.18994140625, 11.6346435546875, 12.079345703125, 12.5240478515625, 12.96875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 10.0, 15.0, 19.0, 22.0, 27.0, 38.0, 70.0, 71.0, 103.0, 105.0, 102.0, 96.0, 72.0, 70.0, 36.0, 33.0, 19.0, 25.0, 14.0, 13.0, 6.0, 3.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.627105712890625, -40.634674072265625, -39.64223861694336, -38.649803161621094, -37.657371520996094, -36.664939880371094, -35.67250442504883, -34.68006896972656, -33.68763732910156, -32.69520568847656, -31.702770233154297, -30.710336685180664, -29.71790313720703, -28.7254695892334, -27.733036041259766, -26.740602493286133, -25.7481689453125, -24.755735397338867, -23.763301849365234, -22.7708683013916, -21.77843475341797, -20.786001205444336, -19.793567657470703, -18.80113410949707, -17.808700561523438, -16.816267013549805, -15.823833465576172, -14.831399917602539, -13.838966369628906, -12.846532821655273, -11.85409927368164, -10.861665725708008, -9.869230270385742, -8.87679672241211, -7.884363174438477, -6.891929626464844, -5.899496078491211, -4.907062530517578, -3.9146289825439453, -2.9221954345703125, -1.9297618865966797, -0.9373283386230469, 0.05510520935058594, 1.0475387573242188, 2.0399723052978516, 3.0324058532714844, 4.024839401245117, 5.01727294921875, 6.009706497192383, 7.002140045166016, 7.994573593139648, 8.987007141113281, 9.979440689086914, 10.971874237060547, 11.96430778503418, 12.956741333007812, 13.949174880981445, 14.941608428955078, 15.934041976928711, 16.926475524902344, 17.918909072875977, 18.91134262084961, 19.903776168823242, 20.896209716796875, 21.888643264770508]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 10.0, 10.0, 20.0, 12.0, 17.0, 28.0, 25.0, 21.0, 28.0, 28.0, 36.0, 40.0, 35.0, 36.0, 46.0, 38.0, 41.0, 49.0, 41.0, 41.0, 29.0, 41.0, 41.0, 27.0, 40.0, 15.0, 28.0, 27.0, 27.0, 15.0, 14.0, 14.0, 7.0, 10.0, 10.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.314502716064453, -21.644657135009766, -20.97481346130371, -20.304967880249023, -19.63512420654297, -18.96527862548828, -18.295434951782227, -17.62558937072754, -16.955745697021484, -16.285900115966797, -15.616056442260742, -14.946211814880371, -14.2763671875, -13.606522560119629, -12.936677932739258, -12.26683235168457, -11.5969877243042, -10.927143096923828, -10.257298469543457, -9.587453842163086, -8.917609214782715, -8.247764587402344, -7.5779194831848145, -6.908074855804443, -6.238230228424072, -5.568385601043701, -4.89854097366333, -4.228695869445801, -3.558851480484009, -2.8890068531036377, -2.2191619873046875, -1.5493173599243164, -0.8794727325439453, -0.20962804555892944, 0.4602166414260864, 1.130061388015747, 1.7999060153961182, 2.4697506427764893, 3.1395955085754395, 3.8094401359558105, 4.479284763336182, 5.149129390716553, 5.818974018096924, 6.488819122314453, 7.158663749694824, 7.828508377075195, 8.498353004455566, 9.168197631835938, 9.838042259216309, 10.50788688659668, 11.17773151397705, 11.847576141357422, 12.517420768737793, 13.187265396118164, 13.857110977172852, 14.526954650878906, 15.196800231933594, 15.866644859313965, 16.536489486694336, 17.206335067749023, 17.876178741455078, 18.546024322509766, 19.21586799621582, 19.885713577270508, 20.555557250976562]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 13.0, 19.0, 15.0, 20.0, 18.0, 27.0, 33.0, 30.0, 34.0, 35.0, 46.0, 38.0, 35.0, 60.0, 48.0, 33.0, 42.0, 51.0, 53.0, 40.0, 38.0, 26.0, 33.0, 32.0, 23.0, 24.0, 26.0, 24.0, 11.0, 12.0, 7.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.126953125, -2.0662384033203125, -2.005523681640625, -1.9448089599609375, -1.88409423828125, -1.8233795166015625, -1.762664794921875, -1.7019500732421875, -1.6412353515625, -1.5805206298828125, -1.519805908203125, -1.4590911865234375, -1.39837646484375, -1.3376617431640625, -1.276947021484375, -1.2162322998046875, -1.155517578125, -1.0948028564453125, -1.034088134765625, -0.9733734130859375, -0.91265869140625, -0.8519439697265625, -0.791229248046875, -0.7305145263671875, -0.6697998046875, -0.6090850830078125, -0.548370361328125, -0.4876556396484375, -0.42694091796875, -0.3662261962890625, -0.305511474609375, -0.2447967529296875, -0.18408203125, -0.1233673095703125, -0.062652587890625, -0.0019378662109375, 0.05877685546875, 0.1194915771484375, 0.180206298828125, 0.2409210205078125, 0.3016357421875, 0.3623504638671875, 0.423065185546875, 0.4837799072265625, 0.54449462890625, 0.6052093505859375, 0.665924072265625, 0.7266387939453125, 0.787353515625, 0.8480682373046875, 0.908782958984375, 0.9694976806640625, 1.03021240234375, 1.0909271240234375, 1.151641845703125, 1.2123565673828125, 1.2730712890625, 1.3337860107421875, 1.394500732421875, 1.4552154541015625, 1.51593017578125, 1.5766448974609375, 1.637359619140625, 1.6980743408203125, 1.7587890625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 5.0, 8.0, 14.0, 19.0, 26.0, 40.0, 75.0, 103.0, 164.0, 230.0, 325.0, 557.0, 890.0, 1386.0, 2401.0, 4185.0, 6981.0, 12640.0, 23114.0, 45474.0, 94733.0, 230778.0, 362975.0, 132082.0, 60989.0, 30189.0, 16326.0, 9055.0, 5108.0, 2979.0, 1714.0, 1074.0, 664.0, 399.0, 275.0, 196.0, 129.0, 79.0, 50.0, 36.0, 23.0, 21.0, 12.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3695068359375, -9.059326171875, -8.7491455078125, -8.43896484375, -8.1287841796875, -7.818603515625, -7.5084228515625, -7.1982421875, -6.8880615234375, -6.577880859375, -6.2677001953125, -5.95751953125, -5.6473388671875, -5.337158203125, -5.0269775390625, -4.716796875, -4.4066162109375, -4.096435546875, -3.7862548828125, -3.47607421875, -3.1658935546875, -2.855712890625, -2.5455322265625, -2.2353515625, -1.9251708984375, -1.614990234375, -1.3048095703125, -0.99462890625, -0.6844482421875, -0.374267578125, -0.0640869140625, 0.24609375, 0.5562744140625, 0.866455078125, 1.1766357421875, 1.48681640625, 1.7969970703125, 2.107177734375, 2.4173583984375, 2.7275390625, 3.0377197265625, 3.347900390625, 3.6580810546875, 3.96826171875, 4.2784423828125, 4.588623046875, 4.8988037109375, 5.208984375, 5.5191650390625, 5.829345703125, 6.1395263671875, 6.44970703125, 6.7598876953125, 7.070068359375, 7.3802490234375, 7.6904296875, 8.0006103515625, 8.310791015625, 8.6209716796875, 8.93115234375, 9.2413330078125, 9.551513671875, 9.8616943359375, 10.171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 10.0, 9.0, 11.0, 13.0, 19.0, 23.0, 30.0, 35.0, 28.0, 28.0, 31.0, 41.0, 46.0, 52.0, 51.0, 44.0, 1068.0, 46.0, 48.0, 27.0, 54.0, 29.0, 45.0, 45.0, 27.0, 26.0, 26.0, 19.0, 14.0, 10.0, 15.0, 13.0, 7.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9279937744140625, -1.865753173828125, -1.8035125732421875, -1.74127197265625, -1.6790313720703125, -1.616790771484375, -1.5545501708984375, -1.4923095703125, -1.4300689697265625, -1.367828369140625, -1.3055877685546875, -1.24334716796875, -1.1811065673828125, -1.118865966796875, -1.0566253662109375, -0.994384765625, -0.9321441650390625, -0.869903564453125, -0.8076629638671875, -0.74542236328125, -0.6831817626953125, -0.620941162109375, -0.5587005615234375, -0.4964599609375, -0.4342193603515625, -0.371978759765625, -0.3097381591796875, -0.24749755859375, -0.1852569580078125, -0.123016357421875, -0.0607757568359375, 0.00146484375, 0.0637054443359375, 0.125946044921875, 0.1881866455078125, 0.25042724609375, 0.3126678466796875, 0.374908447265625, 0.4371490478515625, 0.4993896484375, 0.5616302490234375, 0.623870849609375, 0.6861114501953125, 0.74835205078125, 0.8105926513671875, 0.872833251953125, 0.9350738525390625, 0.997314453125, 1.0595550537109375, 1.121795654296875, 1.1840362548828125, 1.24627685546875, 1.3085174560546875, 1.370758056640625, 1.4329986572265625, 1.4952392578125, 1.5574798583984375, 1.619720458984375, 1.6819610595703125, 1.74420166015625, 1.8064422607421875, 1.868682861328125, 1.9309234619140625, 1.9931640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 12.0, 9.0, 18.0, 33.0, 52.0, 83.0, 143.0, 251.0, 360.0, 687.0, 1285.0, 2331.0, 4612.0, 10008.0, 25140.0, 78515.0, 779240.0, 1062726.0, 85201.0, 25904.0, 10361.0, 4815.0, 2409.0, 1183.0, 734.0, 416.0, 251.0, 114.0, 94.0, 46.0, 31.0, 24.0, 12.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.953125, -12.5487060546875, -12.144287109375, -11.7398681640625, -11.33544921875, -10.9310302734375, -10.526611328125, -10.1221923828125, -9.7177734375, -9.3133544921875, -8.908935546875, -8.5045166015625, -8.10009765625, -7.6956787109375, -7.291259765625, -6.8868408203125, -6.482421875, -6.0780029296875, -5.673583984375, -5.2691650390625, -4.86474609375, -4.4603271484375, -4.055908203125, -3.6514892578125, -3.2470703125, -2.8426513671875, -2.438232421875, -2.0338134765625, -1.62939453125, -1.2249755859375, -0.820556640625, -0.4161376953125, -0.01171875, 0.3927001953125, 0.797119140625, 1.2015380859375, 1.60595703125, 2.0103759765625, 2.414794921875, 2.8192138671875, 3.2236328125, 3.6280517578125, 4.032470703125, 4.4368896484375, 4.84130859375, 5.2457275390625, 5.650146484375, 6.0545654296875, 6.458984375, 6.8634033203125, 7.267822265625, 7.6722412109375, 8.07666015625, 8.4810791015625, 8.885498046875, 9.2899169921875, 9.6943359375, 10.0987548828125, 10.503173828125, 10.9075927734375, 11.31201171875, 11.7164306640625, 12.120849609375, 12.5252685546875, 12.9296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 23.0, 27.0, 43.0, 65.0, 199.0, 302.0, 108.0, 65.0, 39.0, 23.0, 12.0, 11.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.54296875, -4.410369873046875, -4.27777099609375, -4.145172119140625, -4.0125732421875, -3.879974365234375, -3.74737548828125, -3.614776611328125, -3.482177734375, -3.349578857421875, -3.21697998046875, -3.084381103515625, -2.9517822265625, -2.819183349609375, -2.68658447265625, -2.553985595703125, -2.42138671875, -2.288787841796875, -2.15618896484375, -2.023590087890625, -1.8909912109375, -1.758392333984375, -1.62579345703125, -1.493194580078125, -1.360595703125, -1.227996826171875, -1.09539794921875, -0.962799072265625, -0.8302001953125, -0.697601318359375, -0.56500244140625, -0.432403564453125, -0.2998046875, -0.167205810546875, -0.03460693359375, 0.097991943359375, 0.2305908203125, 0.363189697265625, 0.49578857421875, 0.628387451171875, 0.760986328125, 0.893585205078125, 1.02618408203125, 1.158782958984375, 1.2913818359375, 1.423980712890625, 1.55657958984375, 1.689178466796875, 1.82177734375, 1.954376220703125, 2.08697509765625, 2.219573974609375, 2.3521728515625, 2.484771728515625, 2.61737060546875, 2.749969482421875, 2.882568359375, 3.015167236328125, 3.14776611328125, 3.280364990234375, 3.4129638671875, 3.545562744140625, 3.67816162109375, 3.810760498046875, 3.943359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 7.0, 16.0, 14.0, 29.0, 30.0, 42.0, 67.0, 133.0, 401.0, 1306.0, 6589.0, 203829.0, 825381.0, 8315.0, 1583.0, 409.0, 136.0, 77.0, 33.0, 31.0, 19.0, 16.0, 14.0, 9.0, 8.0, 6.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.97119140625, -47.2861328125, -45.60107421875, -43.916015625, -42.23095703125, -40.5458984375, -38.86083984375, -37.17578125, -35.49072265625, -33.8056640625, -32.12060546875, -30.435546875, -28.75048828125, -27.0654296875, -25.38037109375, -23.6953125, -22.01025390625, -20.3251953125, -18.64013671875, -16.955078125, -15.27001953125, -13.5849609375, -11.89990234375, -10.21484375, -8.52978515625, -6.8447265625, -5.15966796875, -3.474609375, -1.78955078125, -0.1044921875, 1.58056640625, 3.265625, 4.95068359375, 6.6357421875, 8.32080078125, 10.005859375, 11.69091796875, 13.3759765625, 15.06103515625, 16.74609375, 18.43115234375, 20.1162109375, 21.80126953125, 23.486328125, 25.17138671875, 26.8564453125, 28.54150390625, 30.2265625, 31.91162109375, 33.5966796875, 35.28173828125, 36.966796875, 38.65185546875, 40.3369140625, 42.02197265625, 43.70703125, 45.39208984375, 47.0771484375, 48.76220703125, 50.447265625, 52.13232421875, 53.8173828125, 55.50244140625, 57.1875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 18.0, 59.0, 165.0, 398.0, 257.0, 75.0, 19.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.732600212097168, -5.197275161743164, -4.661950588226318, -4.126626014709473, -3.5913009643554688, -3.055976152420044, -2.520651340484619, -1.9853265285491943, -1.4500017166137695, -0.9146769046783447, -0.3793520927429199, 0.15597271919250488, 0.6912975311279297, 1.2266223430633545, 1.7619471549987793, 2.297271966934204, 2.832596778869629, 3.3679215908050537, 3.9032464027404785, 4.438570976257324, 4.973896026611328, 5.509221076965332, 6.044545650482178, 6.579870223999023, 7.115195274353027, 7.650520324707031, 8.185844421386719, 8.721169471740723, 9.256494522094727, 9.79181957244873, 10.327144622802734, 10.862468719482422, 11.39779281616211, 11.933117866516113, 12.468442916870117, 13.003767013549805, 13.539092063903809, 14.074417114257812, 14.6097412109375, 15.145066261291504, 15.680391311645508, 16.215715408325195, 16.751041412353516, 17.286365509033203, 17.82168960571289, 18.35701560974121, 18.8923397064209, 19.42766571044922, 19.962989807128906, 20.498313903808594, 21.033639907836914, 21.5689640045166, 22.104290008544922, 22.63961410522461, 23.174938201904297, 23.710264205932617, 24.245588302612305, 24.780912399291992, 25.316238403320312, 25.8515625, 26.386886596679688, 26.922212600708008, 27.457536697387695, 27.992862701416016, 28.528186798095703]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 10.0, 4.0, 5.0, 9.0, 8.0, 18.0, 19.0, 22.0, 17.0, 24.0, 30.0, 32.0, 34.0, 44.0, 61.0, 46.0, 53.0, 50.0, 58.0, 49.0, 50.0, 49.0, 39.0, 36.0, 43.0, 48.0, 25.0, 20.0, 24.0, 25.0, 13.0, 14.0, 14.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4067554473876953, -2.2869205474853516, -2.167085886001587, -2.047250986099243, -1.927416205406189, -1.8075814247131348, -1.687746524810791, -1.5679117441177368, -1.4480769634246826, -1.3282421827316284, -1.2084074020385742, -1.0885725021362305, -0.9687377214431763, -0.8489029407501221, -0.7290681004524231, -0.6092332601547241, -0.4893984794616699, -0.36956366896629333, -0.24972885847091675, -0.12989404797554016, -0.010059237480163574, 0.10977554321289062, 0.2296103835105896, 0.3494452238082886, 0.4692800045013428, 0.589114785194397, 0.708949625492096, 0.8287844657897949, 0.9486192464828491, 1.0684540271759033, 1.188288927078247, 1.3081237077713013, 1.4279584884643555, 1.5477932691574097, 1.6676280498504639, 1.7874629497528076, 1.9072977304458618, 2.027132511138916, 2.1469674110412598, 2.2668023109436035, 2.386636972427368, 2.506471872329712, 2.6263065338134766, 2.7461414337158203, 2.865976333618164, 2.9858109951019287, 3.1056458950042725, 3.225480556488037, 3.345315456390381, 3.4651503562927246, 3.5849850177764893, 3.704819917678833, 3.8246545791625977, 3.9444894790649414, 4.064324378967285, 4.184159278869629, 4.303994178771973, 4.423829078674316, 4.54366397857666, 4.663498401641846, 4.7833333015441895, 4.903168201446533, 5.023003101348877, 5.142838001251221, 5.262672424316406]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 12.0, 10.0, 11.0, 17.0, 23.0, 24.0, 29.0, 25.0, 32.0, 30.0, 39.0, 57.0, 39.0, 58.0, 56.0, 46.0, 50.0, 45.0, 53.0, 41.0, 45.0, 33.0, 44.0, 27.0, 27.0, 29.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.17535400390625, -2.1085205078125, -2.04168701171875, -1.974853515625, -1.90802001953125, -1.8411865234375, -1.77435302734375, -1.70751953125, -1.64068603515625, -1.5738525390625, -1.50701904296875, -1.440185546875, -1.37335205078125, -1.3065185546875, -1.23968505859375, -1.1728515625, -1.10601806640625, -1.0391845703125, -0.97235107421875, -0.905517578125, -0.83868408203125, -0.7718505859375, -0.70501708984375, -0.63818359375, -0.57135009765625, -0.5045166015625, -0.43768310546875, -0.370849609375, -0.30401611328125, -0.2371826171875, -0.17034912109375, -0.103515625, -0.03668212890625, 0.0301513671875, 0.09698486328125, 0.163818359375, 0.23065185546875, 0.2974853515625, 0.36431884765625, 0.43115234375, 0.49798583984375, 0.5648193359375, 0.63165283203125, 0.698486328125, 0.76531982421875, 0.8321533203125, 0.89898681640625, 0.9658203125, 1.03265380859375, 1.0994873046875, 1.16632080078125, 1.233154296875, 1.29998779296875, 1.3668212890625, 1.43365478515625, 1.50048828125, 1.56732177734375, 1.6341552734375, 1.70098876953125, 1.767822265625, 1.83465576171875, 1.9014892578125, 1.96832275390625, 2.03515625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 16.0, 14.0, 20.0, 30.0, 33.0, 53.0, 89.0, 126.0, 224.0, 297.0, 479.0, 943.0, 1737.0, 3461.0, 7274.0, 18681.0, 61330.0, 308724.0, 493430.0, 104745.0, 27379.0, 10033.0, 4329.0, 2192.0, 1130.0, 657.0, 388.0, 238.0, 148.0, 96.0, 77.0, 47.0, 34.0, 21.0, 20.0, 16.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.135162353515625, -2.05938720703125, -1.983612060546875, -1.9078369140625, -1.832061767578125, -1.75628662109375, -1.680511474609375, -1.604736328125, -1.528961181640625, -1.45318603515625, -1.377410888671875, -1.3016357421875, -1.225860595703125, -1.15008544921875, -1.074310302734375, -0.99853515625, -0.922760009765625, -0.84698486328125, -0.771209716796875, -0.6954345703125, -0.619659423828125, -0.54388427734375, -0.468109130859375, -0.392333984375, -0.316558837890625, -0.24078369140625, -0.165008544921875, -0.0892333984375, -0.013458251953125, 0.06231689453125, 0.138092041015625, 0.2138671875, 0.289642333984375, 0.36541748046875, 0.441192626953125, 0.5169677734375, 0.592742919921875, 0.66851806640625, 0.744293212890625, 0.820068359375, 0.895843505859375, 0.97161865234375, 1.047393798828125, 1.1231689453125, 1.198944091796875, 1.27471923828125, 1.350494384765625, 1.42626953125, 1.502044677734375, 1.57781982421875, 1.653594970703125, 1.7293701171875, 1.805145263671875, 1.88092041015625, 1.956695556640625, 2.032470703125, 2.108245849609375, 2.18402099609375, 2.259796142578125, 2.3355712890625, 2.411346435546875, 2.48712158203125, 2.562896728515625, 2.638671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 17.0, 14.0, 11.0, 13.0, 22.0, 34.0, 35.0, 27.0, 30.0, 49.0, 37.0, 54.0, 104.0, 481.0, 1569.0, 102.0, 55.0, 53.0, 37.0, 42.0, 43.0, 29.0, 25.0, 25.0, 18.0, 21.0, 21.0, 13.0, 9.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.0390625, -7.79559326171875, -7.5521240234375, -7.30865478515625, -7.065185546875, -6.82171630859375, -6.5782470703125, -6.33477783203125, -6.09130859375, -5.84783935546875, -5.6043701171875, -5.36090087890625, -5.117431640625, -4.87396240234375, -4.6304931640625, -4.38702392578125, -4.1435546875, -3.90008544921875, -3.6566162109375, -3.41314697265625, -3.169677734375, -2.92620849609375, -2.6827392578125, -2.43927001953125, -2.19580078125, -1.95233154296875, -1.7088623046875, -1.46539306640625, -1.221923828125, -0.97845458984375, -0.7349853515625, -0.49151611328125, -0.248046875, -0.00457763671875, 0.2388916015625, 0.48236083984375, 0.725830078125, 0.96929931640625, 1.2127685546875, 1.45623779296875, 1.69970703125, 1.94317626953125, 2.1866455078125, 2.43011474609375, 2.673583984375, 2.91705322265625, 3.1605224609375, 3.40399169921875, 3.6474609375, 3.89093017578125, 4.1343994140625, 4.37786865234375, 4.621337890625, 4.86480712890625, 5.1082763671875, 5.35174560546875, 5.59521484375, 5.83868408203125, 6.0821533203125, 6.32562255859375, 6.569091796875, 6.81256103515625, 7.0560302734375, 7.29949951171875, 7.54296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 10.0, 7.0, 8.0, 19.0, 12.0, 28.0, 22.0, 41.0, 37.0, 67.0, 93.0, 169.0, 352.0, 963.0, 3785.0, 20974.0, 371483.0, 2680276.0, 56846.0, 7645.0, 1760.0, 505.0, 214.0, 96.0, 75.0, 56.0, 40.0, 28.0, 21.0, 10.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.16082763671875, -7.9075927734375, -7.65435791015625, -7.401123046875, -7.14788818359375, -6.8946533203125, -6.64141845703125, -6.38818359375, -6.13494873046875, -5.8817138671875, -5.62847900390625, -5.375244140625, -5.12200927734375, -4.8687744140625, -4.61553955078125, -4.3623046875, -4.10906982421875, -3.8558349609375, -3.60260009765625, -3.349365234375, -3.09613037109375, -2.8428955078125, -2.58966064453125, -2.33642578125, -2.08319091796875, -1.8299560546875, -1.57672119140625, -1.323486328125, -1.07025146484375, -0.8170166015625, -0.56378173828125, -0.310546875, -0.05731201171875, 0.1959228515625, 0.44915771484375, 0.702392578125, 0.95562744140625, 1.2088623046875, 1.46209716796875, 1.71533203125, 1.96856689453125, 2.2218017578125, 2.47503662109375, 2.728271484375, 2.98150634765625, 3.2347412109375, 3.48797607421875, 3.7412109375, 3.99444580078125, 4.2476806640625, 4.50091552734375, 4.754150390625, 5.00738525390625, 5.2606201171875, 5.51385498046875, 5.76708984375, 6.02032470703125, 6.2735595703125, 6.52679443359375, 6.780029296875, 7.03326416015625, 7.2864990234375, 7.53973388671875, 7.79296875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [25.0, 547.0, 427.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.352025032043457, -2.1149377822875977, 0.12214946746826172, 2.359236717224121, 4.5963239669799805, 6.83341121673584, 9.0704984664917, 11.307585716247559, 13.544672966003418, 15.781760215759277, 18.018848419189453, 20.255935668945312, 22.493022918701172, 24.73011016845703, 26.96719741821289, 29.20428466796875, 31.44137191772461, 33.67845916748047, 35.91554641723633, 38.15263366699219, 40.38972091674805, 42.626808166503906, 44.863895416259766, 47.100982666015625, 49.338069915771484, 51.575157165527344, 53.8122444152832, 56.04933166503906, 58.28641891479492, 60.52350616455078, 62.76059341430664, 64.9976806640625, 67.23477172851562, 69.47186279296875, 71.70894622802734, 73.94602966308594, 76.18312072753906, 78.42021179199219, 80.65729522705078, 82.89437866210938, 85.1314697265625, 87.36856079101562, 89.60564422607422, 91.84272766113281, 94.07981872558594, 96.31690979003906, 98.55399322509766, 100.79107666015625, 103.02816772460938, 105.2652587890625, 107.5023422241211, 109.73942565917969, 111.97651672363281, 114.21360778808594, 116.45069122314453, 118.68777465820312, 120.92486572265625, 123.16195678710938, 125.39904022216797, 127.63612365722656, 129.8732147216797, 132.1103057861328, 134.34738159179688, 136.58447265625, 138.82156372070312]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 13.0, 13.0, 18.0, 17.0, 24.0, 24.0, 34.0, 48.0, 36.0, 42.0, 48.0, 44.0, 37.0, 32.0, 34.0, 58.0, 39.0, 34.0, 23.0, 36.0, 38.0, 31.0, 34.0, 28.0, 27.0, 22.0, 17.0, 22.0, 19.0, 17.0, 9.0, 13.0, 8.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.37146759033203, -19.653667449951172, -18.935867309570312, -18.218067169189453, -17.500267028808594, -16.782468795776367, -16.064668655395508, -15.346868515014648, -14.629068374633789, -13.91126823425293, -13.19346809387207, -12.475668907165527, -11.757868766784668, -11.040068626403809, -10.322269439697266, -9.604469299316406, -8.886669158935547, -8.168869018554688, -7.451069355010986, -6.733269691467285, -6.015469551086426, -5.297669410705566, -4.579869747161865, -3.862070083618164, -3.1442699432373047, -2.4264700412750244, -1.7086701393127441, -0.9908702373504639, -0.2730703353881836, 0.4447295665740967, 1.162529468536377, 1.8803291320800781, 2.5981311798095703, 3.3159310817718506, 4.033730983734131, 4.751530647277832, 5.469330787658691, 6.187130928039551, 6.904930591583252, 7.622730255126953, 8.340530395507812, 9.058330535888672, 9.776130676269531, 10.493929862976074, 11.211730003356934, 11.929530143737793, 12.647329330444336, 13.365129470825195, 14.082929611206055, 14.800729751586914, 15.518529891967773, 16.236330032348633, 16.95412826538086, 17.67192840576172, 18.389728546142578, 19.107528686523438, 19.825328826904297, 20.543128967285156, 21.260929107666016, 21.978729248046875, 22.696529388427734, 23.41432762145996, 24.13212776184082, 24.84992790222168, 25.56772804260254]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 17.0, 11.0, 26.0, 32.0, 19.0, 30.0, 28.0, 38.0, 41.0, 32.0, 39.0, 58.0, 49.0, 34.0, 64.0, 56.0, 51.0, 43.0, 38.0, 40.0, 41.0, 32.0, 38.0, 19.0, 17.0, 13.0, 18.0, 7.0, 11.0, 9.0, 3.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.302734375, -2.2364501953125, -2.170166015625, -2.1038818359375, -2.03759765625, -1.9713134765625, -1.905029296875, -1.8387451171875, -1.7724609375, -1.7061767578125, -1.639892578125, -1.5736083984375, -1.50732421875, -1.4410400390625, -1.374755859375, -1.3084716796875, -1.2421875, -1.1759033203125, -1.109619140625, -1.0433349609375, -0.97705078125, -0.9107666015625, -0.844482421875, -0.7781982421875, -0.7119140625, -0.6456298828125, -0.579345703125, -0.5130615234375, -0.44677734375, -0.3804931640625, -0.314208984375, -0.2479248046875, -0.181640625, -0.1153564453125, -0.049072265625, 0.0172119140625, 0.08349609375, 0.1497802734375, 0.216064453125, 0.2823486328125, 0.3486328125, 0.4149169921875, 0.481201171875, 0.5474853515625, 0.61376953125, 0.6800537109375, 0.746337890625, 0.8126220703125, 0.87890625, 0.9451904296875, 1.011474609375, 1.0777587890625, 1.14404296875, 1.2103271484375, 1.276611328125, 1.3428955078125, 1.4091796875, 1.4754638671875, 1.541748046875, 1.6080322265625, 1.67431640625, 1.7406005859375, 1.806884765625, 1.8731689453125, 1.939453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 42.0, 66.0, 99.0, 115.0, 150.0, 218.0, 335.0, 504.0, 727.0, 1181.0, 1778.0, 2761.0, 4440.0, 7495.0, 12859.0, 22770.0, 44294.0, 103832.0, 626466.0, 2775035.0, 412048.0, 88648.0, 39105.0, 20446.0, 11462.0, 6531.0, 3892.0, 2381.0, 1542.0, 932.0, 605.0, 439.0, 277.0, 225.0, 148.0, 110.0, 89.0, 42.0, 38.0, 23.0, 11.0, 15.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.87890625, -4.72357177734375, -4.5682373046875, -4.41290283203125, -4.257568359375, -4.10223388671875, -3.9468994140625, -3.79156494140625, -3.63623046875, -3.48089599609375, -3.3255615234375, -3.17022705078125, -3.014892578125, -2.85955810546875, -2.7042236328125, -2.54888916015625, -2.3935546875, -2.23822021484375, -2.0828857421875, -1.92755126953125, -1.772216796875, -1.61688232421875, -1.4615478515625, -1.30621337890625, -1.15087890625, -0.99554443359375, -0.8402099609375, -0.68487548828125, -0.529541015625, -0.37420654296875, -0.2188720703125, -0.06353759765625, 0.091796875, 0.24713134765625, 0.4024658203125, 0.55780029296875, 0.713134765625, 0.86846923828125, 1.0238037109375, 1.17913818359375, 1.33447265625, 1.48980712890625, 1.6451416015625, 1.80047607421875, 1.955810546875, 2.11114501953125, 2.2664794921875, 2.42181396484375, 2.5771484375, 2.73248291015625, 2.8878173828125, 3.04315185546875, 3.198486328125, 3.35382080078125, 3.5091552734375, 3.66448974609375, 3.81982421875, 3.97515869140625, 4.1304931640625, 4.28582763671875, 4.441162109375, 4.59649658203125, 4.7518310546875, 4.90716552734375, 5.0625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 14.0, 17.0, 34.0, 45.0, 71.0, 117.0, 173.0, 297.0, 708.0, 1141.0, 655.0, 288.0, 174.0, 100.0, 75.0, 43.0, 32.0, 19.0, 12.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2578125, -10.9488525390625, -10.639892578125, -10.3309326171875, -10.02197265625, -9.7130126953125, -9.404052734375, -9.0950927734375, -8.7861328125, -8.4771728515625, -8.168212890625, -7.8592529296875, -7.55029296875, -7.2413330078125, -6.932373046875, -6.6234130859375, -6.314453125, -6.0054931640625, -5.696533203125, -5.3875732421875, -5.07861328125, -4.7696533203125, -4.460693359375, -4.1517333984375, -3.8427734375, -3.5338134765625, -3.224853515625, -2.9158935546875, -2.60693359375, -2.2979736328125, -1.989013671875, -1.6800537109375, -1.37109375, -1.0621337890625, -0.753173828125, -0.4442138671875, -0.13525390625, 0.1737060546875, 0.482666015625, 0.7916259765625, 1.1005859375, 1.4095458984375, 1.718505859375, 2.0274658203125, 2.33642578125, 2.6453857421875, 2.954345703125, 3.2633056640625, 3.572265625, 3.8812255859375, 4.190185546875, 4.4991455078125, 4.80810546875, 5.1170654296875, 5.426025390625, 5.7349853515625, 6.0439453125, 6.3529052734375, 6.661865234375, 6.9708251953125, 7.27978515625, 7.5887451171875, 7.897705078125, 8.2066650390625, 8.515625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 12.0, 14.0, 13.0, 24.0, 36.0, 23.0, 41.0, 46.0, 72.0, 103.0, 136.0, 175.0, 263.0, 428.0, 745.0, 1329.0, 2720.0, 5510.0, 12774.0, 31928.0, 96561.0, 472135.0, 3078413.0, 357934.0, 82316.0, 28538.0, 11259.0, 5018.0, 2443.0, 1182.0, 710.0, 469.0, 223.0, 179.0, 110.0, 98.0, 60.0, 55.0, 38.0, 29.0, 27.0, 16.0, 12.0, 13.0, 5.0, 8.0, 13.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5625, -10.2154541015625, -9.868408203125, -9.5213623046875, -9.17431640625, -8.8272705078125, -8.480224609375, -8.1331787109375, -7.7861328125, -7.4390869140625, -7.092041015625, -6.7449951171875, -6.39794921875, -6.0509033203125, -5.703857421875, -5.3568115234375, -5.009765625, -4.6627197265625, -4.315673828125, -3.9686279296875, -3.62158203125, -3.2745361328125, -2.927490234375, -2.5804443359375, -2.2333984375, -1.8863525390625, -1.539306640625, -1.1922607421875, -0.84521484375, -0.4981689453125, -0.151123046875, 0.1959228515625, 0.54296875, 0.8900146484375, 1.237060546875, 1.5841064453125, 1.93115234375, 2.2781982421875, 2.625244140625, 2.9722900390625, 3.3193359375, 3.6663818359375, 4.013427734375, 4.3604736328125, 4.70751953125, 5.0545654296875, 5.401611328125, 5.7486572265625, 6.095703125, 6.4427490234375, 6.789794921875, 7.1368408203125, 7.48388671875, 7.8309326171875, 8.177978515625, 8.5250244140625, 8.8720703125, 9.2191162109375, 9.566162109375, 9.9132080078125, 10.26025390625, 10.6072998046875, 10.954345703125, 11.3013916015625, 11.6484375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 10.0, 9.0, 15.0, 24.0, 30.0, 39.0, 44.0, 94.0, 118.0, 160.0, 138.0, 104.0, 72.0, 42.0, 43.0, 26.0, 16.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.158594131469727, -16.842029571533203, -15.525463104248047, -14.208897590637207, -12.892332077026367, -11.575766563415527, -10.259201049804688, -8.942635536193848, -7.626070022583008, -6.309504508972168, -4.992938995361328, -3.6763734817504883, -2.3598079681396484, -1.0432424545288086, 0.27332305908203125, 1.589888572692871, 2.906454086303711, 4.223019599914551, 5.539585113525391, 6.8561506271362305, 8.17271614074707, 9.48928165435791, 10.80584716796875, 12.12241268157959, 13.43897819519043, 14.75554370880127, 16.07210922241211, 17.388675689697266, 18.70524024963379, 20.021804809570312, 21.33837127685547, 22.654937744140625, 23.97150421142578, 25.288070678710938, 26.60463523864746, 27.921199798583984, 29.23776626586914, 30.554332733154297, 31.87089729309082, 33.187461853027344, 34.5040283203125, 35.820594787597656, 37.13716125488281, 38.4537239074707, 39.77029037475586, 41.086856842041016, 42.403419494628906, 43.71998596191406, 45.03655242919922, 46.353118896484375, 47.66968536376953, 48.98624801635742, 50.30281448364258, 51.619380950927734, 52.935943603515625, 54.25251007080078, 55.56907653808594, 56.885643005371094, 58.20220947265625, 59.51877212524414, 60.8353385925293, 62.15190505981445, 63.468467712402344, 64.7850341796875, 66.10160064697266]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 1.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 22.0, 28.0, 14.0, 22.0, 19.0, 31.0, 35.0, 39.0, 36.0, 38.0, 29.0, 29.0, 37.0, 36.0, 44.0, 49.0, 33.0, 44.0, 32.0, 37.0, 25.0, 34.0, 26.0, 29.0, 22.0, 30.0, 14.0, 12.0, 16.0, 17.0, 9.0, 10.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 6.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.290016174316406, -17.674758911132812, -17.059499740600586, -16.444242477416992, -15.828984260559082, -15.213726043701172, -14.598468780517578, -13.983210563659668, -13.367952346801758, -12.752694129943848, -12.137436866760254, -11.522178649902344, -10.906920433044434, -10.291662216186523, -9.67640495300293, -9.06114673614502, -8.445889472961426, -7.830631732940674, -7.215373516082764, -6.600115776062012, -5.984857559204102, -5.36959981918335, -4.754342079162598, -4.1390838623046875, -3.5238261222839355, -2.9085681438446045, -2.2933101654052734, -1.6780524253845215, -1.0627944469451904, -0.4475364685058594, 0.16772127151489258, 0.7829794883728027, 1.3982372283935547, 2.0134952068328857, 2.628753185272217, 3.2440109252929688, 3.8592689037323, 4.474526882171631, 5.089784622192383, 5.705042839050293, 6.320300579071045, 6.935558319091797, 7.550816535949707, 8.166074752807617, 8.781332015991211, 9.396590232849121, 10.011848449707031, 10.627105712890625, 11.242363929748535, 11.857622146606445, 12.472879409790039, 13.08813762664795, 13.70339584350586, 14.318653106689453, 14.933911323547363, 15.549169540405273, 16.164426803588867, 16.77968406677246, 17.394943237304688, 18.01020050048828, 18.625457763671875, 19.2407169342041, 19.855974197387695, 20.471233367919922, 21.086490631103516]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 19.0, 17.0, 19.0, 20.0, 23.0, 21.0, 33.0, 29.0, 43.0, 38.0, 39.0, 42.0, 47.0, 48.0, 44.0, 57.0, 49.0, 36.0, 46.0, 50.0, 34.0, 29.0, 29.0, 34.0, 28.0, 21.0, 17.0, 15.0, 18.0, 14.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.6990509033203125, -1.633453369140625, -1.5678558349609375, -1.50225830078125, -1.4366607666015625, -1.371063232421875, -1.3054656982421875, -1.2398681640625, -1.1742706298828125, -1.108673095703125, -1.0430755615234375, -0.97747802734375, -0.9118804931640625, -0.846282958984375, -0.7806854248046875, -0.715087890625, -0.6494903564453125, -0.583892822265625, -0.5182952880859375, -0.45269775390625, -0.3871002197265625, -0.321502685546875, -0.2559051513671875, -0.1903076171875, -0.1247100830078125, -0.059112548828125, 0.0064849853515625, 0.07208251953125, 0.1376800537109375, 0.203277587890625, 0.2688751220703125, 0.33447265625, 0.4000701904296875, 0.465667724609375, 0.5312652587890625, 0.59686279296875, 0.6624603271484375, 0.728057861328125, 0.7936553955078125, 0.8592529296875, 0.9248504638671875, 0.990447998046875, 1.0560455322265625, 1.12164306640625, 1.1872406005859375, 1.252838134765625, 1.3184356689453125, 1.384033203125, 1.4496307373046875, 1.515228271484375, 1.5808258056640625, 1.64642333984375, 1.7120208740234375, 1.777618408203125, 1.8432159423828125, 1.9088134765625, 1.9744110107421875, 2.040008544921875, 2.1056060791015625, 2.17120361328125, 2.2368011474609375, 2.302398681640625, 2.3679962158203125, 2.43359375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 9.0, 18.0, 22.0, 32.0, 32.0, 83.0, 110.0, 175.0, 240.0, 455.0, 601.0, 1092.0, 1709.0, 3130.0, 5302.0, 9713.0, 18598.0, 37554.0, 83641.0, 210482.0, 371410.0, 167647.0, 68728.0, 31721.0, 16166.0, 8395.0, 4635.0, 2703.0, 1528.0, 965.0, 588.0, 401.0, 201.0, 150.0, 99.0, 65.0, 57.0, 20.0, 24.0, 14.0, 15.0, 4.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6484375, -8.34375, -8.0390625, -7.734375, -7.4296875, -7.125, -6.8203125, -6.515625, -6.2109375, -5.90625, -5.6015625, -5.296875, -4.9921875, -4.6875, -4.3828125, -4.078125, -3.7734375, -3.46875, -3.1640625, -2.859375, -2.5546875, -2.25, -1.9453125, -1.640625, -1.3359375, -1.03125, -0.7265625, -0.421875, -0.1171875, 0.1875, 0.4921875, 0.796875, 1.1015625, 1.40625, 1.7109375, 2.015625, 2.3203125, 2.625, 2.9296875, 3.234375, 3.5390625, 3.84375, 4.1484375, 4.453125, 4.7578125, 5.0625, 5.3671875, 5.671875, 5.9765625, 6.28125, 6.5859375, 6.890625, 7.1953125, 7.5, 7.8046875, 8.109375, 8.4140625, 8.71875, 9.0234375, 9.328125, 9.6328125, 9.9375, 10.2421875, 10.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 7.0, 8.0, 12.0, 16.0, 19.0, 24.0, 21.0, 21.0, 30.0, 35.0, 37.0, 36.0, 49.0, 50.0, 42.0, 54.0, 1076.0, 46.0, 42.0, 52.0, 47.0, 49.0, 36.0, 37.0, 28.0, 22.0, 20.0, 17.0, 20.0, 13.0, 17.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08984375, -2.025390625, -1.9609375, -1.896484375, -1.83203125, -1.767578125, -1.703125, -1.638671875, -1.57421875, -1.509765625, -1.4453125, -1.380859375, -1.31640625, -1.251953125, -1.1875, -1.123046875, -1.05859375, -0.994140625, -0.9296875, -0.865234375, -0.80078125, -0.736328125, -0.671875, -0.607421875, -0.54296875, -0.478515625, -0.4140625, -0.349609375, -0.28515625, -0.220703125, -0.15625, -0.091796875, -0.02734375, 0.037109375, 0.1015625, 0.166015625, 0.23046875, 0.294921875, 0.359375, 0.423828125, 0.48828125, 0.552734375, 0.6171875, 0.681640625, 0.74609375, 0.810546875, 0.875, 0.939453125, 1.00390625, 1.068359375, 1.1328125, 1.197265625, 1.26171875, 1.326171875, 1.390625, 1.455078125, 1.51953125, 1.583984375, 1.6484375, 1.712890625, 1.77734375, 1.841796875, 1.90625, 1.970703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 15.0, 11.0, 39.0, 30.0, 52.0, 107.0, 154.0, 280.0, 399.0, 677.0, 1158.0, 2551.0, 5547.0, 14616.0, 52972.0, 1054775.0, 886692.0, 51394.0, 14457.0, 5503.0, 2576.0, 1287.0, 691.0, 423.0, 225.0, 169.0, 107.0, 73.0, 40.0, 27.0, 14.0, 14.0, 6.0, 9.0, 1.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.359619140625, -18.73486328125, -18.110107421875, -17.4853515625, -16.860595703125, -16.23583984375, -15.611083984375, -14.986328125, -14.361572265625, -13.73681640625, -13.112060546875, -12.4873046875, -11.862548828125, -11.23779296875, -10.613037109375, -9.98828125, -9.363525390625, -8.73876953125, -8.114013671875, -7.4892578125, -6.864501953125, -6.23974609375, -5.614990234375, -4.990234375, -4.365478515625, -3.74072265625, -3.115966796875, -2.4912109375, -1.866455078125, -1.24169921875, -0.616943359375, 0.0078125, 0.632568359375, 1.25732421875, 1.882080078125, 2.5068359375, 3.131591796875, 3.75634765625, 4.381103515625, 5.005859375, 5.630615234375, 6.25537109375, 6.880126953125, 7.5048828125, 8.129638671875, 8.75439453125, 9.379150390625, 10.00390625, 10.628662109375, 11.25341796875, 11.878173828125, 12.5029296875, 13.127685546875, 13.75244140625, 14.377197265625, 15.001953125, 15.626708984375, 16.25146484375, 16.876220703125, 17.5009765625, 18.125732421875, 18.75048828125, 19.375244140625, 20.0]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 27.0, 33.0, 66.0, 94.0, 208.0, 224.0, 114.0, 55.0, 41.0, 21.0, 15.0, 10.0, 11.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.415283203125, -4.25244140625, -4.089599609375, -3.9267578125, -3.763916015625, -3.60107421875, -3.438232421875, -3.275390625, -3.112548828125, -2.94970703125, -2.786865234375, -2.6240234375, -2.461181640625, -2.29833984375, -2.135498046875, -1.97265625, -1.809814453125, -1.64697265625, -1.484130859375, -1.3212890625, -1.158447265625, -0.99560546875, -0.832763671875, -0.669921875, -0.507080078125, -0.34423828125, -0.181396484375, -0.0185546875, 0.144287109375, 0.30712890625, 0.469970703125, 0.6328125, 0.795654296875, 0.95849609375, 1.121337890625, 1.2841796875, 1.447021484375, 1.60986328125, 1.772705078125, 1.935546875, 2.098388671875, 2.26123046875, 2.424072265625, 2.5869140625, 2.749755859375, 2.91259765625, 3.075439453125, 3.23828125, 3.401123046875, 3.56396484375, 3.726806640625, 3.8896484375, 4.052490234375, 4.21533203125, 4.378173828125, 4.541015625, 4.703857421875, 4.86669921875, 5.029541015625, 5.1923828125, 5.355224609375, 5.51806640625, 5.680908203125, 5.84375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 7.0, 8.0, 14.0, 9.0, 22.0, 37.0, 55.0, 89.0, 208.0, 703.0, 4402.0, 356710.0, 680264.0, 4748.0, 733.0, 240.0, 112.0, 57.0, 34.0, 29.0, 14.0, 14.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.8125, -84.40234375, -81.9921875, -79.58203125, -77.171875, -74.76171875, -72.3515625, -69.94140625, -67.53125, -65.12109375, -62.7109375, -60.30078125, -57.890625, -55.48046875, -53.0703125, -50.66015625, -48.25, -45.83984375, -43.4296875, -41.01953125, -38.609375, -36.19921875, -33.7890625, -31.37890625, -28.96875, -26.55859375, -24.1484375, -21.73828125, -19.328125, -16.91796875, -14.5078125, -12.09765625, -9.6875, -7.27734375, -4.8671875, -2.45703125, -0.046875, 2.36328125, 4.7734375, 7.18359375, 9.59375, 12.00390625, 14.4140625, 16.82421875, 19.234375, 21.64453125, 24.0546875, 26.46484375, 28.875, 31.28515625, 33.6953125, 36.10546875, 38.515625, 40.92578125, 43.3359375, 45.74609375, 48.15625, 50.56640625, 52.9765625, 55.38671875, 57.796875, 60.20703125, 62.6171875, 65.02734375, 67.4375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 17.0, 55.0, 133.0, 351.0, 290.0, 101.0, 35.0, 17.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.813743591308594, -8.370620727539062, -7.927497863769531, -7.484375, -7.041252613067627, -6.598129749298096, -6.1550068855285645, -5.711884498596191, -5.26876163482666, -4.825638771057129, -4.382515907287598, -3.9393932819366455, -3.4962706565856934, -3.053147792816162, -2.610024929046631, -2.1669023036956787, -1.7237792015075684, -1.2806564569473267, -0.8375336527824402, -0.3944108486175537, 0.04871189594268799, 0.4918346405029297, 0.9349575042724609, 1.378080129623413, 1.8212029933929443, 2.2643258571624756, 2.7074484825134277, 3.150571346282959, 3.5936942100524902, 4.036816596984863, 4.4799394607543945, 4.923062324523926, 5.366185188293457, 5.809308052062988, 6.2524309158325195, 6.695553779602051, 7.138676166534424, 7.581799030303955, 8.024921417236328, 8.46804428100586, 8.91116714477539, 9.354290008544922, 9.797412872314453, 10.240535736083984, 10.683658599853516, 11.126781463623047, 11.569904327392578, 12.013026237487793, 12.45615005493164, 12.899272918701172, 13.342395782470703, 13.785518646240234, 14.228641510009766, 14.671764373779297, 15.114887237548828, 15.558009147644043, 16.001131057739258, 16.44425392150879, 16.88737678527832, 17.33049964904785, 17.773622512817383, 18.216745376586914, 18.659868240356445, 19.102991104125977, 19.546113967895508]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 23.0, 21.0, 37.0, 42.0, 46.0, 58.0, 56.0, 62.0, 71.0, 71.0, 65.0, 60.0, 57.0, 61.0, 53.0, 40.0, 34.0, 23.0, 34.0, 20.0, 21.0, 15.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7889270782470703, -3.6258251667022705, -3.4627232551574707, -3.299621343612671, -3.136519432067871, -2.973417282104492, -2.8103153705596924, -2.6472134590148926, -2.4841115474700928, -2.321009635925293, -2.157907724380493, -1.9948056936264038, -1.831703782081604, -1.6686018705368042, -1.5054998397827148, -1.342397928237915, -1.1792960166931152, -1.0161941051483154, -0.8530921339988708, -0.6899901628494263, -0.5268882513046265, -0.36378633975982666, -0.20068436861038208, -0.0375823974609375, 0.1255195140838623, 0.2886214554309845, 0.4517233967781067, 0.6148253679275513, 0.7779272794723511, 0.9410291910171509, 1.1041312217712402, 1.26723313331604, 1.4303350448608398, 1.5934369564056396, 1.7565388679504395, 1.9196408987045288, 2.082742691040039, 2.245844841003418, 2.4089467525482178, 2.5720486640930176, 2.7351505756378174, 2.898252487182617, 3.061354398727417, 3.224456310272217, 3.3875584602355957, 3.5506601333618164, 3.7137622833251953, 3.876864194869995, 4.039966106414795, 4.203068256378174, 4.3661699295043945, 4.529272079467773, 4.692373752593994, 4.855475902557373, 5.018577575683594, 5.181679725646973, 5.344781875610352, 5.5078840255737305, 5.670985698699951, 5.83408784866333, 5.997189521789551, 6.16029167175293, 6.32339334487915, 6.486495494842529, 6.64959716796875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 15.0, 23.0, 33.0, 34.0, 26.0, 39.0, 43.0, 54.0, 61.0, 55.0, 54.0, 55.0, 73.0, 57.0, 49.0, 53.0, 44.0, 38.0, 35.0, 34.0, 26.0, 26.0, 15.0, 10.0, 11.0, 8.0, 5.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24273681640625, -2.1593017578125, -2.07586669921875, -1.992431640625, -1.90899658203125, -1.8255615234375, -1.74212646484375, -1.65869140625, -1.57525634765625, -1.4918212890625, -1.40838623046875, -1.324951171875, -1.24151611328125, -1.1580810546875, -1.07464599609375, -0.9912109375, -0.90777587890625, -0.8243408203125, -0.74090576171875, -0.657470703125, -0.57403564453125, -0.4906005859375, -0.40716552734375, -0.32373046875, -0.24029541015625, -0.1568603515625, -0.07342529296875, 0.010009765625, 0.09344482421875, 0.1768798828125, 0.26031494140625, 0.34375, 0.42718505859375, 0.5106201171875, 0.59405517578125, 0.677490234375, 0.76092529296875, 0.8443603515625, 0.92779541015625, 1.01123046875, 1.09466552734375, 1.1781005859375, 1.26153564453125, 1.344970703125, 1.42840576171875, 1.5118408203125, 1.59527587890625, 1.6787109375, 1.76214599609375, 1.8455810546875, 1.92901611328125, 2.012451171875, 2.09588623046875, 2.1793212890625, 2.26275634765625, 2.34619140625, 2.42962646484375, 2.5130615234375, 2.59649658203125, 2.679931640625, 2.76336669921875, 2.8468017578125, 2.93023681640625, 3.013671875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 9.0, 8.0, 13.0, 9.0, 18.0, 21.0, 43.0, 54.0, 82.0, 96.0, 154.0, 241.0, 305.0, 459.0, 737.0, 989.0, 1544.0, 2397.0, 4013.0, 6952.0, 14391.0, 58775.0, 695115.0, 214136.0, 24401.0, 9550.0, 5023.0, 3097.0, 1993.0, 1366.0, 790.0, 522.0, 348.0, 251.0, 200.0, 117.0, 87.0, 62.0, 48.0, 51.0, 22.0, 16.0, 14.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.29315185546875, -4.1488037109375, -4.00445556640625, -3.860107421875, -3.71575927734375, -3.5714111328125, -3.42706298828125, -3.28271484375, -3.13836669921875, -2.9940185546875, -2.84967041015625, -2.705322265625, -2.56097412109375, -2.4166259765625, -2.27227783203125, -2.1279296875, -1.98358154296875, -1.8392333984375, -1.69488525390625, -1.550537109375, -1.40618896484375, -1.2618408203125, -1.11749267578125, -0.97314453125, -0.82879638671875, -0.6844482421875, -0.54010009765625, -0.395751953125, -0.25140380859375, -0.1070556640625, 0.03729248046875, 0.181640625, 0.32598876953125, 0.4703369140625, 0.61468505859375, 0.759033203125, 0.90338134765625, 1.0477294921875, 1.19207763671875, 1.33642578125, 1.48077392578125, 1.6251220703125, 1.76947021484375, 1.913818359375, 2.05816650390625, 2.2025146484375, 2.34686279296875, 2.4912109375, 2.63555908203125, 2.7799072265625, 2.92425537109375, 3.068603515625, 3.21295166015625, 3.3572998046875, 3.50164794921875, 3.64599609375, 3.79034423828125, 3.9346923828125, 4.07904052734375, 4.223388671875, 4.36773681640625, 4.5120849609375, 4.65643310546875, 4.80078125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 9.0, 11.0, 11.0, 20.0, 16.0, 16.0, 33.0, 20.0, 34.0, 43.0, 30.0, 39.0, 35.0, 47.0, 46.0, 103.0, 249.0, 1549.0, 211.0, 91.0, 57.0, 43.0, 52.0, 44.0, 30.0, 28.0, 23.0, 26.0, 17.0, 10.0, 13.0, 13.0, 13.0, 12.0, 6.0, 4.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.84375, -5.6307373046875, -5.417724609375, -5.2047119140625, -4.99169921875, -4.7786865234375, -4.565673828125, -4.3526611328125, -4.1396484375, -3.9266357421875, -3.713623046875, -3.5006103515625, -3.28759765625, -3.0745849609375, -2.861572265625, -2.6485595703125, -2.435546875, -2.2225341796875, -2.009521484375, -1.7965087890625, -1.58349609375, -1.3704833984375, -1.157470703125, -0.9444580078125, -0.7314453125, -0.5184326171875, -0.305419921875, -0.0924072265625, 0.12060546875, 0.3336181640625, 0.546630859375, 0.7596435546875, 0.97265625, 1.1856689453125, 1.398681640625, 1.6116943359375, 1.82470703125, 2.0377197265625, 2.250732421875, 2.4637451171875, 2.6767578125, 2.8897705078125, 3.102783203125, 3.3157958984375, 3.52880859375, 3.7418212890625, 3.954833984375, 4.1678466796875, 4.380859375, 4.5938720703125, 4.806884765625, 5.0198974609375, 5.23291015625, 5.4459228515625, 5.658935546875, 5.8719482421875, 6.0849609375, 6.2979736328125, 6.510986328125, 6.7239990234375, 6.93701171875, 7.1500244140625, 7.363037109375, 7.5760498046875, 7.7890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 11.0, 4.0, 7.0, 10.0, 12.0, 20.0, 20.0, 26.0, 45.0, 72.0, 101.0, 159.0, 296.0, 543.0, 985.0, 1948.0, 4352.0, 12097.0, 53617.0, 2012978.0, 1000333.0, 40026.0, 10216.0, 4013.0, 1690.0, 898.0, 440.0, 264.0, 157.0, 89.0, 84.0, 46.0, 34.0, 26.0, 20.0, 14.0, 9.0, 14.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0], "bins": [-9.1953125, -8.9462890625, -8.697265625, -8.4482421875, -8.19921875, -7.9501953125, -7.701171875, -7.4521484375, -7.203125, -6.9541015625, -6.705078125, -6.4560546875, -6.20703125, -5.9580078125, -5.708984375, -5.4599609375, -5.2109375, -4.9619140625, -4.712890625, -4.4638671875, -4.21484375, -3.9658203125, -3.716796875, -3.4677734375, -3.21875, -2.9697265625, -2.720703125, -2.4716796875, -2.22265625, -1.9736328125, -1.724609375, -1.4755859375, -1.2265625, -0.9775390625, -0.728515625, -0.4794921875, -0.23046875, 0.0185546875, 0.267578125, 0.5166015625, 0.765625, 1.0146484375, 1.263671875, 1.5126953125, 1.76171875, 2.0107421875, 2.259765625, 2.5087890625, 2.7578125, 3.0068359375, 3.255859375, 3.5048828125, 3.75390625, 4.0029296875, 4.251953125, 4.5009765625, 4.75, 4.9990234375, 5.248046875, 5.4970703125, 5.74609375, 5.9951171875, 6.244140625, 6.4931640625, 6.7421875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 25.0, 156.0, 511.0, 269.0, 49.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640542030334473, -4.840981960296631, -3.041422128677368, -1.2418622970581055, 0.5576977729797363, 2.357257843017578, 4.156817436218262, 5.956377983093262, 7.755937576293945, 9.555497169494629, 11.355057716369629, 13.154617309570312, 14.954177856445312, 16.753738403320312, 18.55329704284668, 20.35285758972168, 22.152416229248047, 23.951976776123047, 25.751535415649414, 27.551095962524414, 29.350656509399414, 31.15021514892578, 32.94977569580078, 34.74933624267578, 36.54889678955078, 38.34845733642578, 40.14801788330078, 41.94757843017578, 43.747135162353516, 45.546695709228516, 47.346256256103516, 49.145816802978516, 50.945377349853516, 52.744937896728516, 54.544498443603516, 56.34405517578125, 58.14361572265625, 59.94317626953125, 61.74273681640625, 63.54229736328125, 65.34185791015625, 67.14141845703125, 68.94097900390625, 70.74053955078125, 72.54010009765625, 74.33966064453125, 76.13922119140625, 77.93878173828125, 79.73833465576172, 81.53789520263672, 83.33745574951172, 85.13701629638672, 86.93657684326172, 88.73613739013672, 90.53569030761719, 92.33525085449219, 94.13481903076172, 95.93437957763672, 97.73394012451172, 99.53350067138672, 101.33306121826172, 103.13262176513672, 104.93217468261719, 106.73173522949219, 108.53129577636719]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 9.0, 6.0, 13.0, 14.0, 19.0, 15.0, 15.0, 24.0, 42.0, 28.0, 38.0, 34.0, 35.0, 59.0, 37.0, 33.0, 38.0, 61.0, 44.0, 47.0, 48.0, 42.0, 41.0, 37.0, 28.0, 37.0, 18.0, 14.0, 17.0, 20.0, 14.0, 16.0, 10.0, 9.0, 12.0, 10.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.468992233276367, -24.713703155517578, -23.95841407775879, -23.203125, -22.447834014892578, -21.69254493713379, -20.937255859375, -20.18196678161621, -19.426677703857422, -18.671388626098633, -17.916099548339844, -17.160808563232422, -16.405519485473633, -15.650230407714844, -14.894941329956055, -14.139652252197266, -13.384361267089844, -12.629072189331055, -11.87378215789795, -11.11849308013916, -10.363203048706055, -9.607913970947266, -8.852624893188477, -8.097335815429688, -7.342045783996582, -6.586756229400635, -5.8314666748046875, -5.076177597045898, -4.320888042449951, -3.565598487854004, -2.810309410095215, -2.0550198554992676, -1.2997283935546875, -0.5444389581680298, 0.21085047721862793, 0.9661397933959961, 1.7214293479919434, 2.4767189025878906, 3.2320079803466797, 3.987297534942627, 4.742587089538574, 5.4978766441345215, 6.253166198730469, 7.008455276489258, 7.763744831085205, 8.519034385681152, 9.274323463439941, 10.029613494873047, 10.784902572631836, 11.540191650390625, 12.29548168182373, 13.05077075958252, 13.806060791015625, 14.561349868774414, 15.316638946533203, 16.071928024291992, 16.82721710205078, 17.58250617980957, 18.33779525756836, 19.09308624267578, 19.84837532043457, 20.60366439819336, 21.35895347595215, 22.114242553710938, 22.86953353881836]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 13.0, 13.0, 14.0, 19.0, 30.0, 24.0, 33.0, 40.0, 31.0, 43.0, 46.0, 59.0, 51.0, 54.0, 60.0, 42.0, 57.0, 51.0, 39.0, 35.0, 35.0, 26.0, 31.0, 39.0, 24.0, 21.0, 12.0, 10.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.016082763671875, -1.94232177734375, -1.868560791015625, -1.7947998046875, -1.721038818359375, -1.64727783203125, -1.573516845703125, -1.499755859375, -1.425994873046875, -1.35223388671875, -1.278472900390625, -1.2047119140625, -1.130950927734375, -1.05718994140625, -0.983428955078125, -0.90966796875, -0.835906982421875, -0.76214599609375, -0.688385009765625, -0.6146240234375, -0.540863037109375, -0.46710205078125, -0.393341064453125, -0.319580078125, -0.245819091796875, -0.17205810546875, -0.098297119140625, -0.0245361328125, 0.049224853515625, 0.12298583984375, 0.196746826171875, 0.2705078125, 0.344268798828125, 0.41802978515625, 0.491790771484375, 0.5655517578125, 0.639312744140625, 0.71307373046875, 0.786834716796875, 0.860595703125, 0.934356689453125, 1.00811767578125, 1.081878662109375, 1.1556396484375, 1.229400634765625, 1.30316162109375, 1.376922607421875, 1.45068359375, 1.524444580078125, 1.59820556640625, 1.671966552734375, 1.7457275390625, 1.819488525390625, 1.89324951171875, 1.967010498046875, 2.040771484375, 2.114532470703125, 2.18829345703125, 2.262054443359375, 2.3358154296875, 2.409576416015625, 2.48333740234375, 2.557098388671875, 2.630859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 4.0, 6.0, 6.0, 14.0, 13.0, 26.0, 28.0, 52.0, 56.0, 86.0, 143.0, 200.0, 298.0, 446.0, 651.0, 1080.0, 1685.0, 2792.0, 4601.0, 8269.0, 15021.0, 29550.0, 65355.0, 248620.0, 2837591.0, 795599.0, 99004.0, 39165.0, 19105.0, 10193.0, 5752.0, 3350.0, 1987.0, 1249.0, 784.0, 507.0, 301.0, 227.0, 133.0, 103.0, 72.0, 56.0, 23.0, 29.0, 16.0, 5.0, 8.0, 10.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.578125, -6.38299560546875, -6.1878662109375, -5.99273681640625, -5.797607421875, -5.60247802734375, -5.4073486328125, -5.21221923828125, -5.01708984375, -4.82196044921875, -4.6268310546875, -4.43170166015625, -4.236572265625, -4.04144287109375, -3.8463134765625, -3.65118408203125, -3.4560546875, -3.26092529296875, -3.0657958984375, -2.87066650390625, -2.675537109375, -2.48040771484375, -2.2852783203125, -2.09014892578125, -1.89501953125, -1.69989013671875, -1.5047607421875, -1.30963134765625, -1.114501953125, -0.91937255859375, -0.7242431640625, -0.52911376953125, -0.333984375, -0.13885498046875, 0.0562744140625, 0.25140380859375, 0.446533203125, 0.64166259765625, 0.8367919921875, 1.03192138671875, 1.22705078125, 1.42218017578125, 1.6173095703125, 1.81243896484375, 2.007568359375, 2.20269775390625, 2.3978271484375, 2.59295654296875, 2.7880859375, 2.98321533203125, 3.1783447265625, 3.37347412109375, 3.568603515625, 3.76373291015625, 3.9588623046875, 4.15399169921875, 4.34912109375, 4.54425048828125, 4.7393798828125, 4.93450927734375, 5.129638671875, 5.32476806640625, 5.5198974609375, 5.71502685546875, 5.91015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 6.0, 6.0, 16.0, 23.0, 23.0, 50.0, 45.0, 69.0, 74.0, 104.0, 140.0, 274.0, 533.0, 824.0, 749.0, 393.0, 226.0, 143.0, 90.0, 72.0, 47.0, 32.0, 27.0, 29.0, 18.0, 12.0, 7.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.70367431640625, -4.4659423828125, -4.22821044921875, -3.990478515625, -3.75274658203125, -3.5150146484375, -3.27728271484375, -3.03955078125, -2.80181884765625, -2.5640869140625, -2.32635498046875, -2.088623046875, -1.85089111328125, -1.6131591796875, -1.37542724609375, -1.1376953125, -0.89996337890625, -0.6622314453125, -0.42449951171875, -0.186767578125, 0.05096435546875, 0.2886962890625, 0.52642822265625, 0.76416015625, 1.00189208984375, 1.2396240234375, 1.47735595703125, 1.715087890625, 1.95281982421875, 2.1905517578125, 2.42828369140625, 2.666015625, 2.90374755859375, 3.1414794921875, 3.37921142578125, 3.616943359375, 3.85467529296875, 4.0924072265625, 4.33013916015625, 4.56787109375, 4.80560302734375, 5.0433349609375, 5.28106689453125, 5.518798828125, 5.75653076171875, 5.9942626953125, 6.23199462890625, 6.4697265625, 6.70745849609375, 6.9451904296875, 7.18292236328125, 7.420654296875, 7.65838623046875, 7.8961181640625, 8.13385009765625, 8.37158203125, 8.60931396484375, 8.8470458984375, 9.08477783203125, 9.322509765625, 9.56024169921875, 9.7979736328125, 10.03570556640625, 10.2734375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 11.0, 8.0, 16.0, 23.0, 44.0, 52.0, 115.0, 190.0, 350.0, 660.0, 1311.0, 2815.0, 6283.0, 14593.0, 37653.0, 109665.0, 537679.0, 2992207.0, 350106.0, 87024.0, 30834.0, 12482.0, 5334.0, 2438.0, 1147.0, 547.0, 295.0, 158.0, 82.0, 53.0, 37.0, 32.0, 16.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.234375, -11.915771484375, -11.59716796875, -11.278564453125, -10.9599609375, -10.641357421875, -10.32275390625, -10.004150390625, -9.685546875, -9.366943359375, -9.04833984375, -8.729736328125, -8.4111328125, -8.092529296875, -7.77392578125, -7.455322265625, -7.13671875, -6.818115234375, -6.49951171875, -6.180908203125, -5.8623046875, -5.543701171875, -5.22509765625, -4.906494140625, -4.587890625, -4.269287109375, -3.95068359375, -3.632080078125, -3.3134765625, -2.994873046875, -2.67626953125, -2.357666015625, -2.0390625, -1.720458984375, -1.40185546875, -1.083251953125, -0.7646484375, -0.446044921875, -0.12744140625, 0.191162109375, 0.509765625, 0.828369140625, 1.14697265625, 1.465576171875, 1.7841796875, 2.102783203125, 2.42138671875, 2.739990234375, 3.05859375, 3.377197265625, 3.69580078125, 4.014404296875, 4.3330078125, 4.651611328125, 4.97021484375, 5.288818359375, 5.607421875, 5.926025390625, 6.24462890625, 6.563232421875, 6.8818359375, 7.200439453125, 7.51904296875, 7.837646484375, 8.15625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 16.0, 26.0, 57.0, 93.0, 156.0, 184.0, 181.0, 126.0, 63.0, 36.0, 34.0, 15.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.126312255859375, -59.4169807434082, -57.70764923095703, -55.998313903808594, -54.28898239135742, -52.57965087890625, -50.87031936645508, -49.160987854003906, -47.45165252685547, -45.7423210144043, -44.032989501953125, -42.32365417480469, -40.614322662353516, -38.904991149902344, -37.19565963745117, -35.486328125, -33.77699661254883, -32.067665100097656, -30.35833168029785, -28.64900016784668, -26.939666748046875, -25.230335235595703, -23.52100372314453, -21.81167221069336, -20.102338790893555, -18.393007278442383, -16.683673858642578, -14.974342346191406, -13.265009880065918, -11.55567741394043, -9.846345901489258, -8.13701343536377, -6.427677154541016, -4.718344688415527, -3.0090126991271973, -1.2996807098388672, 0.4096517562866211, 2.1189842224121094, 3.8283157348632812, 5.5376482009887695, 7.246980667114258, 8.956313133239746, 10.665645599365234, 12.374977111816406, 14.084309577941895, 15.793642044067383, 17.502973556518555, 19.21230697631836, 20.92163848876953, 22.630970001220703, 24.340303421020508, 26.04963493347168, 27.758968353271484, 29.468299865722656, 31.177631378173828, 32.886962890625, 34.59629821777344, 36.30562973022461, 38.01496124267578, 39.72429656982422, 41.43362808227539, 43.14295959472656, 44.852291107177734, 46.561622619628906, 48.27095413208008]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 14.0, 11.0, 15.0, 13.0, 15.0, 20.0, 22.0, 25.0, 21.0, 34.0, 28.0, 36.0, 36.0, 42.0, 36.0, 29.0, 32.0, 44.0, 31.0, 33.0, 48.0, 43.0, 33.0, 37.0, 35.0, 34.0, 29.0, 32.0, 24.0, 27.0, 20.0, 16.0, 11.0, 17.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.841964721679688, -17.242277145385742, -16.642589569091797, -16.04290199279785, -15.44321346282959, -14.843525886535645, -14.2438383102417, -13.644149780273438, -13.044462203979492, -12.444774627685547, -11.845087051391602, -11.245399475097656, -10.645710945129395, -10.04602336883545, -9.446335792541504, -8.846647262573242, -8.246960639953613, -7.647273063659668, -7.0475850105285645, -6.447897434234619, -5.848209381103516, -5.24852180480957, -4.648834228515625, -4.0491461753845215, -3.449458599090576, -2.8497707843780518, -2.2500829696655273, -1.650395393371582, -1.0507075786590576, -0.4510197639465332, 0.1486678123474121, 0.7483558654785156, 1.348043441772461, 1.9477312564849854, 2.5474190711975098, 3.147106647491455, 3.7467944622039795, 4.346482276916504, 4.946169853210449, 5.545857906341553, 6.145545482635498, 6.745233058929443, 7.344921112060547, 7.944608688354492, 8.544296264648438, 9.143983840942383, 9.743671417236328, 10.34335994720459, 10.943047523498535, 11.54273509979248, 12.142422676086426, 12.742111206054688, 13.341798782348633, 13.941486358642578, 14.541173934936523, 15.140861511230469, 15.740549087524414, 16.34023666381836, 16.939924240112305, 17.53961181640625, 18.139299392700195, 18.73898696899414, 19.33867645263672, 19.938364028930664, 20.53805160522461]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 11.0, 9.0, 12.0, 13.0, 18.0, 22.0, 35.0, 32.0, 37.0, 39.0, 37.0, 52.0, 63.0, 63.0, 65.0, 53.0, 67.0, 51.0, 40.0, 29.0, 36.0, 35.0, 26.0, 34.0, 27.0, 15.0, 19.0, 11.0, 11.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4517822265625, -2.372314453125, -2.2928466796875, -2.21337890625, -2.1339111328125, -2.054443359375, -1.9749755859375, -1.8955078125, -1.8160400390625, -1.736572265625, -1.6571044921875, -1.57763671875, -1.4981689453125, -1.418701171875, -1.3392333984375, -1.259765625, -1.1802978515625, -1.100830078125, -1.0213623046875, -0.94189453125, -0.8624267578125, -0.782958984375, -0.7034912109375, -0.6240234375, -0.5445556640625, -0.465087890625, -0.3856201171875, -0.30615234375, -0.2266845703125, -0.147216796875, -0.0677490234375, 0.01171875, 0.0911865234375, 0.170654296875, 0.2501220703125, 0.32958984375, 0.4090576171875, 0.488525390625, 0.5679931640625, 0.6474609375, 0.7269287109375, 0.806396484375, 0.8858642578125, 0.96533203125, 1.0447998046875, 1.124267578125, 1.2037353515625, 1.283203125, 1.3626708984375, 1.442138671875, 1.5216064453125, 1.60107421875, 1.6805419921875, 1.760009765625, 1.8394775390625, 1.9189453125, 1.9984130859375, 2.077880859375, 2.1573486328125, 2.23681640625, 2.3162841796875, 2.395751953125, 2.4752197265625, 2.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 4.0, 14.0, 15.0, 31.0, 68.0, 69.0, 127.0, 213.0, 319.0, 507.0, 739.0, 1129.0, 1780.0, 2924.0, 4516.0, 7082.0, 11398.0, 18787.0, 34332.0, 68378.0, 162734.0, 415208.0, 164195.0, 69390.0, 34629.0, 19337.0, 11371.0, 6928.0, 4424.0, 2803.0, 1776.0, 1161.0, 754.0, 521.0, 326.0, 194.0, 136.0, 84.0, 56.0, 28.0, 16.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5762939453125, -10.269775390625, -9.9632568359375, -9.65673828125, -9.3502197265625, -9.043701171875, -8.7371826171875, -8.4306640625, -8.1241455078125, -7.817626953125, -7.5111083984375, -7.20458984375, -6.8980712890625, -6.591552734375, -6.2850341796875, -5.978515625, -5.6719970703125, -5.365478515625, -5.0589599609375, -4.75244140625, -4.4459228515625, -4.139404296875, -3.8328857421875, -3.5263671875, -3.2198486328125, -2.913330078125, -2.6068115234375, -2.30029296875, -1.9937744140625, -1.687255859375, -1.3807373046875, -1.07421875, -0.7677001953125, -0.461181640625, -0.1546630859375, 0.15185546875, 0.4583740234375, 0.764892578125, 1.0714111328125, 1.3779296875, 1.6844482421875, 1.990966796875, 2.2974853515625, 2.60400390625, 2.9105224609375, 3.217041015625, 3.5235595703125, 3.830078125, 4.1365966796875, 4.443115234375, 4.7496337890625, 5.05615234375, 5.3626708984375, 5.669189453125, 5.9757080078125, 6.2822265625, 6.5887451171875, 6.895263671875, 7.2017822265625, 7.50830078125, 7.8148193359375, 8.121337890625, 8.4278564453125, 8.734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 15.0, 20.0, 14.0, 15.0, 23.0, 21.0, 34.0, 37.0, 39.0, 39.0, 53.0, 46.0, 43.0, 59.0, 1061.0, 47.0, 43.0, 38.0, 34.0, 32.0, 33.0, 33.0, 27.0, 27.0, 27.0, 17.0, 22.0, 15.0, 14.0, 11.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.45703125, -2.3908233642578125, -2.324615478515625, -2.2584075927734375, -2.19219970703125, -2.1259918212890625, -2.059783935546875, -1.9935760498046875, -1.9273681640625, -1.8611602783203125, -1.794952392578125, -1.7287445068359375, -1.66253662109375, -1.5963287353515625, -1.530120849609375, -1.4639129638671875, -1.397705078125, -1.3314971923828125, -1.265289306640625, -1.1990814208984375, -1.13287353515625, -1.0666656494140625, -1.000457763671875, -0.9342498779296875, -0.8680419921875, -0.8018341064453125, -0.735626220703125, -0.6694183349609375, -0.60321044921875, -0.5370025634765625, -0.470794677734375, -0.4045867919921875, -0.33837890625, -0.2721710205078125, -0.205963134765625, -0.1397552490234375, -0.07354736328125, -0.0073394775390625, 0.058868408203125, 0.1250762939453125, 0.1912841796875, 0.2574920654296875, 0.323699951171875, 0.3899078369140625, 0.45611572265625, 0.5223236083984375, 0.588531494140625, 0.6547393798828125, 0.720947265625, 0.7871551513671875, 0.853363037109375, 0.9195709228515625, 0.98577880859375, 1.0519866943359375, 1.118194580078125, 1.1844024658203125, 1.2506103515625, 1.3168182373046875, 1.383026123046875, 1.4492340087890625, 1.51544189453125, 1.5816497802734375, 1.647857666015625, 1.7140655517578125, 1.7802734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 0.0, 10.0, 3.0, 6.0, 20.0, 30.0, 33.0, 57.0, 68.0, 103.0, 186.0, 275.0, 439.0, 763.0, 1424.0, 3173.0, 8534.0, 26684.0, 132851.0, 1727473.0, 150553.0, 28509.0, 8945.0, 3449.0, 1479.0, 801.0, 422.0, 271.0, 175.0, 127.0, 107.0, 54.0, 35.0, 13.0, 12.0, 13.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.5625, -18.921630859375, -18.28076171875, -17.639892578125, -16.9990234375, -16.358154296875, -15.71728515625, -15.076416015625, -14.435546875, -13.794677734375, -13.15380859375, -12.512939453125, -11.8720703125, -11.231201171875, -10.59033203125, -9.949462890625, -9.30859375, -8.667724609375, -8.02685546875, -7.385986328125, -6.7451171875, -6.104248046875, -5.46337890625, -4.822509765625, -4.181640625, -3.540771484375, -2.89990234375, -2.259033203125, -1.6181640625, -0.977294921875, -0.33642578125, 0.304443359375, 0.9453125, 1.586181640625, 2.22705078125, 2.867919921875, 3.5087890625, 4.149658203125, 4.79052734375, 5.431396484375, 6.072265625, 6.713134765625, 7.35400390625, 7.994873046875, 8.6357421875, 9.276611328125, 9.91748046875, 10.558349609375, 11.19921875, 11.840087890625, 12.48095703125, 13.121826171875, 13.7626953125, 14.403564453125, 15.04443359375, 15.685302734375, 16.326171875, 16.967041015625, 17.60791015625, 18.248779296875, 18.8896484375, 19.530517578125, 20.17138671875, 20.812255859375, 21.453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 19.0, 26.0, 71.0, 109.0, 287.0, 235.0, 103.0, 50.0, 26.0, 16.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.453125, -5.2578125, -5.0625, -4.8671875, -4.671875, -4.4765625, -4.28125, -4.0859375, -3.890625, -3.6953125, -3.5, -3.3046875, -3.109375, -2.9140625, -2.71875, -2.5234375, -2.328125, -2.1328125, -1.9375, -1.7421875, -1.546875, -1.3515625, -1.15625, -0.9609375, -0.765625, -0.5703125, -0.375, -0.1796875, 0.015625, 0.2109375, 0.40625, 0.6015625, 0.796875, 0.9921875, 1.1875, 1.3828125, 1.578125, 1.7734375, 1.96875, 2.1640625, 2.359375, 2.5546875, 2.75, 2.9453125, 3.140625, 3.3359375, 3.53125, 3.7265625, 3.921875, 4.1171875, 4.3125, 4.5078125, 4.703125, 4.8984375, 5.09375, 5.2890625, 5.484375, 5.6796875, 5.875, 6.0703125, 6.265625, 6.4609375, 6.65625, 6.8515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 32.0, 52.0, 113.0, 382.0, 1554.0, 20360.0, 1017587.0, 7015.0, 992.0, 237.0, 99.0, 41.0, 12.0, 10.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.625, -102.63671875, -99.6484375, -96.66015625, -93.671875, -90.68359375, -87.6953125, -84.70703125, -81.71875, -78.73046875, -75.7421875, -72.75390625, -69.765625, -66.77734375, -63.7890625, -60.80078125, -57.8125, -54.82421875, -51.8359375, -48.84765625, -45.859375, -42.87109375, -39.8828125, -36.89453125, -33.90625, -30.91796875, -27.9296875, -24.94140625, -21.953125, -18.96484375, -15.9765625, -12.98828125, -10.0, -7.01171875, -4.0234375, -1.03515625, 1.953125, 4.94140625, 7.9296875, 10.91796875, 13.90625, 16.89453125, 19.8828125, 22.87109375, 25.859375, 28.84765625, 31.8359375, 34.82421875, 37.8125, 40.80078125, 43.7890625, 46.77734375, 49.765625, 52.75390625, 55.7421875, 58.73046875, 61.71875, 64.70703125, 67.6953125, 70.68359375, 73.671875, 76.66015625, 79.6484375, 82.63671875, 85.625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 12.0, 11.0, 20.0, 45.0, 59.0, 143.0, 272.0, 235.0, 99.0, 58.0, 25.0, 15.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.849494934082031, -11.527217864990234, -11.204939842224121, -10.882662773132324, -10.560384750366211, -10.238107681274414, -9.9158296585083, -9.593552589416504, -9.27127456665039, -8.948997497558594, -8.62671947479248, -8.304442405700684, -7.98216438293457, -7.659886837005615, -7.33760929107666, -7.015332221984863, -6.693054676055908, -6.370777130126953, -6.048499584197998, -5.726222038269043, -5.403944492340088, -5.081666946411133, -4.759389877319336, -4.437111854553223, -4.114834785461426, -3.7925572395324707, -3.4702796936035156, -3.1480021476745605, -2.8257246017456055, -2.5034470558166504, -2.1811697483062744, -1.8588922023773193, -1.5366144180297852, -1.21433687210083, -0.8920593857765198, -0.5697818994522095, -0.2475043535232544, 0.07477319240570068, 0.3970506191253662, 0.7193281650543213, 1.0416057109832764, 1.3638832569122314, 1.6861608028411865, 2.0084381103515625, 2.3307156562805176, 2.6529932022094727, 2.9752707481384277, 3.297548294067383, 3.619825839996338, 3.942103385925293, 4.264380931854248, 4.586658477783203, 4.908936023712158, 5.231213569641113, 5.55349063873291, 5.875768661499023, 6.19804573059082, 6.520323276519775, 6.8426008224487305, 7.1648783683776855, 7.487155914306641, 7.809433460235596, 8.13171100616455, 8.453988075256348, 8.776266098022461]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 15.0, 11.0, 18.0, 17.0, 34.0, 31.0, 34.0, 44.0, 45.0, 38.0, 49.0, 38.0, 55.0, 58.0, 57.0, 47.0, 48.0, 57.0, 58.0, 32.0, 29.0, 36.0, 38.0, 20.0, 15.0, 12.0, 10.0, 6.0, 3.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3224947452545166, -3.1939871311187744, -3.0654797554016113, -2.936972141265869, -2.808464527130127, -2.6799569129943848, -2.5514495372772217, -2.4229419231414795, -2.2944345474243164, -2.165926933288574, -2.037419557571411, -1.908911943435669, -1.7804043292999268, -1.6518968343734741, -1.5233893394470215, -1.3948817253112793, -1.266374111175537, -1.1378666162490845, -1.0093590021133423, -0.8808515071868896, -0.7523439526557922, -0.6238363981246948, -0.4953289031982422, -0.3668213486671448, -0.23831379413604736, -0.10980625450611115, 0.018701285123825073, 0.1472088098526001, 0.2757163643836975, 0.4042239189147949, 0.5327314138412476, 0.661238968372345, 0.7897462844848633, 0.9182538390159607, 1.046761393547058, 1.1752688884735107, 1.303776502609253, 1.4322839975357056, 1.5607914924621582, 1.6892991065979004, 1.817806601524353, 1.9463140964508057, 2.074821710586548, 2.203329086303711, 2.331836700439453, 2.4603443145751953, 2.5888519287109375, 2.7173593044281006, 2.8458669185638428, 2.974374532699585, 3.102881908416748, 3.2313895225524902, 3.3598971366882324, 3.4884047508239746, 3.6169121265411377, 3.74541974067688, 3.873927116394043, 4.002434730529785, 4.130942344665527, 4.2594499588012695, 4.3879570960998535, 4.516464710235596, 4.644972324371338, 4.77347993850708, 4.901987552642822]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 13.0, 10.0, 12.0, 11.0, 17.0, 27.0, 30.0, 37.0, 46.0, 47.0, 48.0, 65.0, 67.0, 51.0, 64.0, 43.0, 66.0, 53.0, 45.0, 35.0, 32.0, 30.0, 32.0, 28.0, 18.0, 21.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.534454345703125, -2.44781494140625, -2.361175537109375, -2.2745361328125, -2.187896728515625, -2.10125732421875, -2.014617919921875, -1.927978515625, -1.841339111328125, -1.75469970703125, -1.668060302734375, -1.5814208984375, -1.494781494140625, -1.40814208984375, -1.321502685546875, -1.23486328125, -1.148223876953125, -1.06158447265625, -0.974945068359375, -0.8883056640625, -0.801666259765625, -0.71502685546875, -0.628387451171875, -0.541748046875, -0.455108642578125, -0.36846923828125, -0.281829833984375, -0.1951904296875, -0.108551025390625, -0.02191162109375, 0.064727783203125, 0.1513671875, 0.238006591796875, 0.32464599609375, 0.411285400390625, 0.4979248046875, 0.584564208984375, 0.67120361328125, 0.757843017578125, 0.844482421875, 0.931121826171875, 1.01776123046875, 1.104400634765625, 1.1910400390625, 1.277679443359375, 1.36431884765625, 1.450958251953125, 1.53759765625, 1.624237060546875, 1.71087646484375, 1.797515869140625, 1.8841552734375, 1.970794677734375, 2.05743408203125, 2.144073486328125, 2.230712890625, 2.317352294921875, 2.40399169921875, 2.490631103515625, 2.5772705078125, 2.663909912109375, 2.75054931640625, 2.837188720703125, 2.923828125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 16.0, 10.0, 31.0, 31.0, 59.0, 106.0, 153.0, 225.0, 343.0, 578.0, 930.0, 1463.0, 2509.0, 4232.0, 7539.0, 14357.0, 31507.0, 102764.0, 662201.0, 144565.0, 38060.0, 16737.0, 8533.0, 4773.0, 2604.0, 1580.0, 966.0, 596.0, 403.0, 245.0, 150.0, 91.0, 82.0, 35.0, 27.0, 20.0, 12.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.58154296875, -4.4365234375, -4.29150390625, -4.146484375, -4.00146484375, -3.8564453125, -3.71142578125, -3.56640625, -3.42138671875, -3.2763671875, -3.13134765625, -2.986328125, -2.84130859375, -2.6962890625, -2.55126953125, -2.40625, -2.26123046875, -2.1162109375, -1.97119140625, -1.826171875, -1.68115234375, -1.5361328125, -1.39111328125, -1.24609375, -1.10107421875, -0.9560546875, -0.81103515625, -0.666015625, -0.52099609375, -0.3759765625, -0.23095703125, -0.0859375, 0.05908203125, 0.2041015625, 0.34912109375, 0.494140625, 0.63916015625, 0.7841796875, 0.92919921875, 1.07421875, 1.21923828125, 1.3642578125, 1.50927734375, 1.654296875, 1.79931640625, 1.9443359375, 2.08935546875, 2.234375, 2.37939453125, 2.5244140625, 2.66943359375, 2.814453125, 2.95947265625, 3.1044921875, 3.24951171875, 3.39453125, 3.53955078125, 3.6845703125, 3.82958984375, 3.974609375, 4.11962890625, 4.2646484375, 4.40966796875, 4.5546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 6.0, 14.0, 13.0, 16.0, 26.0, 17.0, 27.0, 27.0, 36.0, 30.0, 39.0, 38.0, 63.0, 81.0, 124.0, 283.0, 1510.0, 157.0, 92.0, 82.0, 50.0, 34.0, 38.0, 39.0, 24.0, 27.0, 23.0, 14.0, 17.0, 12.0, 13.0, 7.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.37890625, -7.1424560546875, -6.906005859375, -6.6695556640625, -6.43310546875, -6.1966552734375, -5.960205078125, -5.7237548828125, -5.4873046875, -5.2508544921875, -5.014404296875, -4.7779541015625, -4.54150390625, -4.3050537109375, -4.068603515625, -3.8321533203125, -3.595703125, -3.3592529296875, -3.122802734375, -2.8863525390625, -2.64990234375, -2.4134521484375, -2.177001953125, -1.9405517578125, -1.7041015625, -1.4676513671875, -1.231201171875, -0.9947509765625, -0.75830078125, -0.5218505859375, -0.285400390625, -0.0489501953125, 0.1875, 0.4239501953125, 0.660400390625, 0.8968505859375, 1.13330078125, 1.3697509765625, 1.606201171875, 1.8426513671875, 2.0791015625, 2.3155517578125, 2.552001953125, 2.7884521484375, 3.02490234375, 3.2613525390625, 3.497802734375, 3.7342529296875, 3.970703125, 4.2071533203125, 4.443603515625, 4.6800537109375, 4.91650390625, 5.1529541015625, 5.389404296875, 5.6258544921875, 5.8623046875, 6.0987548828125, 6.335205078125, 6.5716552734375, 6.80810546875, 7.0445556640625, 7.281005859375, 7.5174560546875, 7.75390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 9.0, 15.0, 19.0, 24.0, 42.0, 50.0, 90.0, 186.0, 425.0, 1079.0, 3521.0, 17145.0, 231829.0, 2807588.0, 71138.0, 8981.0, 2133.0, 731.0, 310.0, 134.0, 68.0, 44.0, 38.0, 24.0, 20.0, 8.0, 8.0, 9.0, 6.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1787109375, -14.708984375, -14.2392578125, -13.76953125, -13.2998046875, -12.830078125, -12.3603515625, -11.890625, -11.4208984375, -10.951171875, -10.4814453125, -10.01171875, -9.5419921875, -9.072265625, -8.6025390625, -8.1328125, -7.6630859375, -7.193359375, -6.7236328125, -6.25390625, -5.7841796875, -5.314453125, -4.8447265625, -4.375, -3.9052734375, -3.435546875, -2.9658203125, -2.49609375, -2.0263671875, -1.556640625, -1.0869140625, -0.6171875, -0.1474609375, 0.322265625, 0.7919921875, 1.26171875, 1.7314453125, 2.201171875, 2.6708984375, 3.140625, 3.6103515625, 4.080078125, 4.5498046875, 5.01953125, 5.4892578125, 5.958984375, 6.4287109375, 6.8984375, 7.3681640625, 7.837890625, 8.3076171875, 8.77734375, 9.2470703125, 9.716796875, 10.1865234375, 10.65625, 11.1259765625, 11.595703125, 12.0654296875, 12.53515625, 13.0048828125, 13.474609375, 13.9443359375, 14.4140625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 28.0, 102.0, 205.0, 336.0, 230.0, 79.0, 19.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.266178131103516, -27.768829345703125, -26.271480560302734, -24.774133682250977, -23.276784896850586, -21.779436111450195, -20.282089233398438, -18.784740447998047, -17.287391662597656, -15.790042877197266, -14.292695045471191, -12.795347213745117, -11.297998428344727, -9.800649642944336, -8.303301811218262, -6.8059539794921875, -5.308605194091797, -3.8112568855285645, -2.313908576965332, -0.8165602684020996, 0.6807880401611328, 2.1781363487243652, 3.6754846572875977, 5.172832489013672, 6.6701812744140625, 8.167530059814453, 9.664877891540527, 11.162225723266602, 12.659574508666992, 14.156923294067383, 15.654271125793457, 17.15161895751953, 18.648971557617188, 20.146320343017578, 21.64366912841797, 23.141016006469727, 24.638364791870117, 26.135713577270508, 27.633060455322266, 29.130409240722656, 30.627758026123047, 32.12510681152344, 33.62245559692383, 35.11980438232422, 36.617149353027344, 38.114498138427734, 39.611846923828125, 41.109195709228516, 42.606544494628906, 44.1038932800293, 45.60124206542969, 47.09859085083008, 48.59593963623047, 50.093284606933594, 51.590633392333984, 53.087982177734375, 54.585330963134766, 56.082679748535156, 57.58002853393555, 59.07737731933594, 60.57472229003906, 62.07207107543945, 63.569419860839844, 65.0667724609375, 66.56411743164062]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 8.0, 4.0, 7.0, 12.0, 18.0, 17.0, 18.0, 22.0, 22.0, 36.0, 26.0, 38.0, 43.0, 42.0, 37.0, 41.0, 43.0, 56.0, 60.0, 47.0, 41.0, 35.0, 51.0, 49.0, 29.0, 34.0, 30.0, 25.0, 23.0, 21.0, 13.0, 18.0, 6.0, 4.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.179262161254883, -21.414167404174805, -20.649070739746094, -19.883975982666016, -19.118881225585938, -18.35378646850586, -17.58868980407715, -16.82359504699707, -16.05849838256836, -15.293402671813965, -14.528307914733887, -13.763212203979492, -12.998117446899414, -12.23302173614502, -11.467926025390625, -10.702831268310547, -9.937736511230469, -9.172640800476074, -8.407546043395996, -7.642450332641602, -6.877355098724365, -6.112259864807129, -5.347164154052734, -4.582068920135498, -3.8169736862182617, -3.0518784523010254, -2.28678297996521, -1.5216875076293945, -0.7565922737121582, 0.008502960205078125, 0.7735986709594727, 1.538693904876709, 2.3037891387939453, 3.0688843727111816, 3.833979845046997, 4.5990753173828125, 5.364170551300049, 6.129265785217285, 6.89436149597168, 7.659456729888916, 8.424551963806152, 9.189647674560547, 9.954742431640625, 10.71983814239502, 11.484933853149414, 12.250028610229492, 13.015124320983887, 13.780220031738281, 14.54531478881836, 15.310410499572754, 16.07550621032715, 16.840600967407227, 17.605695724487305, 18.370792388916016, 19.135887145996094, 19.900981903076172, 20.66607666015625, 21.431171417236328, 22.19626808166504, 22.961362838745117, 23.726457595825195, 24.491554260253906, 25.256649017333984, 26.021743774414062, 26.786840438842773]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 15.0, 12.0, 18.0, 27.0, 34.0, 35.0, 49.0, 53.0, 45.0, 64.0, 62.0, 51.0, 37.0, 76.0, 48.0, 44.0, 49.0, 37.0, 35.0, 27.0, 34.0, 20.0, 21.0, 24.0, 11.0, 11.0, 5.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.248016357421875, -2.16204833984375, -2.076080322265625, -1.9901123046875, -1.904144287109375, -1.81817626953125, -1.732208251953125, -1.646240234375, -1.560272216796875, -1.47430419921875, -1.388336181640625, -1.3023681640625, -1.216400146484375, -1.13043212890625, -1.044464111328125, -0.95849609375, -0.872528076171875, -0.78656005859375, -0.700592041015625, -0.6146240234375, -0.528656005859375, -0.44268798828125, -0.356719970703125, -0.270751953125, -0.184783935546875, -0.09881591796875, -0.012847900390625, 0.0731201171875, 0.159088134765625, 0.24505615234375, 0.331024169921875, 0.4169921875, 0.502960205078125, 0.58892822265625, 0.674896240234375, 0.7608642578125, 0.846832275390625, 0.93280029296875, 1.018768310546875, 1.104736328125, 1.190704345703125, 1.27667236328125, 1.362640380859375, 1.4486083984375, 1.534576416015625, 1.62054443359375, 1.706512451171875, 1.79248046875, 1.878448486328125, 1.96441650390625, 2.050384521484375, 2.1363525390625, 2.222320556640625, 2.30828857421875, 2.394256591796875, 2.480224609375, 2.566192626953125, 2.65216064453125, 2.738128662109375, 2.8240966796875, 2.910064697265625, 2.99603271484375, 3.082000732421875, 3.16796875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 11.0, 17.0, 17.0, 37.0, 53.0, 82.0, 124.0, 190.0, 289.0, 456.0, 689.0, 1075.0, 1680.0, 2800.0, 4438.0, 7328.0, 12669.0, 22339.0, 42740.0, 98970.0, 535661.0, 2602756.0, 648047.0, 108012.0, 44733.0, 23310.0, 13796.0, 8214.0, 4903.0, 3168.0, 2009.0, 1282.0, 776.0, 531.0, 351.0, 221.0, 158.0, 121.0, 58.0, 45.0, 32.0, 29.0, 13.0, 13.0, 13.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.27734375, -4.1220703125, -3.966796875, -3.8115234375, -3.65625, -3.5009765625, -3.345703125, -3.1904296875, -3.03515625, -2.8798828125, -2.724609375, -2.5693359375, -2.4140625, -2.2587890625, -2.103515625, -1.9482421875, -1.79296875, -1.6376953125, -1.482421875, -1.3271484375, -1.171875, -1.0166015625, -0.861328125, -0.7060546875, -0.55078125, -0.3955078125, -0.240234375, -0.0849609375, 0.0703125, 0.2255859375, 0.380859375, 0.5361328125, 0.69140625, 0.8466796875, 1.001953125, 1.1572265625, 1.3125, 1.4677734375, 1.623046875, 1.7783203125, 1.93359375, 2.0888671875, 2.244140625, 2.3994140625, 2.5546875, 2.7099609375, 2.865234375, 3.0205078125, 3.17578125, 3.3310546875, 3.486328125, 3.6416015625, 3.796875, 3.9521484375, 4.107421875, 4.2626953125, 4.41796875, 4.5732421875, 4.728515625, 4.8837890625, 5.0390625, 5.1943359375, 5.349609375, 5.5048828125, 5.66015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 16.0, 17.0, 14.0, 24.0, 35.0, 41.0, 48.0, 66.0, 78.0, 121.0, 173.0, 325.0, 501.0, 687.0, 589.0, 434.0, 211.0, 161.0, 104.0, 88.0, 71.0, 46.0, 46.0, 35.0, 25.0, 23.0, 10.0, 15.0, 11.0, 5.0, 6.0, 8.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.629150390625, -5.42626953125, -5.223388671875, -5.0205078125, -4.817626953125, -4.61474609375, -4.411865234375, -4.208984375, -4.006103515625, -3.80322265625, -3.600341796875, -3.3974609375, -3.194580078125, -2.99169921875, -2.788818359375, -2.5859375, -2.383056640625, -2.18017578125, -1.977294921875, -1.7744140625, -1.571533203125, -1.36865234375, -1.165771484375, -0.962890625, -0.760009765625, -0.55712890625, -0.354248046875, -0.1513671875, 0.051513671875, 0.25439453125, 0.457275390625, 0.66015625, 0.863037109375, 1.06591796875, 1.268798828125, 1.4716796875, 1.674560546875, 1.87744140625, 2.080322265625, 2.283203125, 2.486083984375, 2.68896484375, 2.891845703125, 3.0947265625, 3.297607421875, 3.50048828125, 3.703369140625, 3.90625, 4.109130859375, 4.31201171875, 4.514892578125, 4.7177734375, 4.920654296875, 5.12353515625, 5.326416015625, 5.529296875, 5.732177734375, 5.93505859375, 6.137939453125, 6.3408203125, 6.543701171875, 6.74658203125, 6.949462890625, 7.15234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 13.0, 11.0, 20.0, 46.0, 67.0, 77.0, 125.0, 224.0, 319.0, 571.0, 922.0, 1672.0, 2929.0, 5010.0, 9760.0, 18857.0, 40894.0, 96712.0, 311018.0, 2355993.0, 1037543.0, 182851.0, 67346.0, 29606.0, 14601.0, 7406.0, 4163.0, 2253.0, 1276.0, 784.0, 471.0, 287.0, 154.0, 109.0, 66.0, 41.0, 34.0, 18.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.453125, -7.21875, -6.984375, -6.75, -6.515625, -6.28125, -6.046875, -5.8125, -5.578125, -5.34375, -5.109375, -4.875, -4.640625, -4.40625, -4.171875, -3.9375, -3.703125, -3.46875, -3.234375, -3.0, -2.765625, -2.53125, -2.296875, -2.0625, -1.828125, -1.59375, -1.359375, -1.125, -0.890625, -0.65625, -0.421875, -0.1875, 0.046875, 0.28125, 0.515625, 0.75, 0.984375, 1.21875, 1.453125, 1.6875, 1.921875, 2.15625, 2.390625, 2.625, 2.859375, 3.09375, 3.328125, 3.5625, 3.796875, 4.03125, 4.265625, 4.5, 4.734375, 4.96875, 5.203125, 5.4375, 5.671875, 5.90625, 6.140625, 6.375, 6.609375, 6.84375, 7.078125, 7.3125, 7.546875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 10.0, 8.0, 32.0, 55.0, 127.0, 185.0, 248.0, 165.0, 102.0, 41.0, 19.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3114242553711, -92.07685089111328, -89.84226989746094, -87.60769653320312, -85.37312316894531, -83.1385498046875, -80.90396881103516, -78.66939544677734, -76.434814453125, -74.20024108886719, -71.96566009521484, -69.73108673095703, -67.49651336669922, -65.26193237304688, -63.02735900878906, -60.79278564453125, -58.55821228027344, -56.32363510131836, -54.08906173706055, -51.85448455810547, -49.619911193847656, -47.38533401489258, -45.1507568359375, -42.91618347167969, -40.68160629272461, -38.44702911376953, -36.21245574951172, -33.97787857055664, -31.743303298950195, -29.50872802734375, -27.274150848388672, -25.039575576782227, -22.804996490478516, -20.57042121887207, -18.335845947265625, -16.101268768310547, -13.866693496704102, -11.632118225097656, -9.397541999816895, -7.162965774536133, -4.9283905029296875, -2.693814754486084, -0.45923900604248047, 1.775336742401123, 4.009912490844727, 6.244487762451172, 8.479063987731934, 10.713640213012695, 12.94821548461914, 15.182790756225586, 17.41736602783203, 19.65194320678711, 21.886518478393555, 24.12109375, 26.355670928955078, 28.590246200561523, 30.82482147216797, 33.05939865112305, 35.29397201538086, 37.52854919433594, 39.76312255859375, 41.99769973754883, 44.232276916503906, 46.46685028076172, 48.7014274597168]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 7.0, 10.0, 21.0, 18.0, 23.0, 22.0, 26.0, 29.0, 30.0, 27.0, 28.0, 35.0, 36.0, 40.0, 28.0, 36.0, 39.0, 47.0, 50.0, 42.0, 40.0, 32.0, 35.0, 31.0, 35.0, 30.0, 38.0, 24.0, 18.0, 20.0, 26.0, 16.0, 8.0, 10.0, 10.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03443717956543, -20.38628578186035, -19.738136291503906, -19.089984893798828, -18.441835403442383, -17.793684005737305, -17.14553451538086, -16.49738311767578, -15.849231719970703, -15.201081275939941, -14.55293083190918, -13.904779434204102, -13.25662899017334, -12.608478546142578, -11.960328102111816, -11.312177658081055, -10.664027214050293, -10.015876770019531, -9.36772632598877, -8.719575881958008, -8.07142448425293, -7.423274040222168, -6.775123596191406, -6.126972675323486, -5.478822231292725, -4.830671787261963, -4.182520866394043, -3.5343704223632812, -2.8862197399139404, -2.2380690574645996, -1.589918613433838, -0.941767692565918, -0.29361724853515625, 0.3545333743095398, 1.0026839971542358, 1.650834560394287, 2.298985242843628, 2.9471359252929688, 3.5952863693237305, 4.24343729019165, 4.891587734222412, 5.539738178253174, 6.187889099121094, 6.8360395431518555, 7.484189987182617, 8.132341384887695, 8.78049087524414, 9.428642272949219, 10.07679271697998, 10.724943161010742, 11.373093605041504, 12.021244049072266, 12.669395446777344, 13.317545890808105, 13.965696334838867, 14.613847732543945, 15.26199722290039, 15.910147666931152, 16.558298110961914, 17.206449508666992, 17.854598999023438, 18.502750396728516, 19.150901794433594, 19.79905128479004, 20.447202682495117]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 13.0, 6.0, 13.0, 17.0, 13.0, 20.0, 20.0, 20.0, 40.0, 43.0, 36.0, 48.0, 58.0, 51.0, 55.0, 44.0, 53.0, 54.0, 47.0, 59.0, 39.0, 38.0, 23.0, 31.0, 22.0, 19.0, 21.0, 22.0, 23.0, 15.0, 10.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.123443603515625, -2.04180908203125, -1.960174560546875, -1.8785400390625, -1.796905517578125, -1.71527099609375, -1.633636474609375, -1.552001953125, -1.470367431640625, -1.38873291015625, -1.307098388671875, -1.2254638671875, -1.143829345703125, -1.06219482421875, -0.980560302734375, -0.89892578125, -0.817291259765625, -0.73565673828125, -0.654022216796875, -0.5723876953125, -0.490753173828125, -0.40911865234375, -0.327484130859375, -0.245849609375, -0.164215087890625, -0.08258056640625, -0.000946044921875, 0.0806884765625, 0.162322998046875, 0.24395751953125, 0.325592041015625, 0.4072265625, 0.488861083984375, 0.57049560546875, 0.652130126953125, 0.7337646484375, 0.815399169921875, 0.89703369140625, 0.978668212890625, 1.060302734375, 1.141937255859375, 1.22357177734375, 1.305206298828125, 1.3868408203125, 1.468475341796875, 1.55010986328125, 1.631744384765625, 1.71337890625, 1.795013427734375, 1.87664794921875, 1.958282470703125, 2.0399169921875, 2.121551513671875, 2.20318603515625, 2.284820556640625, 2.366455078125, 2.448089599609375, 2.52972412109375, 2.611358642578125, 2.6929931640625, 2.774627685546875, 2.85626220703125, 2.937896728515625, 3.01953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 9.0, 16.0, 37.0, 31.0, 55.0, 72.0, 129.0, 147.0, 192.0, 322.0, 492.0, 806.0, 1150.0, 1944.0, 3118.0, 5366.0, 9822.0, 20704.0, 55785.0, 376680.0, 463896.0, 60640.0, 22340.0, 10489.0, 5499.0, 3235.0, 1901.0, 1209.0, 747.0, 532.0, 342.0, 269.0, 175.0, 123.0, 73.0, 69.0, 29.0, 25.0, 21.0, 20.0, 13.0, 7.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.640625, -13.1865234375, -12.732421875, -12.2783203125, -11.82421875, -11.3701171875, -10.916015625, -10.4619140625, -10.0078125, -9.5537109375, -9.099609375, -8.6455078125, -8.19140625, -7.7373046875, -7.283203125, -6.8291015625, -6.375, -5.9208984375, -5.466796875, -5.0126953125, -4.55859375, -4.1044921875, -3.650390625, -3.1962890625, -2.7421875, -2.2880859375, -1.833984375, -1.3798828125, -0.92578125, -0.4716796875, -0.017578125, 0.4365234375, 0.890625, 1.3447265625, 1.798828125, 2.2529296875, 2.70703125, 3.1611328125, 3.615234375, 4.0693359375, 4.5234375, 4.9775390625, 5.431640625, 5.8857421875, 6.33984375, 6.7939453125, 7.248046875, 7.7021484375, 8.15625, 8.6103515625, 9.064453125, 9.5185546875, 9.97265625, 10.4267578125, 10.880859375, 11.3349609375, 11.7890625, 12.2431640625, 12.697265625, 13.1513671875, 13.60546875, 14.0595703125, 14.513671875, 14.9677734375, 15.421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 6.0, 15.0, 11.0, 19.0, 19.0, 25.0, 29.0, 23.0, 39.0, 41.0, 42.0, 44.0, 40.0, 63.0, 58.0, 1073.0, 45.0, 53.0, 59.0, 46.0, 41.0, 42.0, 29.0, 33.0, 24.0, 17.0, 17.0, 14.0, 8.0, 14.0, 7.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.380706787109375, -2.30633544921875, -2.231964111328125, -2.1575927734375, -2.083221435546875, -2.00885009765625, -1.934478759765625, -1.860107421875, -1.785736083984375, -1.71136474609375, -1.636993408203125, -1.5626220703125, -1.488250732421875, -1.41387939453125, -1.339508056640625, -1.26513671875, -1.190765380859375, -1.11639404296875, -1.042022705078125, -0.9676513671875, -0.893280029296875, -0.81890869140625, -0.744537353515625, -0.670166015625, -0.595794677734375, -0.52142333984375, -0.447052001953125, -0.3726806640625, -0.298309326171875, -0.22393798828125, -0.149566650390625, -0.0751953125, -0.000823974609375, 0.07354736328125, 0.147918701171875, 0.2222900390625, 0.296661376953125, 0.37103271484375, 0.445404052734375, 0.519775390625, 0.594146728515625, 0.66851806640625, 0.742889404296875, 0.8172607421875, 0.891632080078125, 0.96600341796875, 1.040374755859375, 1.11474609375, 1.189117431640625, 1.26348876953125, 1.337860107421875, 1.4122314453125, 1.486602783203125, 1.56097412109375, 1.635345458984375, 1.709716796875, 1.784088134765625, 1.85845947265625, 1.932830810546875, 2.0072021484375, 2.081573486328125, 2.15594482421875, 2.230316162109375, 2.3046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 10.0, 16.0, 24.0, 46.0, 74.0, 104.0, 148.0, 200.0, 316.0, 499.0, 739.0, 1225.0, 1936.0, 3985.0, 10746.0, 58438.0, 1918795.0, 77153.0, 12217.0, 4529.0, 2237.0, 1244.0, 731.0, 534.0, 392.0, 272.0, 149.0, 129.0, 64.0, 40.0, 25.0, 25.0, 11.0, 14.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.703125, -24.888427734375, -24.07373046875, -23.259033203125, -22.4443359375, -21.629638671875, -20.81494140625, -20.000244140625, -19.185546875, -18.370849609375, -17.55615234375, -16.741455078125, -15.9267578125, -15.112060546875, -14.29736328125, -13.482666015625, -12.66796875, -11.853271484375, -11.03857421875, -10.223876953125, -9.4091796875, -8.594482421875, -7.77978515625, -6.965087890625, -6.150390625, -5.335693359375, -4.52099609375, -3.706298828125, -2.8916015625, -2.076904296875, -1.26220703125, -0.447509765625, 0.3671875, 1.181884765625, 1.99658203125, 2.811279296875, 3.6259765625, 4.440673828125, 5.25537109375, 6.070068359375, 6.884765625, 7.699462890625, 8.51416015625, 9.328857421875, 10.1435546875, 10.958251953125, 11.77294921875, 12.587646484375, 13.40234375, 14.217041015625, 15.03173828125, 15.846435546875, 16.6611328125, 17.475830078125, 18.29052734375, 19.105224609375, 19.919921875, 20.734619140625, 21.54931640625, 22.364013671875, 23.1787109375, 23.993408203125, 24.80810546875, 25.622802734375, 26.4375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 42.0, 117.0, 425.0, 269.0, 67.0, 21.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.64306640625, -6.3955078125, -6.14794921875, -5.900390625, -5.65283203125, -5.4052734375, -5.15771484375, -4.91015625, -4.66259765625, -4.4150390625, -4.16748046875, -3.919921875, -3.67236328125, -3.4248046875, -3.17724609375, -2.9296875, -2.68212890625, -2.4345703125, -2.18701171875, -1.939453125, -1.69189453125, -1.4443359375, -1.19677734375, -0.94921875, -0.70166015625, -0.4541015625, -0.20654296875, 0.041015625, 0.28857421875, 0.5361328125, 0.78369140625, 1.03125, 1.27880859375, 1.5263671875, 1.77392578125, 2.021484375, 2.26904296875, 2.5166015625, 2.76416015625, 3.01171875, 3.25927734375, 3.5068359375, 3.75439453125, 4.001953125, 4.24951171875, 4.4970703125, 4.74462890625, 4.9921875, 5.23974609375, 5.4873046875, 5.73486328125, 5.982421875, 6.22998046875, 6.4775390625, 6.72509765625, 6.97265625, 7.22021484375, 7.4677734375, 7.71533203125, 7.962890625, 8.21044921875, 8.4580078125, 8.70556640625, 8.953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 17.0, 25.0, 33.0, 102.0, 496.0, 2862.0, 47850.0, 991885.0, 4212.0, 755.0, 152.0, 40.0, 23.0, 15.0, 11.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-140.625, -136.73046875, -132.8359375, -128.94140625, -125.046875, -121.15234375, -117.2578125, -113.36328125, -109.46875, -105.57421875, -101.6796875, -97.78515625, -93.890625, -89.99609375, -86.1015625, -82.20703125, -78.3125, -74.41796875, -70.5234375, -66.62890625, -62.734375, -58.83984375, -54.9453125, -51.05078125, -47.15625, -43.26171875, -39.3671875, -35.47265625, -31.578125, -27.68359375, -23.7890625, -19.89453125, -16.0, -12.10546875, -8.2109375, -4.31640625, -0.421875, 3.47265625, 7.3671875, 11.26171875, 15.15625, 19.05078125, 22.9453125, 26.83984375, 30.734375, 34.62890625, 38.5234375, 42.41796875, 46.3125, 50.20703125, 54.1015625, 57.99609375, 61.890625, 65.78515625, 69.6796875, 73.57421875, 77.46875, 81.36328125, 85.2578125, 89.15234375, 93.046875, 96.94140625, 100.8359375, 104.73046875, 108.625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 9.0, 13.0, 23.0, 26.0, 29.0, 54.0, 77.0, 162.0, 191.0, 126.0, 93.0, 59.0, 42.0, 15.0, 23.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.547995567321777, -8.305628776550293, -8.063262939453125, -7.820896625518799, -7.578530311584473, -7.3361639976501465, -7.09379768371582, -6.851430892944336, -6.609065055847168, -6.366698741912842, -6.124332427978516, -5.8819661140441895, -5.639599800109863, -5.397233486175537, -5.154867172241211, -4.912500381469727, -4.6701340675354, -4.427767753601074, -4.185401439666748, -3.943035125732422, -3.7006688117980957, -3.4583024978637695, -3.2159359455108643, -2.973569631576538, -2.731203317642212, -2.4888370037078857, -2.2464706897735596, -2.0041041374206543, -1.7617379426956177, -1.5193716287612915, -1.2770051956176758, -1.0346388816833496, -0.7922720909118652, -0.5499057769775391, -0.3075394034385681, -0.06517302989959717, 0.177193284034729, 0.4195595979690552, 0.6619260311126709, 0.9042923450469971, 1.1466586589813232, 1.3890249729156494, 1.6313912868499756, 1.8737577199935913, 2.116124153137207, 2.358490467071533, 2.6008567810058594, 2.8432230949401855, 3.0855894088745117, 3.327955722808838, 3.570322036743164, 3.8126883506774902, 4.055054664611816, 4.297420978546143, 4.539787292480469, 4.782154083251953, 5.024519920349121, 5.266886234283447, 5.509252548217773, 5.7516188621521, 5.993985176086426, 6.236351490020752, 6.478717803955078, 6.7210845947265625, 6.963450908660889]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 9.0, 7.0, 15.0, 10.0, 18.0, 25.0, 28.0, 25.0, 31.0, 28.0, 27.0, 27.0, 35.0, 46.0, 39.0, 39.0, 40.0, 44.0, 48.0, 43.0, 35.0, 38.0, 38.0, 33.0, 28.0, 28.0, 27.0, 17.0, 29.0, 19.0, 27.0, 17.0, 10.0, 14.0, 7.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8647117614746094, -3.7316665649414062, -3.598621368408203, -3.465576171875, -3.332530975341797, -3.1994857788085938, -3.0664408206939697, -2.9333956241607666, -2.8003504276275635, -2.6673052310943604, -2.5342600345611572, -2.401214838027954, -2.26816987991333, -2.135124683380127, -2.002079486846924, -1.8690342903137207, -1.7359890937805176, -1.6029438972473145, -1.4698987007141113, -1.3368536233901978, -1.2038084268569946, -1.0707632303237915, -0.9377180933952332, -0.8046729564666748, -0.6716277599334717, -0.5385825634002686, -0.4055374264717102, -0.27249225974082947, -0.13944709300994873, -0.0064018964767456055, 0.12664324045181274, 0.2596883773803711, 0.3927335739135742, 0.5257787704467773, 0.6588239073753357, 0.791869044303894, 0.9249142408370972, 1.0579594373703003, 1.1910045146942139, 1.324049711227417, 1.4570949077606201, 1.5901401042938232, 1.7231853008270264, 1.85623037815094, 1.989275574684143, 2.1223206520080566, 2.2553658485412598, 2.388411045074463, 2.521456241607666, 2.654501438140869, 2.7875466346740723, 2.9205918312072754, 3.0536370277404785, 3.1866822242736816, 3.3197271823883057, 3.452772378921509, 3.585817575454712, 3.718862771987915, 3.851907968521118, 3.9849531650543213, 4.117998123168945, 4.251043319702148, 4.384088516235352, 4.517133712768555, 4.650178909301758]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 10.0, 7.0, 12.0, 22.0, 19.0, 23.0, 28.0, 21.0, 33.0, 66.0, 47.0, 51.0, 53.0, 46.0, 69.0, 64.0, 55.0, 55.0, 56.0, 34.0, 39.0, 35.0, 27.0, 28.0, 22.0, 20.0, 18.0, 14.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.834686279296875, -2.73968505859375, -2.644683837890625, -2.5496826171875, -2.454681396484375, -2.35968017578125, -2.264678955078125, -2.169677734375, -2.074676513671875, -1.97967529296875, -1.884674072265625, -1.7896728515625, -1.694671630859375, -1.59967041015625, -1.504669189453125, -1.40966796875, -1.314666748046875, -1.21966552734375, -1.124664306640625, -1.0296630859375, -0.934661865234375, -0.83966064453125, -0.744659423828125, -0.649658203125, -0.554656982421875, -0.45965576171875, -0.364654541015625, -0.2696533203125, -0.174652099609375, -0.07965087890625, 0.015350341796875, 0.1103515625, 0.205352783203125, 0.30035400390625, 0.395355224609375, 0.4903564453125, 0.585357666015625, 0.68035888671875, 0.775360107421875, 0.870361328125, 0.965362548828125, 1.06036376953125, 1.155364990234375, 1.2503662109375, 1.345367431640625, 1.44036865234375, 1.535369873046875, 1.63037109375, 1.725372314453125, 1.82037353515625, 1.915374755859375, 2.0103759765625, 2.105377197265625, 2.20037841796875, 2.295379638671875, 2.390380859375, 2.485382080078125, 2.58038330078125, 2.675384521484375, 2.7703857421875, 2.865386962890625, 2.96038818359375, 3.055389404296875, 3.150390625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 25.0, 28.0, 47.0, 67.0, 115.0, 190.0, 260.0, 457.0, 706.0, 1206.0, 2049.0, 3518.0, 6397.0, 12337.0, 25738.0, 66906.0, 246401.0, 476009.0, 125749.0, 41750.0, 17990.0, 8979.0, 4929.0, 2607.0, 1598.0, 895.0, 601.0, 350.0, 235.0, 136.0, 97.0, 53.0, 42.0, 31.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.1973876953125, -3.088134765625, -2.9788818359375, -2.86962890625, -2.7603759765625, -2.651123046875, -2.5418701171875, -2.4326171875, -2.3233642578125, -2.214111328125, -2.1048583984375, -1.99560546875, -1.8863525390625, -1.777099609375, -1.6678466796875, -1.55859375, -1.4493408203125, -1.340087890625, -1.2308349609375, -1.12158203125, -1.0123291015625, -0.903076171875, -0.7938232421875, -0.6845703125, -0.5753173828125, -0.466064453125, -0.3568115234375, -0.24755859375, -0.1383056640625, -0.029052734375, 0.0802001953125, 0.189453125, 0.2987060546875, 0.407958984375, 0.5172119140625, 0.62646484375, 0.7357177734375, 0.844970703125, 0.9542236328125, 1.0634765625, 1.1727294921875, 1.281982421875, 1.3912353515625, 1.50048828125, 1.6097412109375, 1.718994140625, 1.8282470703125, 1.9375, 2.0467529296875, 2.156005859375, 2.2652587890625, 2.37451171875, 2.4837646484375, 2.593017578125, 2.7022705078125, 2.8115234375, 2.9207763671875, 3.030029296875, 3.1392822265625, 3.24853515625, 3.3577880859375, 3.467041015625, 3.5762939453125, 3.685546875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 10.0, 14.0, 7.0, 8.0, 9.0, 15.0, 19.0, 20.0, 13.0, 33.0, 24.0, 35.0, 32.0, 52.0, 56.0, 65.0, 94.0, 193.0, 1406.0, 330.0, 149.0, 81.0, 62.0, 51.0, 35.0, 35.0, 29.0, 29.0, 22.0, 23.0, 21.0, 11.0, 13.0, 11.0, 7.0, 3.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7589111328125, -6.486572265625, -6.2142333984375, -5.94189453125, -5.6695556640625, -5.397216796875, -5.1248779296875, -4.8525390625, -4.5802001953125, -4.307861328125, -4.0355224609375, -3.76318359375, -3.4908447265625, -3.218505859375, -2.9461669921875, -2.673828125, -2.4014892578125, -2.129150390625, -1.8568115234375, -1.58447265625, -1.3121337890625, -1.039794921875, -0.7674560546875, -0.4951171875, -0.2227783203125, 0.049560546875, 0.3218994140625, 0.59423828125, 0.8665771484375, 1.138916015625, 1.4112548828125, 1.68359375, 1.9559326171875, 2.228271484375, 2.5006103515625, 2.77294921875, 3.0452880859375, 3.317626953125, 3.5899658203125, 3.8623046875, 4.1346435546875, 4.406982421875, 4.6793212890625, 4.95166015625, 5.2239990234375, 5.496337890625, 5.7686767578125, 6.041015625, 6.3133544921875, 6.585693359375, 6.8580322265625, 7.13037109375, 7.4027099609375, 7.675048828125, 7.9473876953125, 8.2197265625, 8.4920654296875, 8.764404296875, 9.0367431640625, 9.30908203125, 9.5814208984375, 9.853759765625, 10.1260986328125, 10.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 14.0, 15.0, 14.0, 16.0, 18.0, 32.0, 44.0, 46.0, 61.0, 94.0, 137.0, 232.0, 461.0, 1187.0, 5278.0, 56616.0, 2670479.0, 391102.0, 15762.0, 2410.0, 680.0, 330.0, 179.0, 126.0, 91.0, 50.0, 50.0, 26.0, 25.0, 20.0, 19.0, 11.0, 15.0, 10.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-15.046875, -14.6260986328125, -14.205322265625, -13.7845458984375, -13.36376953125, -12.9429931640625, -12.522216796875, -12.1014404296875, -11.6806640625, -11.2598876953125, -10.839111328125, -10.4183349609375, -9.99755859375, -9.5767822265625, -9.156005859375, -8.7352294921875, -8.314453125, -7.8936767578125, -7.472900390625, -7.0521240234375, -6.63134765625, -6.2105712890625, -5.789794921875, -5.3690185546875, -4.9482421875, -4.5274658203125, -4.106689453125, -3.6859130859375, -3.26513671875, -2.8443603515625, -2.423583984375, -2.0028076171875, -1.58203125, -1.1612548828125, -0.740478515625, -0.3197021484375, 0.10107421875, 0.5218505859375, 0.942626953125, 1.3634033203125, 1.7841796875, 2.2049560546875, 2.625732421875, 3.0465087890625, 3.46728515625, 3.8880615234375, 4.308837890625, 4.7296142578125, 5.150390625, 5.5711669921875, 5.991943359375, 6.4127197265625, 6.83349609375, 7.2542724609375, 7.675048828125, 8.0958251953125, 8.5166015625, 8.9373779296875, 9.358154296875, 9.7789306640625, 10.19970703125, 10.6204833984375, 11.041259765625, 11.4620361328125, 11.8828125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [5.0, 445.0, 546.0, 19.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.746743202209473, -5.018730640411377, -0.29071807861328125, 4.437294960021973, 9.16530704498291, 13.893319129943848, 18.621334075927734, 23.349346160888672, 28.07735824584961, 32.80537033081055, 37.533382415771484, 42.26139831542969, 46.989410400390625, 51.71742248535156, 56.4454345703125, 61.17344665527344, 65.90145874023438, 70.62947082519531, 75.35748291015625, 80.08549499511719, 84.81350708007812, 89.54151916503906, 94.26953125, 98.99754333496094, 103.72555541992188, 108.45356750488281, 113.18157958984375, 117.90959167480469, 122.63760375976562, 127.36561584472656, 132.0936279296875, 136.82164001464844, 141.54966735839844, 146.27767944335938, 151.0056915283203, 155.73370361328125, 160.4617156982422, 165.18972778320312, 169.91773986816406, 174.645751953125, 179.37376403808594, 184.10177612304688, 188.8297882080078, 193.55780029296875, 198.2858123779297, 203.01382446289062, 207.74183654785156, 212.4698486328125, 217.1978759765625, 221.92588806152344, 226.65390014648438, 231.3819122314453, 236.10992431640625, 240.8379364013672, 245.56594848632812, 250.29396057128906, 255.02197265625, 259.75, 264.4779968261719, 269.2060241699219, 273.93402099609375, 278.66204833984375, 283.3900451660156, 288.1180725097656, 292.8460693359375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 10.0, 9.0, 14.0, 9.0, 11.0, 10.0, 13.0, 17.0, 26.0, 30.0, 29.0, 36.0, 31.0, 39.0, 41.0, 33.0, 50.0, 31.0, 32.0, 45.0, 51.0, 35.0, 49.0, 40.0, 29.0, 35.0, 25.0, 31.0, 24.0, 24.0, 31.0, 22.0, 17.0, 11.0, 13.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.77924156188965, -21.081886291503906, -20.384531021118164, -19.687175750732422, -18.989822387695312, -18.29246711730957, -17.595111846923828, -16.897756576538086, -16.200401306152344, -15.503046035766602, -14.805691719055176, -14.108336448669434, -13.410982131958008, -12.713626861572266, -12.016271591186523, -11.318916320800781, -10.621562957763672, -9.92420768737793, -9.226853370666504, -8.529498100280762, -7.832143306732178, -7.134788513183594, -6.437433242797852, -5.740078449249268, -5.042723655700684, -4.3453688621521, -3.6480138301849365, -2.9506587982177734, -2.2533040046691895, -1.5559492111206055, -0.8585939407348633, -0.1612391471862793, 0.5361175537109375, 1.233472466468811, 1.9308273792266846, 2.6281824111938477, 3.3255372047424316, 4.022891998291016, 4.720247268676758, 5.417602062225342, 6.114956855773926, 6.81231164932251, 7.509666442871094, 8.207021713256836, 8.904376983642578, 9.601731300354004, 10.299086570739746, 10.996440887451172, 11.693796157836914, 12.391151428222656, 13.088505744934082, 13.785861015319824, 14.48321533203125, 15.180570602416992, 15.877925872802734, 16.575281143188477, 17.27263641357422, 17.96999168395996, 18.667346954345703, 19.364700317382812, 20.062055587768555, 20.759410858154297, 21.45676612854004, 22.15412139892578, 22.85147476196289]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 15.0, 22.0, 15.0, 26.0, 28.0, 35.0, 30.0, 44.0, 54.0, 44.0, 45.0, 55.0, 49.0, 43.0, 58.0, 42.0, 55.0, 47.0, 41.0, 39.0, 31.0, 25.0, 28.0, 22.0, 16.0, 18.0, 19.0, 18.0, 9.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.45062255859375, -2.3621826171875, -2.27374267578125, -2.185302734375, -2.09686279296875, -2.0084228515625, -1.91998291015625, -1.83154296875, -1.74310302734375, -1.6546630859375, -1.56622314453125, -1.477783203125, -1.38934326171875, -1.3009033203125, -1.21246337890625, -1.1240234375, -1.03558349609375, -0.9471435546875, -0.85870361328125, -0.770263671875, -0.68182373046875, -0.5933837890625, -0.50494384765625, -0.41650390625, -0.32806396484375, -0.2396240234375, -0.15118408203125, -0.062744140625, 0.02569580078125, 0.1141357421875, 0.20257568359375, 0.291015625, 0.37945556640625, 0.4678955078125, 0.55633544921875, 0.644775390625, 0.73321533203125, 0.8216552734375, 0.91009521484375, 0.99853515625, 1.08697509765625, 1.1754150390625, 1.26385498046875, 1.352294921875, 1.44073486328125, 1.5291748046875, 1.61761474609375, 1.7060546875, 1.79449462890625, 1.8829345703125, 1.97137451171875, 2.059814453125, 2.14825439453125, 2.2366943359375, 2.32513427734375, 2.41357421875, 2.50201416015625, 2.5904541015625, 2.67889404296875, 2.767333984375, 2.85577392578125, 2.9442138671875, 3.03265380859375, 3.12109375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 10.0, 5.0, 7.0, 8.0, 14.0, 14.0, 33.0, 45.0, 62.0, 102.0, 172.0, 258.0, 393.0, 697.0, 1300.0, 2229.0, 4093.0, 7602.0, 14770.0, 29488.0, 68087.0, 313022.0, 2718772.0, 856636.0, 98117.0, 38020.0, 18534.0, 9578.0, 5301.0, 2836.0, 1590.0, 931.0, 547.0, 321.0, 244.0, 140.0, 94.0, 67.0, 38.0, 30.0, 16.0, 24.0, 14.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.2154541015625, -6.012939453125, -5.8104248046875, -5.60791015625, -5.4053955078125, -5.202880859375, -5.0003662109375, -4.7978515625, -4.5953369140625, -4.392822265625, -4.1903076171875, -3.98779296875, -3.7852783203125, -3.582763671875, -3.3802490234375, -3.177734375, -2.9752197265625, -2.772705078125, -2.5701904296875, -2.36767578125, -2.1651611328125, -1.962646484375, -1.7601318359375, -1.5576171875, -1.3551025390625, -1.152587890625, -0.9500732421875, -0.74755859375, -0.5450439453125, -0.342529296875, -0.1400146484375, 0.0625, 0.2650146484375, 0.467529296875, 0.6700439453125, 0.87255859375, 1.0750732421875, 1.277587890625, 1.4801025390625, 1.6826171875, 1.8851318359375, 2.087646484375, 2.2901611328125, 2.49267578125, 2.6951904296875, 2.897705078125, 3.1002197265625, 3.302734375, 3.5052490234375, 3.707763671875, 3.9102783203125, 4.11279296875, 4.3153076171875, 4.517822265625, 4.7203369140625, 4.9228515625, 5.1253662109375, 5.327880859375, 5.5303955078125, 5.73291015625, 5.9354248046875, 6.137939453125, 6.3404541015625, 6.54296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 16.0, 10.0, 21.0, 16.0, 49.0, 61.0, 74.0, 105.0, 148.0, 248.0, 491.0, 877.0, 816.0, 403.0, 208.0, 138.0, 91.0, 83.0, 58.0, 43.0, 32.0, 24.0, 16.0, 12.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.17938232421875, -5.9095458984375, -5.63970947265625, -5.369873046875, -5.10003662109375, -4.8302001953125, -4.56036376953125, -4.29052734375, -4.02069091796875, -3.7508544921875, -3.48101806640625, -3.211181640625, -2.94134521484375, -2.6715087890625, -2.40167236328125, -2.1318359375, -1.86199951171875, -1.5921630859375, -1.32232666015625, -1.052490234375, -0.78265380859375, -0.5128173828125, -0.24298095703125, 0.02685546875, 0.29669189453125, 0.5665283203125, 0.83636474609375, 1.106201171875, 1.37603759765625, 1.6458740234375, 1.91571044921875, 2.185546875, 2.45538330078125, 2.7252197265625, 2.99505615234375, 3.264892578125, 3.53472900390625, 3.8045654296875, 4.07440185546875, 4.34423828125, 4.61407470703125, 4.8839111328125, 5.15374755859375, 5.423583984375, 5.69342041015625, 5.9632568359375, 6.23309326171875, 6.5029296875, 6.77276611328125, 7.0426025390625, 7.31243896484375, 7.582275390625, 7.85211181640625, 8.1219482421875, 8.39178466796875, 8.66162109375, 8.93145751953125, 9.2012939453125, 9.47113037109375, 9.740966796875, 10.01080322265625, 10.2806396484375, 10.55047607421875, 10.8203125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 8.0, 25.0, 28.0, 56.0, 78.0, 108.0, 218.0, 492.0, 1378.0, 5216.0, 25015.0, 183040.0, 3617793.0, 315220.0, 35690.0, 6827.0, 1900.0, 572.0, 248.0, 139.0, 68.0, 49.0, 25.0, 20.0, 13.0, 12.0, 13.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.078125, -23.4700927734375, -22.862060546875, -22.2540283203125, -21.64599609375, -21.0379638671875, -20.429931640625, -19.8218994140625, -19.2138671875, -18.6058349609375, -17.997802734375, -17.3897705078125, -16.78173828125, -16.1737060546875, -15.565673828125, -14.9576416015625, -14.349609375, -13.7415771484375, -13.133544921875, -12.5255126953125, -11.91748046875, -11.3094482421875, -10.701416015625, -10.0933837890625, -9.4853515625, -8.8773193359375, -8.269287109375, -7.6612548828125, -7.05322265625, -6.4451904296875, -5.837158203125, -5.2291259765625, -4.62109375, -4.0130615234375, -3.405029296875, -2.7969970703125, -2.18896484375, -1.5809326171875, -0.972900390625, -0.3648681640625, 0.2431640625, 0.8511962890625, 1.459228515625, 2.0672607421875, 2.67529296875, 3.2833251953125, 3.891357421875, 4.4993896484375, 5.107421875, 5.7154541015625, 6.323486328125, 6.9315185546875, 7.53955078125, 8.1475830078125, 8.755615234375, 9.3636474609375, 9.9716796875, 10.5797119140625, 11.187744140625, 11.7957763671875, 12.40380859375, 13.0118408203125, 13.619873046875, 14.2279052734375, 14.8359375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 19.0, 25.0, 61.0, 87.0, 127.0, 152.0, 160.0, 102.0, 78.0, 58.0, 42.0, 31.0, 17.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-71.78440856933594, -70.34912872314453, -68.91385650634766, -67.47857666015625, -66.04330444335938, -64.60802459716797, -63.17274856567383, -61.73747253417969, -60.30219650268555, -58.866920471191406, -57.431644439697266, -55.996368408203125, -54.56108856201172, -53.12581253051758, -51.69053649902344, -50.2552604675293, -48.819984436035156, -47.384708404541016, -45.949432373046875, -44.514156341552734, -43.078880310058594, -41.64360046386719, -40.20832443237305, -38.773048400878906, -37.337772369384766, -35.902496337890625, -34.467220306396484, -33.031944274902344, -31.59666633605957, -30.16139030456543, -28.726112365722656, -27.290836334228516, -25.85555648803711, -24.42028045654297, -22.985004425048828, -21.549726486206055, -20.114450454711914, -18.679174423217773, -17.243896484375, -15.80862045288086, -14.373344421386719, -12.938068389892578, -11.502791404724121, -10.067514419555664, -8.632238388061523, -7.196961879730225, -5.761685371398926, -4.326408386230469, -2.891132354736328, -1.4558558464050293, -0.02057933807373047, 1.4146971702575684, 2.849973678588867, 4.285250186920166, 5.720526695251465, 7.155803680419922, 8.591079711914062, 10.026355743408203, 11.46163272857666, 12.896909713745117, 14.332185745239258, 15.767461776733398, 17.202739715576172, 18.638015747070312, 20.073291778564453]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 12.0, 6.0, 16.0, 14.0, 12.0, 16.0, 22.0, 25.0, 18.0, 24.0, 35.0, 35.0, 33.0, 45.0, 52.0, 38.0, 34.0, 42.0, 47.0, 46.0, 45.0, 34.0, 43.0, 38.0, 31.0, 30.0, 24.0, 20.0, 26.0, 18.0, 18.0, 15.0, 13.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.072383880615234, -20.38842010498047, -19.704458236694336, -19.02049446105957, -18.336532592773438, -17.652568817138672, -16.968605041503906, -16.284643173217773, -15.600679397583008, -14.916716575622559, -14.23275375366211, -13.548789978027344, -12.864827156066895, -12.180864334106445, -11.496901512145996, -10.812938690185547, -10.128975868225098, -9.445013046264648, -8.7610502243042, -8.07708740234375, -7.393123626708984, -6.709160804748535, -6.025197982788086, -5.3412346839904785, -4.657271862030029, -3.973308801651001, -3.2893457412719727, -2.6053829193115234, -1.9214198589324951, -1.2374567985534668, -0.5534939765930176, 0.13046932220458984, 0.8144321441650391, 1.4983952045440674, 2.1823582649230957, 2.866321086883545, 3.5502841472625732, 4.234247207641602, 4.918210029602051, 5.602173328399658, 6.286136150360107, 6.970098972320557, 7.654062271118164, 8.338025093078613, 9.021987915039062, 9.705951690673828, 10.389913558959961, 11.073877334594727, 11.757840156555176, 12.441802978515625, 13.125765800476074, 13.809728622436523, 14.493692398071289, 15.177655220031738, 15.861618041992188, 16.545581817626953, 17.229543685913086, 17.91350746154785, 18.597469329833984, 19.28143310546875, 19.965394973754883, 20.64935874938965, 21.33332061767578, 22.017284393310547, 22.701248168945312]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 9.0, 12.0, 21.0, 22.0, 33.0, 29.0, 31.0, 26.0, 41.0, 42.0, 46.0, 38.0, 50.0, 43.0, 49.0, 42.0, 36.0, 36.0, 43.0, 37.0, 39.0, 38.0, 41.0, 20.0, 20.0, 23.0, 10.0, 15.0, 13.0, 13.0, 19.0, 11.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.01641845703125, -1.9410400390625, -1.86566162109375, -1.790283203125, -1.71490478515625, -1.6395263671875, -1.56414794921875, -1.48876953125, -1.41339111328125, -1.3380126953125, -1.26263427734375, -1.187255859375, -1.11187744140625, -1.0364990234375, -0.96112060546875, -0.8857421875, -0.81036376953125, -0.7349853515625, -0.65960693359375, -0.584228515625, -0.50885009765625, -0.4334716796875, -0.35809326171875, -0.28271484375, -0.20733642578125, -0.1319580078125, -0.05657958984375, 0.018798828125, 0.09417724609375, 0.1695556640625, 0.24493408203125, 0.3203125, 0.39569091796875, 0.4710693359375, 0.54644775390625, 0.621826171875, 0.69720458984375, 0.7725830078125, 0.84796142578125, 0.92333984375, 0.99871826171875, 1.0740966796875, 1.14947509765625, 1.224853515625, 1.30023193359375, 1.3756103515625, 1.45098876953125, 1.5263671875, 1.60174560546875, 1.6771240234375, 1.75250244140625, 1.827880859375, 1.90325927734375, 1.9786376953125, 2.05401611328125, 2.12939453125, 2.20477294921875, 2.2801513671875, 2.35552978515625, 2.430908203125, 2.50628662109375, 2.5816650390625, 2.65704345703125, 2.732421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 9.0, 21.0, 34.0, 41.0, 70.0, 107.0, 125.0, 202.0, 280.0, 413.0, 605.0, 861.0, 1276.0, 1938.0, 2866.0, 4366.0, 6850.0, 10855.0, 18139.0, 31267.0, 61641.0, 279036.0, 471134.0, 70173.0, 34022.0, 19223.0, 11804.0, 7232.0, 4612.0, 3025.0, 1917.0, 1341.0, 889.0, 683.0, 427.0, 301.0, 215.0, 161.0, 105.0, 71.0, 63.0, 41.0, 29.0, 19.0, 13.0, 11.0, 7.0, 0.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.8828125, -9.5428466796875, -9.202880859375, -8.8629150390625, -8.52294921875, -8.1829833984375, -7.843017578125, -7.5030517578125, -7.1630859375, -6.8231201171875, -6.483154296875, -6.1431884765625, -5.80322265625, -5.4632568359375, -5.123291015625, -4.7833251953125, -4.443359375, -4.1033935546875, -3.763427734375, -3.4234619140625, -3.08349609375, -2.7435302734375, -2.403564453125, -2.0635986328125, -1.7236328125, -1.3836669921875, -1.043701171875, -0.7037353515625, -0.36376953125, -0.0238037109375, 0.316162109375, 0.6561279296875, 0.99609375, 1.3360595703125, 1.676025390625, 2.0159912109375, 2.35595703125, 2.6959228515625, 3.035888671875, 3.3758544921875, 3.7158203125, 4.0557861328125, 4.395751953125, 4.7357177734375, 5.07568359375, 5.4156494140625, 5.755615234375, 6.0955810546875, 6.435546875, 6.7755126953125, 7.115478515625, 7.4554443359375, 7.79541015625, 8.1353759765625, 8.475341796875, 8.8153076171875, 9.1552734375, 9.4952392578125, 9.835205078125, 10.1751708984375, 10.51513671875, 10.8551025390625, 11.195068359375, 11.5350341796875, 11.875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 13.0, 14.0, 11.0, 18.0, 11.0, 20.0, 19.0, 32.0, 41.0, 28.0, 41.0, 31.0, 48.0, 46.0, 45.0, 47.0, 1062.0, 48.0, 33.0, 30.0, 36.0, 41.0, 29.0, 33.0, 24.0, 30.0, 23.0, 19.0, 24.0, 18.0, 11.0, 8.0, 9.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.78515625, -1.7266693115234375, -1.668182373046875, -1.6096954345703125, -1.55120849609375, -1.4927215576171875, -1.434234619140625, -1.3757476806640625, -1.3172607421875, -1.2587738037109375, -1.200286865234375, -1.1417999267578125, -1.08331298828125, -1.0248260498046875, -0.966339111328125, -0.9078521728515625, -0.849365234375, -0.7908782958984375, -0.732391357421875, -0.6739044189453125, -0.61541748046875, -0.5569305419921875, -0.498443603515625, -0.4399566650390625, -0.3814697265625, -0.3229827880859375, -0.264495849609375, -0.2060089111328125, -0.14752197265625, -0.0890350341796875, -0.030548095703125, 0.0279388427734375, 0.08642578125, 0.1449127197265625, 0.203399658203125, 0.2618865966796875, 0.32037353515625, 0.3788604736328125, 0.437347412109375, 0.4958343505859375, 0.5543212890625, 0.6128082275390625, 0.671295166015625, 0.7297821044921875, 0.78826904296875, 0.8467559814453125, 0.905242919921875, 0.9637298583984375, 1.022216796875, 1.0807037353515625, 1.139190673828125, 1.1976776123046875, 1.25616455078125, 1.3146514892578125, 1.373138427734375, 1.4316253662109375, 1.4901123046875, 1.5485992431640625, 1.607086181640625, 1.6655731201171875, 1.72406005859375, 1.7825469970703125, 1.841033935546875, 1.8995208740234375, 1.9580078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 7.0, 4.0, 6.0, 14.0, 20.0, 30.0, 45.0, 54.0, 89.0, 128.0, 264.0, 375.0, 619.0, 937.0, 1589.0, 2993.0, 9093.0, 68365.0, 1954137.0, 44092.0, 7409.0, 2758.0, 1510.0, 929.0, 571.0, 346.0, 251.0, 162.0, 130.0, 67.0, 32.0, 36.0, 13.0, 15.0, 14.0, 7.0, 5.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.8359375, -37.515625, -36.1953125, -34.875, -33.5546875, -32.234375, -30.9140625, -29.59375, -28.2734375, -26.953125, -25.6328125, -24.3125, -22.9921875, -21.671875, -20.3515625, -19.03125, -17.7109375, -16.390625, -15.0703125, -13.75, -12.4296875, -11.109375, -9.7890625, -8.46875, -7.1484375, -5.828125, -4.5078125, -3.1875, -1.8671875, -0.546875, 0.7734375, 2.09375, 3.4140625, 4.734375, 6.0546875, 7.375, 8.6953125, 10.015625, 11.3359375, 12.65625, 13.9765625, 15.296875, 16.6171875, 17.9375, 19.2578125, 20.578125, 21.8984375, 23.21875, 24.5390625, 25.859375, 27.1796875, 28.5, 29.8203125, 31.140625, 32.4609375, 33.78125, 35.1015625, 36.421875, 37.7421875, 39.0625, 40.3828125, 41.703125, 43.0234375, 44.34375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 24.0, 47.0, 752.0, 76.0, 30.0, 19.0, 8.0, 10.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.828857421875, -10.42333984375, -10.017822265625, -9.6123046875, -9.206787109375, -8.80126953125, -8.395751953125, -7.990234375, -7.584716796875, -7.17919921875, -6.773681640625, -6.3681640625, -5.962646484375, -5.55712890625, -5.151611328125, -4.74609375, -4.340576171875, -3.93505859375, -3.529541015625, -3.1240234375, -2.718505859375, -2.31298828125, -1.907470703125, -1.501953125, -1.096435546875, -0.69091796875, -0.285400390625, 0.1201171875, 0.525634765625, 0.93115234375, 1.336669921875, 1.7421875, 2.147705078125, 2.55322265625, 2.958740234375, 3.3642578125, 3.769775390625, 4.17529296875, 4.580810546875, 4.986328125, 5.391845703125, 5.79736328125, 6.202880859375, 6.6083984375, 7.013916015625, 7.41943359375, 7.824951171875, 8.23046875, 8.635986328125, 9.04150390625, 9.447021484375, 9.8525390625, 10.258056640625, 10.66357421875, 11.069091796875, 11.474609375, 11.880126953125, 12.28564453125, 12.691162109375, 13.0966796875, 13.502197265625, 13.90771484375, 14.313232421875, 14.71875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 23.0, 64.0, 236.0, 1200.0, 14160.0, 1028432.0, 3671.0, 491.0, 125.0, 53.0, 22.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-244.375, -237.63671875, -230.8984375, -224.16015625, -217.421875, -210.68359375, -203.9453125, -197.20703125, -190.46875, -183.73046875, -176.9921875, -170.25390625, -163.515625, -156.77734375, -150.0390625, -143.30078125, -136.5625, -129.82421875, -123.0859375, -116.34765625, -109.609375, -102.87109375, -96.1328125, -89.39453125, -82.65625, -75.91796875, -69.1796875, -62.44140625, -55.703125, -48.96484375, -42.2265625, -35.48828125, -28.75, -22.01171875, -15.2734375, -8.53515625, -1.796875, 4.94140625, 11.6796875, 18.41796875, 25.15625, 31.89453125, 38.6328125, 45.37109375, 52.109375, 58.84765625, 65.5859375, 72.32421875, 79.0625, 85.80078125, 92.5390625, 99.27734375, 106.015625, 112.75390625, 119.4921875, 126.23046875, 132.96875, 139.70703125, 146.4453125, 153.18359375, 159.921875, 166.66015625, 173.3984375, 180.13671875, 186.875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 13.0, 16.0, 11.0, 9.0, 13.0, 16.0, 22.0, 38.0, 58.0, 63.0, 89.0, 135.0, 133.0, 78.0, 65.0, 43.0, 37.0, 40.0, 19.0, 21.0, 17.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.570699691772461, -6.352674961090088, -6.134650230407715, -5.916625499725342, -5.698600769042969, -5.480576038360596, -5.262551307678223, -5.044526100158691, -4.826501846313477, -4.6084771156311035, -4.3904523849487305, -4.172427654266357, -3.9544029235839844, -3.7363781929016113, -3.518353223800659, -3.300328493118286, -3.082303524017334, -2.864278793334961, -2.646254062652588, -2.428229331970215, -2.210204601287842, -1.9921797513961792, -1.7741549015045166, -1.5561301708221436, -1.3381054401397705, -1.1200807094573975, -0.9020559191703796, -0.6840311288833618, -0.46600639820098877, -0.24798166751861572, -0.029956817626953125, 0.18806791305541992, 0.40609264373779297, 0.624117374420166, 0.8421421647071838, 1.0601669549942017, 1.2781916856765747, 1.4962164163589478, 1.7142412662506104, 1.9322659969329834, 2.1502907276153564, 2.3683154582977295, 2.5863401889801025, 2.8043651580810547, 3.0223898887634277, 3.240414619445801, 3.458439350128174, 3.676464080810547, 3.89448881149292, 4.112513542175293, 4.330538272857666, 4.548563003540039, 4.766587734222412, 4.984612464904785, 5.202637672424316, 5.420661926269531, 5.6386871337890625, 5.8567118644714355, 6.074736595153809, 6.292761325836182, 6.510786056518555, 6.728810787200928, 6.946835517883301, 7.164860725402832, 7.382884979248047]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 6.0, 18.0, 11.0, 14.0, 18.0, 25.0, 23.0, 37.0, 28.0, 39.0, 42.0, 41.0, 40.0, 32.0, 51.0, 59.0, 50.0, 41.0, 48.0, 49.0, 39.0, 45.0, 40.0, 35.0, 26.0, 26.0, 23.0, 16.0, 18.0, 21.0, 7.0, 6.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.732614040374756, -6.518804550170898, -6.304995059967041, -6.091185569763184, -5.877376079559326, -5.663566589355469, -5.449756622314453, -5.235947132110596, -5.022137641906738, -4.808328151702881, -4.594518661499023, -4.380709171295166, -4.166899681091309, -3.953089952468872, -3.7392804622650146, -3.525470733642578, -3.3116614818573, -3.0978519916534424, -2.884042501449585, -2.6702327728271484, -2.456423282623291, -2.2426137924194336, -2.028804302215576, -1.8149946928024292, -1.6011852025985718, -1.3873757123947144, -1.1735661029815674, -0.95975661277771, -0.7459470629692078, -0.5321375131607056, -0.31832802295684814, -0.10451841354370117, 0.10929107666015625, 0.32310062646865845, 0.5369101762771606, 0.7507196664810181, 0.9645292162895203, 1.1783387660980225, 1.3921482563018799, 1.6059578657150269, 1.8197673559188843, 2.0335769653320312, 2.2473864555358887, 2.461195945739746, 2.6750054359436035, 2.888814926147461, 3.1026244163513184, 3.316434144973755, 3.5302436351776123, 3.7440531253814697, 3.957862615585327, 4.171672344207764, 4.385481834411621, 4.5992913246154785, 4.813100814819336, 5.026910305023193, 5.240719795227051, 5.454529285430908, 5.668338775634766, 5.882148265838623, 6.0959577560424805, 6.309767723083496, 6.523576736450195, 6.737386703491211, 6.951196193695068]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 13.0, 8.0, 19.0, 21.0, 22.0, 34.0, 38.0, 37.0, 32.0, 33.0, 38.0, 45.0, 59.0, 52.0, 46.0, 48.0, 51.0, 40.0, 52.0, 48.0, 36.0, 32.0, 26.0, 21.0, 23.0, 15.0, 24.0, 20.0, 14.0, 12.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.208892822265625, -2.11700439453125, -2.025115966796875, -1.9332275390625, -1.841339111328125, -1.74945068359375, -1.657562255859375, -1.565673828125, -1.473785400390625, -1.38189697265625, -1.290008544921875, -1.1981201171875, -1.106231689453125, -1.01434326171875, -0.922454833984375, -0.83056640625, -0.738677978515625, -0.64678955078125, -0.554901123046875, -0.4630126953125, -0.371124267578125, -0.27923583984375, -0.187347412109375, -0.095458984375, -0.003570556640625, 0.08831787109375, 0.180206298828125, 0.2720947265625, 0.363983154296875, 0.45587158203125, 0.547760009765625, 0.6396484375, 0.731536865234375, 0.82342529296875, 0.915313720703125, 1.0072021484375, 1.099090576171875, 1.19097900390625, 1.282867431640625, 1.374755859375, 1.466644287109375, 1.55853271484375, 1.650421142578125, 1.7423095703125, 1.834197998046875, 1.92608642578125, 2.017974853515625, 2.10986328125, 2.201751708984375, 2.29364013671875, 2.385528564453125, 2.4774169921875, 2.569305419921875, 2.66119384765625, 2.753082275390625, 2.844970703125, 2.936859130859375, 3.02874755859375, 3.120635986328125, 3.2125244140625, 3.304412841796875, 3.39630126953125, 3.488189697265625, 3.580078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 6.0, 18.0, 13.0, 32.0, 30.0, 56.0, 101.0, 132.0, 172.0, 252.0, 400.0, 597.0, 961.0, 1644.0, 2753.0, 4945.0, 9217.0, 18896.0, 42575.0, 133776.0, 597327.0, 147421.0, 45071.0, 19758.0, 9770.0, 5147.0, 2909.0, 1723.0, 1011.0, 675.0, 371.0, 258.0, 162.0, 100.0, 86.0, 59.0, 38.0, 14.0, 22.0, 10.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.05963134765625, -4.8614501953125, -4.66326904296875, -4.465087890625, -4.26690673828125, -4.0687255859375, -3.87054443359375, -3.67236328125, -3.47418212890625, -3.2760009765625, -3.07781982421875, -2.879638671875, -2.68145751953125, -2.4832763671875, -2.28509521484375, -2.0869140625, -1.88873291015625, -1.6905517578125, -1.49237060546875, -1.294189453125, -1.09600830078125, -0.8978271484375, -0.69964599609375, -0.50146484375, -0.30328369140625, -0.1051025390625, 0.09307861328125, 0.291259765625, 0.48944091796875, 0.6876220703125, 0.88580322265625, 1.083984375, 1.28216552734375, 1.4803466796875, 1.67852783203125, 1.876708984375, 2.07489013671875, 2.2730712890625, 2.47125244140625, 2.66943359375, 2.86761474609375, 3.0657958984375, 3.26397705078125, 3.462158203125, 3.66033935546875, 3.8585205078125, 4.05670166015625, 4.2548828125, 4.45306396484375, 4.6512451171875, 4.84942626953125, 5.047607421875, 5.24578857421875, 5.4439697265625, 5.64215087890625, 5.84033203125, 6.03851318359375, 6.2366943359375, 6.43487548828125, 6.633056640625, 6.83123779296875, 7.0294189453125, 7.22760009765625, 7.42578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 18.0, 33.0, 25.0, 26.0, 25.0, 31.0, 41.0, 41.0, 72.0, 71.0, 95.0, 146.0, 1424.0, 360.0, 131.0, 93.0, 70.0, 52.0, 45.0, 39.0, 35.0, 35.0, 21.0, 15.0, 16.0, 15.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.307373046875, -8.97412109375, -8.640869140625, -8.3076171875, -7.974365234375, -7.64111328125, -7.307861328125, -6.974609375, -6.641357421875, -6.30810546875, -5.974853515625, -5.6416015625, -5.308349609375, -4.97509765625, -4.641845703125, -4.30859375, -3.975341796875, -3.64208984375, -3.308837890625, -2.9755859375, -2.642333984375, -2.30908203125, -1.975830078125, -1.642578125, -1.309326171875, -0.97607421875, -0.642822265625, -0.3095703125, 0.023681640625, 0.35693359375, 0.690185546875, 1.0234375, 1.356689453125, 1.68994140625, 2.023193359375, 2.3564453125, 2.689697265625, 3.02294921875, 3.356201171875, 3.689453125, 4.022705078125, 4.35595703125, 4.689208984375, 5.0224609375, 5.355712890625, 5.68896484375, 6.022216796875, 6.35546875, 6.688720703125, 7.02197265625, 7.355224609375, 7.6884765625, 8.021728515625, 8.35498046875, 8.688232421875, 9.021484375, 9.354736328125, 9.68798828125, 10.021240234375, 10.3544921875, 10.687744140625, 11.02099609375, 11.354248046875, 11.6875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 17.0, 13.0, 11.0, 19.0, 22.0, 27.0, 32.0, 37.0, 55.0, 111.0, 156.0, 276.0, 766.0, 2423.0, 11071.0, 82469.0, 2693648.0, 322074.0, 25543.0, 4646.0, 1220.0, 427.0, 214.0, 118.0, 61.0, 41.0, 43.0, 32.0, 27.0, 20.0, 17.0, 9.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.797119140625, -16.25048828125, -15.703857421875, -15.1572265625, -14.610595703125, -14.06396484375, -13.517333984375, -12.970703125, -12.424072265625, -11.87744140625, -11.330810546875, -10.7841796875, -10.237548828125, -9.69091796875, -9.144287109375, -8.59765625, -8.051025390625, -7.50439453125, -6.957763671875, -6.4111328125, -5.864501953125, -5.31787109375, -4.771240234375, -4.224609375, -3.677978515625, -3.13134765625, -2.584716796875, -2.0380859375, -1.491455078125, -0.94482421875, -0.398193359375, 0.1484375, 0.695068359375, 1.24169921875, 1.788330078125, 2.3349609375, 2.881591796875, 3.42822265625, 3.974853515625, 4.521484375, 5.068115234375, 5.61474609375, 6.161376953125, 6.7080078125, 7.254638671875, 7.80126953125, 8.347900390625, 8.89453125, 9.441162109375, 9.98779296875, 10.534423828125, 11.0810546875, 11.627685546875, 12.17431640625, 12.720947265625, 13.267578125, 13.814208984375, 14.36083984375, 14.907470703125, 15.4541015625, 16.000732421875, 16.54736328125, 17.093994140625, 17.640625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 33.0, 93.0, 201.0, 300.0, 207.0, 122.0, 37.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96629524230957, -25.113798141479492, -23.261301040649414, -21.408803939819336, -19.556306838989258, -17.70380973815918, -15.851312637329102, -13.998815536499023, -12.146318435668945, -10.293821334838867, -8.441324234008789, -6.588827133178711, -4.736330032348633, -2.8838329315185547, -1.0313358306884766, 0.8211612701416016, 2.6736583709716797, 4.526155471801758, 6.378652572631836, 8.231149673461914, 10.083646774291992, 11.93614387512207, 13.788640975952148, 15.641138076782227, 17.493635177612305, 19.346132278442383, 21.19862937927246, 23.05112648010254, 24.903623580932617, 26.756120681762695, 28.608617782592773, 30.46111488342285, 32.31361389160156, 34.16611099243164, 36.01860809326172, 37.8711051940918, 39.723602294921875, 41.57609939575195, 43.42859649658203, 45.28109359741211, 47.13359069824219, 48.986087799072266, 50.838584899902344, 52.69108200073242, 54.5435791015625, 56.39607620239258, 58.248573303222656, 60.101070404052734, 61.95356750488281, 63.80606460571289, 65.65856170654297, 67.51106262207031, 69.36355590820312, 71.21604919433594, 73.06855010986328, 74.92105102539062, 76.77354431152344, 78.62603759765625, 80.4785385131836, 82.33103942871094, 84.18353271484375, 86.03602600097656, 87.8885269165039, 89.74102783203125, 91.59352111816406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 11.0, 16.0, 13.0, 31.0, 22.0, 18.0, 26.0, 26.0, 35.0, 36.0, 36.0, 40.0, 45.0, 37.0, 49.0, 56.0, 41.0, 31.0, 40.0, 36.0, 32.0, 35.0, 24.0, 27.0, 29.0, 20.0, 24.0, 19.0, 22.0, 13.0, 15.0, 20.0, 8.0, 7.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.59970474243164, -25.747615814208984, -24.89552879333496, -24.043439865112305, -23.19135284423828, -22.339263916015625, -21.48717498779297, -20.635087966918945, -19.78299903869629, -18.930910110473633, -18.07882308959961, -17.226734161376953, -16.37464714050293, -15.522558212280273, -14.670470237731934, -13.818382263183594, -12.966294288635254, -12.114206314086914, -11.262118339538574, -10.410030364990234, -9.557941436767578, -8.705853462219238, -7.853765487670898, -7.0016770362854, -6.1495890617370605, -5.297501087188721, -4.445412635803223, -3.593324661254883, -2.741236448287964, -1.889148235321045, -1.037060260772705, -0.18497180938720703, 0.6671161651611328, 1.5192043781280518, 2.3712925910949707, 3.2233805656433105, 4.075469017028809, 4.927556991577148, 5.779644966125488, 6.631733417510986, 7.483821392059326, 8.335909843444824, 9.187997817993164, 10.040085792541504, 10.892173767089844, 11.7442626953125, 12.596349716186523, 13.44843864440918, 14.30052661895752, 15.15261459350586, 16.004703521728516, 16.85679054260254, 17.708879470825195, 18.56096649169922, 19.413055419921875, 20.26514434814453, 21.117231369018555, 21.96932029724121, 22.821407318115234, 23.67349624633789, 24.525583267211914, 25.37767219543457, 26.229759216308594, 27.08184814453125, 27.933937072753906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 13.0, 13.0, 18.0, 28.0, 22.0, 33.0, 30.0, 23.0, 45.0, 43.0, 43.0, 45.0, 48.0, 65.0, 42.0, 37.0, 42.0, 46.0, 43.0, 47.0, 32.0, 27.0, 30.0, 25.0, 20.0, 19.0, 22.0, 17.0, 16.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.393798828125, -2.29736328125, -2.200927734375, -2.1044921875, -2.008056640625, -1.91162109375, -1.815185546875, -1.71875, -1.622314453125, -1.52587890625, -1.429443359375, -1.3330078125, -1.236572265625, -1.14013671875, -1.043701171875, -0.947265625, -0.850830078125, -0.75439453125, -0.657958984375, -0.5615234375, -0.465087890625, -0.36865234375, -0.272216796875, -0.17578125, -0.079345703125, 0.01708984375, 0.113525390625, 0.2099609375, 0.306396484375, 0.40283203125, 0.499267578125, 0.595703125, 0.692138671875, 0.78857421875, 0.885009765625, 0.9814453125, 1.077880859375, 1.17431640625, 1.270751953125, 1.3671875, 1.463623046875, 1.56005859375, 1.656494140625, 1.7529296875, 1.849365234375, 1.94580078125, 2.042236328125, 2.138671875, 2.235107421875, 2.33154296875, 2.427978515625, 2.5244140625, 2.620849609375, 2.71728515625, 2.813720703125, 2.91015625, 3.006591796875, 3.10302734375, 3.199462890625, 3.2958984375, 3.392333984375, 3.48876953125, 3.585205078125, 3.681640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 12.0, 14.0, 24.0, 18.0, 46.0, 62.0, 74.0, 154.0, 200.0, 335.0, 483.0, 776.0, 1200.0, 2117.0, 3588.0, 6547.0, 11816.0, 23213.0, 52388.0, 198159.0, 1589525.0, 1964535.0, 230896.0, 54733.0, 24184.0, 12369.0, 6673.0, 3784.0, 2243.0, 1365.0, 910.0, 570.0, 369.0, 271.0, 175.0, 126.0, 91.0, 68.0, 35.0, 36.0, 21.0, 20.0, 13.0, 9.0, 10.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.4140625, -5.2210693359375, -5.028076171875, -4.8350830078125, -4.64208984375, -4.4490966796875, -4.256103515625, -4.0631103515625, -3.8701171875, -3.6771240234375, -3.484130859375, -3.2911376953125, -3.09814453125, -2.9051513671875, -2.712158203125, -2.5191650390625, -2.326171875, -2.1331787109375, -1.940185546875, -1.7471923828125, -1.55419921875, -1.3612060546875, -1.168212890625, -0.9752197265625, -0.7822265625, -0.5892333984375, -0.396240234375, -0.2032470703125, -0.01025390625, 0.1827392578125, 0.375732421875, 0.5687255859375, 0.76171875, 0.9547119140625, 1.147705078125, 1.3406982421875, 1.53369140625, 1.7266845703125, 1.919677734375, 2.1126708984375, 2.3056640625, 2.4986572265625, 2.691650390625, 2.8846435546875, 3.07763671875, 3.2706298828125, 3.463623046875, 3.6566162109375, 3.849609375, 4.0426025390625, 4.235595703125, 4.4285888671875, 4.62158203125, 4.8145751953125, 5.007568359375, 5.2005615234375, 5.3935546875, 5.5865478515625, 5.779541015625, 5.9725341796875, 6.16552734375, 6.3585205078125, 6.551513671875, 6.7445068359375, 6.9375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 18.0, 19.0, 31.0, 39.0, 49.0, 84.0, 113.0, 172.0, 371.0, 713.0, 940.0, 643.0, 312.0, 153.0, 109.0, 82.0, 60.0, 38.0, 41.0, 12.0, 12.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3641357421875, -9.056396484375, -8.7486572265625, -8.44091796875, -8.1331787109375, -7.825439453125, -7.5177001953125, -7.2099609375, -6.9022216796875, -6.594482421875, -6.2867431640625, -5.97900390625, -5.6712646484375, -5.363525390625, -5.0557861328125, -4.748046875, -4.4403076171875, -4.132568359375, -3.8248291015625, -3.51708984375, -3.2093505859375, -2.901611328125, -2.5938720703125, -2.2861328125, -1.9783935546875, -1.670654296875, -1.3629150390625, -1.05517578125, -0.7474365234375, -0.439697265625, -0.1319580078125, 0.17578125, 0.4835205078125, 0.791259765625, 1.0989990234375, 1.40673828125, 1.7144775390625, 2.022216796875, 2.3299560546875, 2.6376953125, 2.9454345703125, 3.253173828125, 3.5609130859375, 3.86865234375, 4.1763916015625, 4.484130859375, 4.7918701171875, 5.099609375, 5.4073486328125, 5.715087890625, 6.0228271484375, 6.33056640625, 6.6383056640625, 6.946044921875, 7.2537841796875, 7.5615234375, 7.8692626953125, 8.177001953125, 8.4847412109375, 8.79248046875, 9.1002197265625, 9.407958984375, 9.7156982421875, 10.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 10.0, 32.0, 32.0, 50.0, 86.0, 174.0, 341.0, 681.0, 1664.0, 4676.0, 16562.0, 79864.0, 1387124.0, 2567562.0, 105722.0, 20632.0, 5629.0, 1860.0, 769.0, 370.0, 176.0, 104.0, 60.0, 29.0, 24.0, 8.0, 13.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.439697265625, -15.91064453125, -15.381591796875, -14.8525390625, -14.323486328125, -13.79443359375, -13.265380859375, -12.736328125, -12.207275390625, -11.67822265625, -11.149169921875, -10.6201171875, -10.091064453125, -9.56201171875, -9.032958984375, -8.50390625, -7.974853515625, -7.44580078125, -6.916748046875, -6.3876953125, -5.858642578125, -5.32958984375, -4.800537109375, -4.271484375, -3.742431640625, -3.21337890625, -2.684326171875, -2.1552734375, -1.626220703125, -1.09716796875, -0.568115234375, -0.0390625, 0.489990234375, 1.01904296875, 1.548095703125, 2.0771484375, 2.606201171875, 3.13525390625, 3.664306640625, 4.193359375, 4.722412109375, 5.25146484375, 5.780517578125, 6.3095703125, 6.838623046875, 7.36767578125, 7.896728515625, 8.42578125, 8.954833984375, 9.48388671875, 10.012939453125, 10.5419921875, 11.071044921875, 11.60009765625, 12.129150390625, 12.658203125, 13.187255859375, 13.71630859375, 14.245361328125, 14.7744140625, 15.303466796875, 15.83251953125, 16.361572265625, 16.890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 18.0, 24.0, 28.0, 41.0, 54.0, 73.0, 111.0, 142.0, 130.0, 103.0, 83.0, 70.0, 36.0, 25.0, 24.0, 18.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.594764709472656, -34.35810470581055, -33.12144088745117, -31.88477897644043, -30.648117065429688, -29.411457061767578, -28.174795150756836, -26.938133239746094, -25.70147132873535, -24.46480941772461, -23.228147506713867, -21.991485595703125, -20.754825592041016, -19.51816177368164, -18.28150177001953, -17.04483985900879, -15.808177947998047, -14.571516036987305, -13.334854125976562, -12.098193168640137, -10.861531257629395, -9.624869346618652, -8.388208389282227, -7.151546478271484, -5.914884567260742, -4.67822265625, -3.441561222076416, -2.204899549484253, -0.9682378768920898, 0.26842403411865234, 1.5050854682922363, 2.7417469024658203, 3.978412628173828, 5.21507453918457, 6.451735973358154, 7.688397407531738, 8.92505931854248, 10.161721229553223, 11.398382186889648, 12.63504409790039, 13.871706008911133, 15.108367919921875, 16.345029830932617, 17.58169174194336, 18.81835174560547, 20.055015563964844, 21.291675567626953, 22.528337478637695, 23.764999389648438, 25.00166130065918, 26.238323211669922, 27.474985122680664, 28.711647033691406, 29.948307037353516, 31.184968948364258, 32.421630859375, 33.658294677734375, 34.894954681396484, 36.13161849975586, 37.36827850341797, 38.604942321777344, 39.84160232543945, 41.07826614379883, 42.31492614746094, 43.55158615112305]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 3.0, 7.0, 13.0, 12.0, 11.0, 13.0, 19.0, 19.0, 22.0, 25.0, 31.0, 28.0, 37.0, 32.0, 25.0, 40.0, 42.0, 41.0, 42.0, 27.0, 40.0, 34.0, 41.0, 37.0, 37.0, 40.0, 35.0, 24.0, 24.0, 29.0, 12.0, 25.0, 18.0, 14.0, 16.0, 16.0, 10.0, 15.0, 8.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-22.668424606323242, -21.979143142700195, -21.28986167907715, -20.6005802154541, -19.911298751831055, -19.222017288208008, -18.532737731933594, -17.843456268310547, -17.1541748046875, -16.464893341064453, -15.775611877441406, -15.08633041381836, -14.397048950195312, -13.707767486572266, -13.018486976623535, -12.329205513000488, -11.639923095703125, -10.950641632080078, -10.261360168457031, -9.572078704833984, -8.882797241210938, -8.19351577758789, -7.50423526763916, -6.814953804016113, -6.125672340393066, -5.4363908767700195, -4.747109413146973, -4.057828426361084, -3.368546962738037, -2.6792654991149902, -1.9899845123291016, -1.3007030487060547, -0.6114234924316406, 0.0778578519821167, 0.767139196395874, 1.4564204216003418, 2.1457018852233887, 2.8349833488464355, 3.524264335632324, 4.213545799255371, 4.902827262878418, 5.592108726501465, 6.281390190124512, 6.9706711769104, 7.659952640533447, 8.349233627319336, 9.038515090942383, 9.72779655456543, 10.417078018188477, 11.106359481811523, 11.79564094543457, 12.484922409057617, 13.174203872680664, 13.863485336303711, 14.552765846252441, 15.242047309875488, 15.931328773498535, 16.620609283447266, 17.309890747070312, 17.99917221069336, 18.688453674316406, 19.377735137939453, 20.0670166015625, 20.756298065185547, 21.445579528808594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 14.0, 19.0, 21.0, 22.0, 15.0, 28.0, 26.0, 28.0, 34.0, 38.0, 29.0, 40.0, 30.0, 38.0, 40.0, 39.0, 41.0, 34.0, 35.0, 35.0, 37.0, 29.0, 35.0, 33.0, 14.0, 22.0, 20.0, 26.0, 16.0, 24.0, 19.0, 14.0, 5.0, 6.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.296875, -2.2203369140625, -2.143798828125, -2.0672607421875, -1.99072265625, -1.9141845703125, -1.837646484375, -1.7611083984375, -1.6845703125, -1.6080322265625, -1.531494140625, -1.4549560546875, -1.37841796875, -1.3018798828125, -1.225341796875, -1.1488037109375, -1.072265625, -0.9957275390625, -0.919189453125, -0.8426513671875, -0.76611328125, -0.6895751953125, -0.613037109375, -0.5364990234375, -0.4599609375, -0.3834228515625, -0.306884765625, -0.2303466796875, -0.15380859375, -0.0772705078125, -0.000732421875, 0.0758056640625, 0.15234375, 0.2288818359375, 0.305419921875, 0.3819580078125, 0.45849609375, 0.5350341796875, 0.611572265625, 0.6881103515625, 0.7646484375, 0.8411865234375, 0.917724609375, 0.9942626953125, 1.07080078125, 1.1473388671875, 1.223876953125, 1.3004150390625, 1.376953125, 1.4534912109375, 1.530029296875, 1.6065673828125, 1.68310546875, 1.7596435546875, 1.836181640625, 1.9127197265625, 1.9892578125, 2.0657958984375, 2.142333984375, 2.2188720703125, 2.29541015625, 2.3719482421875, 2.448486328125, 2.5250244140625, 2.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 12.0, 19.0, 31.0, 31.0, 40.0, 59.0, 109.0, 111.0, 171.0, 217.0, 282.0, 444.0, 591.0, 792.0, 1155.0, 1654.0, 2601.0, 4471.0, 9412.0, 25489.0, 117873.0, 722753.0, 113239.0, 24972.0, 9311.0, 4410.0, 2575.0, 1654.0, 1187.0, 764.0, 556.0, 441.0, 290.0, 235.0, 153.0, 109.0, 98.0, 76.0, 37.0, 40.0, 29.0, 18.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.19146728515625, -5.9884033203125, -5.78533935546875, -5.582275390625, -5.37921142578125, -5.1761474609375, -4.97308349609375, -4.77001953125, -4.56695556640625, -4.3638916015625, -4.16082763671875, -3.957763671875, -3.75469970703125, -3.5516357421875, -3.34857177734375, -3.1455078125, -2.94244384765625, -2.7393798828125, -2.53631591796875, -2.333251953125, -2.13018798828125, -1.9271240234375, -1.72406005859375, -1.52099609375, -1.31793212890625, -1.1148681640625, -0.91180419921875, -0.708740234375, -0.50567626953125, -0.3026123046875, -0.09954833984375, 0.103515625, 0.30657958984375, 0.5096435546875, 0.71270751953125, 0.915771484375, 1.11883544921875, 1.3218994140625, 1.52496337890625, 1.72802734375, 1.93109130859375, 2.1341552734375, 2.33721923828125, 2.540283203125, 2.74334716796875, 2.9464111328125, 3.14947509765625, 3.3525390625, 3.55560302734375, 3.7586669921875, 3.96173095703125, 4.164794921875, 4.36785888671875, 4.5709228515625, 4.77398681640625, 4.97705078125, 5.18011474609375, 5.3831787109375, 5.58624267578125, 5.789306640625, 5.99237060546875, 6.1954345703125, 6.39849853515625, 6.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 11.0, 7.0, 4.0, 12.0, 9.0, 9.0, 19.0, 25.0, 29.0, 26.0, 27.0, 32.0, 27.0, 39.0, 45.0, 35.0, 41.0, 40.0, 1078.0, 43.0, 38.0, 34.0, 38.0, 36.0, 43.0, 43.0, 32.0, 32.0, 21.0, 17.0, 20.0, 15.0, 19.0, 13.0, 12.0, 12.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.0850830078125, -2.011962890625, -1.9388427734375, -1.86572265625, -1.7926025390625, -1.719482421875, -1.6463623046875, -1.5732421875, -1.5001220703125, -1.427001953125, -1.3538818359375, -1.28076171875, -1.2076416015625, -1.134521484375, -1.0614013671875, -0.98828125, -0.9151611328125, -0.842041015625, -0.7689208984375, -0.69580078125, -0.6226806640625, -0.549560546875, -0.4764404296875, -0.4033203125, -0.3302001953125, -0.257080078125, -0.1839599609375, -0.11083984375, -0.0377197265625, 0.035400390625, 0.1085205078125, 0.181640625, 0.2547607421875, 0.327880859375, 0.4010009765625, 0.47412109375, 0.5472412109375, 0.620361328125, 0.6934814453125, 0.7666015625, 0.8397216796875, 0.912841796875, 0.9859619140625, 1.05908203125, 1.1322021484375, 1.205322265625, 1.2784423828125, 1.3515625, 1.4246826171875, 1.497802734375, 1.5709228515625, 1.64404296875, 1.7171630859375, 1.790283203125, 1.8634033203125, 1.9365234375, 2.0096435546875, 2.082763671875, 2.1558837890625, 2.22900390625, 2.3021240234375, 2.375244140625, 2.4483642578125, 2.521484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 9.0, 13.0, 10.0, 9.0, 19.0, 25.0, 22.0, 37.0, 31.0, 63.0, 66.0, 114.0, 120.0, 172.0, 276.0, 315.0, 457.0, 653.0, 1004.0, 1536.0, 2470.0, 4353.0, 9495.0, 32477.0, 1329657.0, 665232.0, 28540.0, 8662.0, 4153.0, 2322.0, 1489.0, 1017.0, 609.0, 444.0, 344.0, 211.0, 192.0, 120.0, 93.0, 68.0, 62.0, 34.0, 32.0, 28.0, 19.0, 18.0, 6.0, 9.0, 4.0, 4.0, 0.0, 3.0, 6.0, 5.0], "bins": [-8.3046875, -8.067138671875, -7.82958984375, -7.592041015625, -7.3544921875, -7.116943359375, -6.87939453125, -6.641845703125, -6.404296875, -6.166748046875, -5.92919921875, -5.691650390625, -5.4541015625, -5.216552734375, -4.97900390625, -4.741455078125, -4.50390625, -4.266357421875, -4.02880859375, -3.791259765625, -3.5537109375, -3.316162109375, -3.07861328125, -2.841064453125, -2.603515625, -2.365966796875, -2.12841796875, -1.890869140625, -1.6533203125, -1.415771484375, -1.17822265625, -0.940673828125, -0.703125, -0.465576171875, -0.22802734375, 0.009521484375, 0.2470703125, 0.484619140625, 0.72216796875, 0.959716796875, 1.197265625, 1.434814453125, 1.67236328125, 1.909912109375, 2.1474609375, 2.385009765625, 2.62255859375, 2.860107421875, 3.09765625, 3.335205078125, 3.57275390625, 3.810302734375, 4.0478515625, 4.285400390625, 4.52294921875, 4.760498046875, 4.998046875, 5.235595703125, 5.47314453125, 5.710693359375, 5.9482421875, 6.185791015625, 6.42333984375, 6.660888671875, 6.8984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 17.0, 19.0, 25.0, 28.0, 60.0, 184.0, 362.0, 97.0, 49.0, 30.0, 20.0, 15.0, 16.0, 13.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.38671875, -2.3244171142578125, -2.262115478515625, -2.1998138427734375, -2.13751220703125, -2.0752105712890625, -2.012908935546875, -1.9506072998046875, -1.8883056640625, -1.8260040283203125, -1.763702392578125, -1.7014007568359375, -1.63909912109375, -1.5767974853515625, -1.514495849609375, -1.4521942138671875, -1.389892578125, -1.3275909423828125, -1.265289306640625, -1.2029876708984375, -1.14068603515625, -1.0783843994140625, -1.016082763671875, -0.9537811279296875, -0.8914794921875, -0.8291778564453125, -0.766876220703125, -0.7045745849609375, -0.64227294921875, -0.5799713134765625, -0.517669677734375, -0.4553680419921875, -0.39306640625, -0.3307647705078125, -0.268463134765625, -0.2061614990234375, -0.14385986328125, -0.0815582275390625, -0.019256591796875, 0.0430450439453125, 0.1053466796875, 0.1676483154296875, 0.229949951171875, 0.2922515869140625, 0.35455322265625, 0.4168548583984375, 0.479156494140625, 0.5414581298828125, 0.603759765625, 0.6660614013671875, 0.728363037109375, 0.7906646728515625, 0.85296630859375, 0.9152679443359375, 0.977569580078125, 1.0398712158203125, 1.1021728515625, 1.1644744873046875, 1.226776123046875, 1.2890777587890625, 1.35137939453125, 1.4136810302734375, 1.475982666015625, 1.5382843017578125, 1.6005859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 3.0, 8.0, 5.0, 8.0, 18.0, 34.0, 55.0, 102.0, 292.0, 1296.0, 7571.0, 999347.0, 36042.0, 2828.0, 575.0, 153.0, 66.0, 33.0, 21.0, 17.0, 17.0, 15.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-28.71875, -27.60302734375, -26.4873046875, -25.37158203125, -24.255859375, -23.14013671875, -22.0244140625, -20.90869140625, -19.79296875, -18.67724609375, -17.5615234375, -16.44580078125, -15.330078125, -14.21435546875, -13.0986328125, -11.98291015625, -10.8671875, -9.75146484375, -8.6357421875, -7.52001953125, -6.404296875, -5.28857421875, -4.1728515625, -3.05712890625, -1.94140625, -0.82568359375, 0.2900390625, 1.40576171875, 2.521484375, 3.63720703125, 4.7529296875, 5.86865234375, 6.984375, 8.10009765625, 9.2158203125, 10.33154296875, 11.447265625, 12.56298828125, 13.6787109375, 14.79443359375, 15.91015625, 17.02587890625, 18.1416015625, 19.25732421875, 20.373046875, 21.48876953125, 22.6044921875, 23.72021484375, 24.8359375, 25.95166015625, 27.0673828125, 28.18310546875, 29.298828125, 30.41455078125, 31.5302734375, 32.64599609375, 33.76171875, 34.87744140625, 35.9931640625, 37.10888671875, 38.224609375, 39.34033203125, 40.4560546875, 41.57177734375, 42.6875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 17.0, 43.0, 228.0, 583.0, 107.0, 26.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082770347595215, -3.6443777084350586, -3.2059853076934814, -2.7675929069519043, -2.329200267791748, -1.8908076286315918, -1.4524152278900146, -1.0140228271484375, -0.5756301879882812, -0.13723766803741455, 0.30115485191345215, 0.7395473718643188, 1.1779398918151855, 1.6163325309753418, 2.054724931716919, 2.493117332458496, 2.9315099716186523, 3.3699026107788086, 3.8082950115203857, 4.246687412261963, 4.685080051422119, 5.123472690582275, 5.561864852905273, 6.00025749206543, 6.438650131225586, 6.877042770385742, 7.315435409545898, 7.7538275718688965, 8.192220687866211, 8.630613327026367, 9.069005012512207, 9.507397651672363, 9.945791244506836, 10.384183883666992, 10.822576522827148, 11.260969161987305, 11.699361801147461, 12.137754440307617, 12.576146125793457, 13.014538764953613, 13.45293140411377, 13.891324043273926, 14.329716682434082, 14.768109321594238, 15.206501007080078, 15.644893646240234, 16.08328628540039, 16.521678924560547, 16.960071563720703, 17.39846420288086, 17.836856842041016, 18.275249481201172, 18.713642120361328, 19.152034759521484, 19.59042739868164, 20.028820037841797, 20.467212677001953, 20.90560531616211, 21.343997955322266, 21.782390594482422, 22.220783233642578, 22.659175872802734, 23.09756851196289, 23.535961151123047, 23.97435188293457]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 10.0, 9.0, 10.0, 3.0, 13.0, 12.0, 21.0, 23.0, 25.0, 26.0, 25.0, 38.0, 43.0, 42.0, 43.0, 44.0, 55.0, 47.0, 55.0, 42.0, 42.0, 40.0, 44.0, 47.0, 38.0, 26.0, 25.0, 21.0, 23.0, 21.0, 19.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5552830696105957, -1.4940707683563232, -1.4328584671020508, -1.3716461658477783, -1.3104337453842163, -1.2492214441299438, -1.1880091428756714, -1.126796841621399, -1.065584421157837, -1.0043721199035645, -0.9431597590446472, -0.8819474577903748, -0.8207350969314575, -0.7595227956771851, -0.6983104944229126, -0.6370981931686401, -0.5758858919143677, -0.5146735906600952, -0.453461229801178, -0.3922489285469055, -0.33103659749031067, -0.2698242664337158, -0.20861196517944336, -0.1473996341228485, -0.08618730306625366, -0.02497497946023941, 0.03623734414577484, 0.0974496603012085, 0.15866199135780334, 0.2198743224143982, 0.28108662366867065, 0.3422989547252655, 0.40351128578186035, 0.4647236168384552, 0.52593594789505, 0.5871482491493225, 0.6483606100082397, 0.7095729112625122, 0.7707852125167847, 0.8319975137710571, 0.8932098746299744, 0.9544221758842468, 1.015634536743164, 1.0768468379974365, 1.138059139251709, 1.1992714405059814, 1.260483741760254, 1.321696162223816, 1.3829084634780884, 1.4441207647323608, 1.5053330659866333, 1.5665454864501953, 1.6277577877044678, 1.6889700889587402, 1.7501823902130127, 1.8113946914672852, 1.8726069927215576, 1.93381929397583, 1.9950315952301025, 2.056243896484375, 2.1174561977386475, 2.17866849899292, 2.2398810386657715, 2.301093339920044, 2.3623056411743164]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 9.0, 11.0, 11.0, 17.0, 14.0, 31.0, 26.0, 25.0, 39.0, 43.0, 32.0, 41.0, 42.0, 28.0, 39.0, 43.0, 48.0, 52.0, 41.0, 52.0, 37.0, 44.0, 35.0, 32.0, 24.0, 27.0, 29.0, 26.0, 14.0, 11.0, 11.0, 11.0, 9.0, 11.0, 6.0, 7.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.904296875, -2.815826416015625, -2.72735595703125, -2.638885498046875, -2.5504150390625, -2.461944580078125, -2.37347412109375, -2.285003662109375, -2.196533203125, -2.108062744140625, -2.01959228515625, -1.931121826171875, -1.8426513671875, -1.754180908203125, -1.66571044921875, -1.577239990234375, -1.48876953125, -1.400299072265625, -1.31182861328125, -1.223358154296875, -1.1348876953125, -1.046417236328125, -0.95794677734375, -0.869476318359375, -0.781005859375, -0.692535400390625, -0.60406494140625, -0.515594482421875, -0.4271240234375, -0.338653564453125, -0.25018310546875, -0.161712646484375, -0.0732421875, 0.015228271484375, 0.10369873046875, 0.192169189453125, 0.2806396484375, 0.369110107421875, 0.45758056640625, 0.546051025390625, 0.634521484375, 0.722991943359375, 0.81146240234375, 0.899932861328125, 0.9884033203125, 1.076873779296875, 1.16534423828125, 1.253814697265625, 1.34228515625, 1.430755615234375, 1.51922607421875, 1.607696533203125, 1.6961669921875, 1.784637451171875, 1.87310791015625, 1.961578369140625, 2.050048828125, 2.138519287109375, 2.22698974609375, 2.315460205078125, 2.4039306640625, 2.492401123046875, 2.58087158203125, 2.669342041015625, 2.7578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 6.0, 9.0, 7.0, 29.0, 31.0, 46.0, 65.0, 90.0, 160.0, 202.0, 320.0, 512.0, 814.0, 1188.0, 1812.0, 2901.0, 4678.0, 7652.0, 12303.0, 21298.0, 38886.0, 76964.0, 195786.0, 392694.0, 146780.0, 63315.0, 32729.0, 18351.0, 10852.0, 6478.0, 4121.0, 2569.0, 1669.0, 1129.0, 685.0, 485.0, 303.0, 213.0, 138.0, 98.0, 64.0, 46.0, 19.0, 17.0, 16.0, 11.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.47161865234375, -3.3572998046875, -3.24298095703125, -3.128662109375, -3.01434326171875, -2.9000244140625, -2.78570556640625, -2.67138671875, -2.55706787109375, -2.4427490234375, -2.32843017578125, -2.214111328125, -2.09979248046875, -1.9854736328125, -1.87115478515625, -1.7568359375, -1.64251708984375, -1.5281982421875, -1.41387939453125, -1.299560546875, -1.18524169921875, -1.0709228515625, -0.95660400390625, -0.84228515625, -0.72796630859375, -0.6136474609375, -0.49932861328125, -0.385009765625, -0.27069091796875, -0.1563720703125, -0.04205322265625, 0.072265625, 0.18658447265625, 0.3009033203125, 0.41522216796875, 0.529541015625, 0.64385986328125, 0.7581787109375, 0.87249755859375, 0.98681640625, 1.10113525390625, 1.2154541015625, 1.32977294921875, 1.444091796875, 1.55841064453125, 1.6727294921875, 1.78704833984375, 1.9013671875, 2.01568603515625, 2.1300048828125, 2.24432373046875, 2.358642578125, 2.47296142578125, 2.5872802734375, 2.70159912109375, 2.81591796875, 2.93023681640625, 3.0445556640625, 3.15887451171875, 3.273193359375, 3.38751220703125, 3.5018310546875, 3.61614990234375, 3.73046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 10.0, 16.0, 19.0, 15.0, 24.0, 27.0, 37.0, 34.0, 45.0, 49.0, 56.0, 83.0, 139.0, 251.0, 1420.0, 253.0, 136.0, 68.0, 54.0, 53.0, 50.0, 41.0, 27.0, 12.0, 24.0, 17.0, 8.0, 9.0, 6.0, 8.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-12.046875, -11.70703125, -11.3671875, -11.02734375, -10.6875, -10.34765625, -10.0078125, -9.66796875, -9.328125, -8.98828125, -8.6484375, -8.30859375, -7.96875, -7.62890625, -7.2890625, -6.94921875, -6.609375, -6.26953125, -5.9296875, -5.58984375, -5.25, -4.91015625, -4.5703125, -4.23046875, -3.890625, -3.55078125, -3.2109375, -2.87109375, -2.53125, -2.19140625, -1.8515625, -1.51171875, -1.171875, -0.83203125, -0.4921875, -0.15234375, 0.1875, 0.52734375, 0.8671875, 1.20703125, 1.546875, 1.88671875, 2.2265625, 2.56640625, 2.90625, 3.24609375, 3.5859375, 3.92578125, 4.265625, 4.60546875, 4.9453125, 5.28515625, 5.625, 5.96484375, 6.3046875, 6.64453125, 6.984375, 7.32421875, 7.6640625, 8.00390625, 8.34375, 8.68359375, 9.0234375, 9.36328125, 9.703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 22.0, 41.0, 49.0, 65.0, 89.0, 129.0, 215.0, 437.0, 1597.0, 10625.0, 221794.0, 2826820.0, 75691.0, 6014.0, 996.0, 358.0, 210.0, 120.0, 91.0, 71.0, 51.0, 32.0, 32.0, 20.0, 16.0, 13.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.189453125, -15.59765625, -15.005859375, -14.4140625, -13.822265625, -13.23046875, -12.638671875, -12.046875, -11.455078125, -10.86328125, -10.271484375, -9.6796875, -9.087890625, -8.49609375, -7.904296875, -7.3125, -6.720703125, -6.12890625, -5.537109375, -4.9453125, -4.353515625, -3.76171875, -3.169921875, -2.578125, -1.986328125, -1.39453125, -0.802734375, -0.2109375, 0.380859375, 0.97265625, 1.564453125, 2.15625, 2.748046875, 3.33984375, 3.931640625, 4.5234375, 5.115234375, 5.70703125, 6.298828125, 6.890625, 7.482421875, 8.07421875, 8.666015625, 9.2578125, 9.849609375, 10.44140625, 11.033203125, 11.625, 12.216796875, 12.80859375, 13.400390625, 13.9921875, 14.583984375, 15.17578125, 15.767578125, 16.359375, 16.951171875, 17.54296875, 18.134765625, 18.7265625, 19.318359375, 19.91015625, 20.501953125, 21.09375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [3.0, 20.0, 327.0, 597.0, 73.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.854573249816895, -9.474528312683105, -5.094483375549316, -0.7144384384155273, 3.6656064987182617, 8.04565143585205, 12.42569637298584, 16.805740356445312, 21.185787200927734, 25.565832138061523, 29.945877075195312, 34.32592010498047, 38.70596694946289, 43.08601379394531, 47.46605682373047, 51.846099853515625, 56.22614669799805, 60.60619354248047, 64.98623657226562, 69.36627960205078, 73.74632263183594, 78.12637329101562, 82.50641632080078, 86.88645935058594, 91.2665023803711, 95.64654541015625, 100.02659606933594, 104.4066390991211, 108.78668212890625, 113.1667251586914, 117.54676818847656, 121.92681884765625, 126.30685424804688, 130.68690490722656, 135.0669403076172, 139.44699096679688, 143.8270263671875, 148.2070770263672, 152.58712768554688, 156.9671630859375, 161.3472137451172, 165.72726440429688, 170.1072998046875, 174.4873504638672, 178.86740112304688, 183.2474365234375, 187.6274871826172, 192.0075225830078, 196.3875732421875, 200.7676239013672, 205.1476593017578, 209.5277099609375, 213.90774536132812, 218.2877960205078, 222.6678466796875, 227.04788208007812, 231.4279327392578, 235.8079833984375, 240.18801879882812, 244.5680694580078, 248.9481201171875, 253.32815551757812, 257.70819091796875, 262.0882568359375, 266.4682922363281]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 9.0, 12.0, 12.0, 14.0, 13.0, 12.0, 15.0, 24.0, 23.0, 34.0, 26.0, 23.0, 31.0, 32.0, 33.0, 19.0, 33.0, 37.0, 36.0, 27.0, 33.0, 24.0, 41.0, 39.0, 34.0, 36.0, 35.0, 39.0, 26.0, 24.0, 20.0, 22.0, 23.0, 18.0, 17.0, 14.0, 10.0, 13.0, 11.0, 10.0, 14.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.88700294494629, -21.217126846313477, -20.547252655029297, -19.877376556396484, -19.207500457763672, -18.53762435913086, -17.86775016784668, -17.197874069213867, -16.527999877929688, -15.858124732971191, -15.188248634338379, -14.518373489379883, -13.84849739074707, -13.178622245788574, -12.508747100830078, -11.838871002197266, -11.168994903564453, -10.499119758605957, -9.829243659973145, -9.159368515014648, -8.489492416381836, -7.81961727142334, -7.149742126464844, -6.4798665046691895, -5.809990882873535, -5.140115261077881, -4.470239639282227, -3.8003644943237305, -3.130488872528076, -2.460613250732422, -1.7907381057739258, -1.1208624839782715, -0.4509849548339844, 0.21889054775238037, 0.8887660503387451, 1.5586414337158203, 2.2285170555114746, 2.898392677307129, 3.568267822265625, 4.238143444061279, 4.908019065856934, 5.577894687652588, 6.247770309448242, 6.917645454406738, 7.587521076202393, 8.257396697998047, 8.927271842956543, 9.597146987915039, 10.267023086547852, 10.936898231506348, 11.60677433013916, 12.276649475097656, 12.946525573730469, 13.616400718688965, 14.286275863647461, 14.956151962280273, 15.62602710723877, 16.295902252197266, 16.965778350830078, 17.63565444946289, 18.30552864074707, 18.975404739379883, 19.645278930664062, 20.315155029296875, 20.985031127929688]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 16.0, 13.0, 13.0, 18.0, 24.0, 20.0, 25.0, 22.0, 33.0, 31.0, 34.0, 47.0, 37.0, 44.0, 43.0, 55.0, 53.0, 36.0, 42.0, 52.0, 39.0, 38.0, 28.0, 24.0, 36.0, 21.0, 21.0, 19.0, 18.0, 15.0, 11.0, 7.0, 10.0, 5.0, 8.0, 12.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.095703125, -3.002593994140625, -2.90948486328125, -2.816375732421875, -2.7232666015625, -2.630157470703125, -2.53704833984375, -2.443939208984375, -2.350830078125, -2.257720947265625, -2.16461181640625, -2.071502685546875, -1.9783935546875, -1.885284423828125, -1.79217529296875, -1.699066162109375, -1.60595703125, -1.512847900390625, -1.41973876953125, -1.326629638671875, -1.2335205078125, -1.140411376953125, -1.04730224609375, -0.954193115234375, -0.861083984375, -0.767974853515625, -0.67486572265625, -0.581756591796875, -0.4886474609375, -0.395538330078125, -0.30242919921875, -0.209320068359375, -0.1162109375, -0.023101806640625, 0.07000732421875, 0.163116455078125, 0.2562255859375, 0.349334716796875, 0.44244384765625, 0.535552978515625, 0.628662109375, 0.721771240234375, 0.81488037109375, 0.907989501953125, 1.0010986328125, 1.094207763671875, 1.18731689453125, 1.280426025390625, 1.37353515625, 1.466644287109375, 1.55975341796875, 1.652862548828125, 1.7459716796875, 1.839080810546875, 1.93218994140625, 2.025299072265625, 2.118408203125, 2.211517333984375, 2.30462646484375, 2.397735595703125, 2.4908447265625, 2.583953857421875, 2.67706298828125, 2.770172119140625, 2.86328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 11.0, 26.0, 32.0, 53.0, 81.0, 113.0, 147.0, 237.0, 332.0, 550.0, 867.0, 1486.0, 2600.0, 4608.0, 8473.0, 16960.0, 38347.0, 130966.0, 1106509.0, 2452063.0, 317416.0, 60328.0, 24414.0, 11817.0, 6306.0, 3623.0, 2091.0, 1292.0, 799.0, 523.0, 357.0, 234.0, 162.0, 103.0, 89.0, 65.0, 38.0, 37.0, 23.0, 17.0, 14.0, 12.0, 7.0, 9.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.4609375, -6.24725341796875, -6.0335693359375, -5.81988525390625, -5.606201171875, -5.39251708984375, -5.1788330078125, -4.96514892578125, -4.75146484375, -4.53778076171875, -4.3240966796875, -4.11041259765625, -3.896728515625, -3.68304443359375, -3.4693603515625, -3.25567626953125, -3.0419921875, -2.82830810546875, -2.6146240234375, -2.40093994140625, -2.187255859375, -1.97357177734375, -1.7598876953125, -1.54620361328125, -1.33251953125, -1.11883544921875, -0.9051513671875, -0.69146728515625, -0.477783203125, -0.26409912109375, -0.0504150390625, 0.16326904296875, 0.376953125, 0.59063720703125, 0.8043212890625, 1.01800537109375, 1.231689453125, 1.44537353515625, 1.6590576171875, 1.87274169921875, 2.08642578125, 2.30010986328125, 2.5137939453125, 2.72747802734375, 2.941162109375, 3.15484619140625, 3.3685302734375, 3.58221435546875, 3.7958984375, 4.00958251953125, 4.2232666015625, 4.43695068359375, 4.650634765625, 4.86431884765625, 5.0780029296875, 5.29168701171875, 5.50537109375, 5.71905517578125, 5.9327392578125, 6.14642333984375, 6.360107421875, 6.57379150390625, 6.7874755859375, 7.00115966796875, 7.21484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 16.0, 13.0, 14.0, 33.0, 37.0, 68.0, 73.0, 93.0, 155.0, 261.0, 467.0, 789.0, 801.0, 464.0, 225.0, 148.0, 115.0, 74.0, 55.0, 33.0, 27.0, 22.0, 12.0, 18.0, 8.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6953125, -9.41796875, -9.140625, -8.86328125, -8.5859375, -8.30859375, -8.03125, -7.75390625, -7.4765625, -7.19921875, -6.921875, -6.64453125, -6.3671875, -6.08984375, -5.8125, -5.53515625, -5.2578125, -4.98046875, -4.703125, -4.42578125, -4.1484375, -3.87109375, -3.59375, -3.31640625, -3.0390625, -2.76171875, -2.484375, -2.20703125, -1.9296875, -1.65234375, -1.375, -1.09765625, -0.8203125, -0.54296875, -0.265625, 0.01171875, 0.2890625, 0.56640625, 0.84375, 1.12109375, 1.3984375, 1.67578125, 1.953125, 2.23046875, 2.5078125, 2.78515625, 3.0625, 3.33984375, 3.6171875, 3.89453125, 4.171875, 4.44921875, 4.7265625, 5.00390625, 5.28125, 5.55859375, 5.8359375, 6.11328125, 6.390625, 6.66796875, 6.9453125, 7.22265625, 7.5, 7.77734375, 8.0546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 10.0, 24.0, 33.0, 45.0, 99.0, 129.0, 320.0, 751.0, 1812.0, 6095.0, 26018.0, 193031.0, 3549601.0, 365341.0, 38623.0, 8179.0, 2412.0, 876.0, 421.0, 184.0, 94.0, 54.0, 36.0, 20.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.01904296875, -16.4443359375, -15.86962890625, -15.294921875, -14.72021484375, -14.1455078125, -13.57080078125, -12.99609375, -12.42138671875, -11.8466796875, -11.27197265625, -10.697265625, -10.12255859375, -9.5478515625, -8.97314453125, -8.3984375, -7.82373046875, -7.2490234375, -6.67431640625, -6.099609375, -5.52490234375, -4.9501953125, -4.37548828125, -3.80078125, -3.22607421875, -2.6513671875, -2.07666015625, -1.501953125, -0.92724609375, -0.3525390625, 0.22216796875, 0.796875, 1.37158203125, 1.9462890625, 2.52099609375, 3.095703125, 3.67041015625, 4.2451171875, 4.81982421875, 5.39453125, 5.96923828125, 6.5439453125, 7.11865234375, 7.693359375, 8.26806640625, 8.8427734375, 9.41748046875, 9.9921875, 10.56689453125, 11.1416015625, 11.71630859375, 12.291015625, 12.86572265625, 13.4404296875, 14.01513671875, 14.58984375, 15.16455078125, 15.7392578125, 16.31396484375, 16.888671875, 17.46337890625, 18.0380859375, 18.61279296875, 19.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 23.0, 17.0, 35.0, 53.0, 93.0, 120.0, 140.0, 125.0, 131.0, 87.0, 48.0, 49.0, 20.0, 15.0, 11.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.46260070800781, -40.11937713623047, -38.776153564453125, -37.43292999267578, -36.08970642089844, -34.74648666381836, -33.403263092041016, -32.06003952026367, -30.716815948486328, -29.373592376708984, -28.03036880493164, -26.68714714050293, -25.343923568725586, -24.000699996948242, -22.65747833251953, -21.314254760742188, -19.971031188964844, -18.6278076171875, -17.284584045410156, -15.941362380981445, -14.598138809204102, -13.254915237426758, -11.91169261932373, -10.568470001220703, -9.22524642944336, -7.882023334503174, -6.538800239562988, -5.195577144622803, -3.852354049682617, -2.5091309547424316, -1.165907859802246, 0.17731475830078125, 1.520538330078125, 2.8637614250183105, 4.206984519958496, 5.550207614898682, 6.893430709838867, 8.236654281616211, 9.579876899719238, 10.923099517822266, 12.26632308959961, 13.609546661376953, 14.95276927947998, 16.295991897583008, 17.63921546936035, 18.982439041137695, 20.325660705566406, 21.66888427734375, 23.012107849121094, 24.355331420898438, 25.69855499267578, 27.041776657104492, 28.385000228881836, 29.72822380065918, 31.07144546508789, 32.414669036865234, 33.75789260864258, 35.10111618041992, 36.444339752197266, 37.78756332397461, 39.13078308105469, 40.47400665283203, 41.817230224609375, 43.16045379638672, 44.50367736816406]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 13.0, 9.0, 11.0, 17.0, 19.0, 23.0, 17.0, 34.0, 36.0, 35.0, 45.0, 35.0, 40.0, 39.0, 42.0, 54.0, 43.0, 42.0, 50.0, 40.0, 43.0, 38.0, 39.0, 32.0, 24.0, 18.0, 26.0, 22.0, 17.0, 21.0, 12.0, 13.0, 9.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.348052978515625, -27.520893096923828, -26.6937313079834, -25.8665714263916, -25.039409637451172, -24.212249755859375, -23.385089874267578, -22.55792808532715, -21.73076629638672, -20.903606414794922, -20.076444625854492, -19.249284744262695, -18.422122955322266, -17.59496307373047, -16.767803192138672, -15.940641403198242, -15.113481521606445, -14.286320686340332, -13.459159851074219, -12.631999969482422, -11.804838180541992, -10.977678298950195, -10.150517463684082, -9.323356628417969, -8.496195793151855, -7.669034957885742, -6.841874122619629, -6.014713764190674, -5.1875529289245605, -4.360392093658447, -3.533231735229492, -2.706070899963379, -1.8789100646972656, -1.051749348640442, -0.22458863258361816, 0.602571964263916, 1.4297327995300293, 2.2568936347961426, 3.0840539932250977, 3.911214828491211, 4.738375663757324, 5.5655364990234375, 6.392697334289551, 7.219857692718506, 8.047018051147461, 8.87417984008789, 9.701339721679688, 10.5285005569458, 11.355661392211914, 12.182822227478027, 13.00998306274414, 13.837142944335938, 14.664304733276367, 15.491464614868164, 16.318626403808594, 17.14578628540039, 17.972946166992188, 18.800106048583984, 19.627267837524414, 20.45442771911621, 21.28158950805664, 22.108749389648438, 22.935909271240234, 23.763071060180664, 24.590232849121094]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 11.0, 8.0, 20.0, 17.0, 24.0, 15.0, 21.0, 27.0, 33.0, 34.0, 38.0, 35.0, 36.0, 50.0, 41.0, 60.0, 55.0, 43.0, 41.0, 53.0, 38.0, 44.0, 39.0, 33.0, 30.0, 23.0, 18.0, 22.0, 14.0, 10.0, 16.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.79058837890625, -2.6925048828125, -2.59442138671875, -2.496337890625, -2.39825439453125, -2.3001708984375, -2.20208740234375, -2.10400390625, -2.00592041015625, -1.9078369140625, -1.80975341796875, -1.711669921875, -1.61358642578125, -1.5155029296875, -1.41741943359375, -1.3193359375, -1.22125244140625, -1.1231689453125, -1.02508544921875, -0.927001953125, -0.82891845703125, -0.7308349609375, -0.63275146484375, -0.53466796875, -0.43658447265625, -0.3385009765625, -0.24041748046875, -0.142333984375, -0.04425048828125, 0.0538330078125, 0.15191650390625, 0.25, 0.34808349609375, 0.4461669921875, 0.54425048828125, 0.642333984375, 0.74041748046875, 0.8385009765625, 0.93658447265625, 1.03466796875, 1.13275146484375, 1.2308349609375, 1.32891845703125, 1.427001953125, 1.52508544921875, 1.6231689453125, 1.72125244140625, 1.8193359375, 1.91741943359375, 2.0155029296875, 2.11358642578125, 2.211669921875, 2.30975341796875, 2.4078369140625, 2.50592041015625, 2.60400390625, 2.70208740234375, 2.8001708984375, 2.89825439453125, 2.996337890625, 3.09442138671875, 3.1925048828125, 3.29058837890625, 3.388671875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 9.0, 14.0, 13.0, 10.0, 20.0, 27.0, 43.0, 56.0, 81.0, 109.0, 120.0, 202.0, 281.0, 347.0, 509.0, 754.0, 1079.0, 1412.0, 2122.0, 3086.0, 4710.0, 7170.0, 11399.0, 19182.0, 33769.0, 70879.0, 296425.0, 417817.0, 82412.0, 37907.0, 20442.0, 12356.0, 7667.0, 5030.0, 3348.0, 2303.0, 1494.0, 1129.0, 802.0, 552.0, 403.0, 313.0, 205.0, 144.0, 107.0, 83.0, 51.0, 46.0, 35.0, 26.0, 19.0, 13.0, 11.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.203125, -4.06341552734375, -3.9237060546875, -3.78399658203125, -3.644287109375, -3.50457763671875, -3.3648681640625, -3.22515869140625, -3.08544921875, -2.94573974609375, -2.8060302734375, -2.66632080078125, -2.526611328125, -2.38690185546875, -2.2471923828125, -2.10748291015625, -1.9677734375, -1.82806396484375, -1.6883544921875, -1.54864501953125, -1.408935546875, -1.26922607421875, -1.1295166015625, -0.98980712890625, -0.85009765625, -0.71038818359375, -0.5706787109375, -0.43096923828125, -0.291259765625, -0.15155029296875, -0.0118408203125, 0.12786865234375, 0.267578125, 0.40728759765625, 0.5469970703125, 0.68670654296875, 0.826416015625, 0.96612548828125, 1.1058349609375, 1.24554443359375, 1.38525390625, 1.52496337890625, 1.6646728515625, 1.80438232421875, 1.944091796875, 2.08380126953125, 2.2235107421875, 2.36322021484375, 2.5029296875, 2.64263916015625, 2.7823486328125, 2.92205810546875, 3.061767578125, 3.20147705078125, 3.3411865234375, 3.48089599609375, 3.62060546875, 3.76031494140625, 3.9000244140625, 4.03973388671875, 4.179443359375, 4.31915283203125, 4.4588623046875, 4.59857177734375, 4.73828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 4.0, 3.0, 12.0, 19.0, 14.0, 17.0, 27.0, 23.0, 18.0, 17.0, 30.0, 44.0, 47.0, 37.0, 48.0, 52.0, 38.0, 56.0, 1067.0, 36.0, 53.0, 25.0, 42.0, 39.0, 31.0, 29.0, 24.0, 27.0, 30.0, 16.0, 14.0, 13.0, 10.0, 7.0, 13.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.333984375, -2.256988525390625, -2.17999267578125, -2.102996826171875, -2.0260009765625, -1.949005126953125, -1.87200927734375, -1.795013427734375, -1.718017578125, -1.641021728515625, -1.56402587890625, -1.487030029296875, -1.4100341796875, -1.333038330078125, -1.25604248046875, -1.179046630859375, -1.10205078125, -1.025054931640625, -0.94805908203125, -0.871063232421875, -0.7940673828125, -0.717071533203125, -0.64007568359375, -0.563079833984375, -0.486083984375, -0.409088134765625, -0.33209228515625, -0.255096435546875, -0.1781005859375, -0.101104736328125, -0.02410888671875, 0.052886962890625, 0.1298828125, 0.206878662109375, 0.28387451171875, 0.360870361328125, 0.4378662109375, 0.514862060546875, 0.59185791015625, 0.668853759765625, 0.745849609375, 0.822845458984375, 0.89984130859375, 0.976837158203125, 1.0538330078125, 1.130828857421875, 1.20782470703125, 1.284820556640625, 1.36181640625, 1.438812255859375, 1.51580810546875, 1.592803955078125, 1.6697998046875, 1.746795654296875, 1.82379150390625, 1.900787353515625, 1.977783203125, 2.054779052734375, 2.13177490234375, 2.208770751953125, 2.2857666015625, 2.362762451171875, 2.43975830078125, 2.516754150390625, 2.59375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 4.0, 5.0, 11.0, 22.0, 20.0, 38.0, 55.0, 70.0, 99.0, 161.0, 230.0, 337.0, 476.0, 754.0, 1192.0, 1908.0, 3155.0, 5493.0, 10518.0, 22086.0, 65521.0, 1396340.0, 496896.0, 50520.0, 18925.0, 9252.0, 5068.0, 2924.0, 1766.0, 1114.0, 706.0, 472.0, 283.0, 238.0, 152.0, 74.0, 81.0, 57.0, 31.0, 24.0, 20.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.546875, -5.39239501953125, -5.2379150390625, -5.08343505859375, -4.928955078125, -4.77447509765625, -4.6199951171875, -4.46551513671875, -4.31103515625, -4.15655517578125, -4.0020751953125, -3.84759521484375, -3.693115234375, -3.53863525390625, -3.3841552734375, -3.22967529296875, -3.0751953125, -2.92071533203125, -2.7662353515625, -2.61175537109375, -2.457275390625, -2.30279541015625, -2.1483154296875, -1.99383544921875, -1.83935546875, -1.68487548828125, -1.5303955078125, -1.37591552734375, -1.221435546875, -1.06695556640625, -0.9124755859375, -0.75799560546875, -0.603515625, -0.44903564453125, -0.2945556640625, -0.14007568359375, 0.014404296875, 0.16888427734375, 0.3233642578125, 0.47784423828125, 0.63232421875, 0.78680419921875, 0.9412841796875, 1.09576416015625, 1.250244140625, 1.40472412109375, 1.5592041015625, 1.71368408203125, 1.8681640625, 2.02264404296875, 2.1771240234375, 2.33160400390625, 2.486083984375, 2.64056396484375, 2.7950439453125, 2.94952392578125, 3.10400390625, 3.25848388671875, 3.4129638671875, 3.56744384765625, 3.721923828125, 3.87640380859375, 4.0308837890625, 4.18536376953125, 4.33984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 5.0, 11.0, 29.0, 93.0, 264.0, 382.0, 117.0, 41.0, 12.0, 7.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.923828125, -1.85784912109375, -1.7918701171875, -1.72589111328125, -1.659912109375, -1.59393310546875, -1.5279541015625, -1.46197509765625, -1.39599609375, -1.33001708984375, -1.2640380859375, -1.19805908203125, -1.132080078125, -1.06610107421875, -1.0001220703125, -0.93414306640625, -0.8681640625, -0.80218505859375, -0.7362060546875, -0.67022705078125, -0.604248046875, -0.53826904296875, -0.4722900390625, -0.40631103515625, -0.34033203125, -0.27435302734375, -0.2083740234375, -0.14239501953125, -0.076416015625, -0.01043701171875, 0.0555419921875, 0.12152099609375, 0.1875, 0.25347900390625, 0.3194580078125, 0.38543701171875, 0.451416015625, 0.51739501953125, 0.5833740234375, 0.64935302734375, 0.71533203125, 0.78131103515625, 0.8472900390625, 0.91326904296875, 0.979248046875, 1.04522705078125, 1.1112060546875, 1.17718505859375, 1.2431640625, 1.30914306640625, 1.3751220703125, 1.44110107421875, 1.507080078125, 1.57305908203125, 1.6390380859375, 1.70501708984375, 1.77099609375, 1.83697509765625, 1.9029541015625, 1.96893310546875, 2.034912109375, 2.10089111328125, 2.1668701171875, 2.23284912109375, 2.298828125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 11.0, 19.0, 22.0, 67.0, 288.0, 2357.0, 1013239.0, 31074.0, 1174.0, 188.0, 33.0, 18.0, 15.0, 13.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.375, -42.13037109375, -40.8857421875, -39.64111328125, -38.396484375, -37.15185546875, -35.9072265625, -34.66259765625, -33.41796875, -32.17333984375, -30.9287109375, -29.68408203125, -28.439453125, -27.19482421875, -25.9501953125, -24.70556640625, -23.4609375, -22.21630859375, -20.9716796875, -19.72705078125, -18.482421875, -17.23779296875, -15.9931640625, -14.74853515625, -13.50390625, -12.25927734375, -11.0146484375, -9.77001953125, -8.525390625, -7.28076171875, -6.0361328125, -4.79150390625, -3.546875, -2.30224609375, -1.0576171875, 0.18701171875, 1.431640625, 2.67626953125, 3.9208984375, 5.16552734375, 6.41015625, 7.65478515625, 8.8994140625, 10.14404296875, 11.388671875, 12.63330078125, 13.8779296875, 15.12255859375, 16.3671875, 17.61181640625, 18.8564453125, 20.10107421875, 21.345703125, 22.59033203125, 23.8349609375, 25.07958984375, 26.32421875, 27.56884765625, 28.8134765625, 30.05810546875, 31.302734375, 32.54736328125, 33.7919921875, 35.03662109375, 36.28125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 12.0, 20.0, 24.0, 39.0, 62.0, 140.0, 210.0, 216.0, 115.0, 52.0, 33.0, 28.0, 10.0, 7.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7362329959869385, -3.644993305206299, -3.55375337600708, -3.4625136852264404, -3.3712737560272217, -3.280034065246582, -3.1887941360473633, -3.0975544452667236, -3.006314754486084, -2.9150750637054443, -2.8238351345062256, -2.732595443725586, -2.641355514526367, -2.5501158237457275, -2.458876132965088, -2.367636203765869, -2.2763962745666504, -2.1851565837860107, -2.093916654586792, -2.0026769638061523, -1.9114370346069336, -1.820197343826294, -1.7289575338363647, -1.6377177238464355, -1.5464779138565063, -1.4552381038665771, -1.363998293876648, -1.2727584838867188, -1.181518793106079, -1.0902788639068604, -0.9990391731262207, -0.9077993631362915, -0.8165597915649414, -0.7253199815750122, -0.634080171585083, -0.5428404211997986, -0.4516006112098694, -0.3603608012199402, -0.26912105083465576, -0.17788124084472656, -0.08664143085479736, 0.004598364233970642, 0.09583815932273865, 0.18707793951034546, 0.27831774950027466, 0.36955755949020386, 0.4607973098754883, 0.5520371198654175, 0.6432769298553467, 0.7345167398452759, 0.8257565498352051, 0.9169963002204895, 1.0082361698150635, 1.0994758605957031, 1.1907156705856323, 1.2819554805755615, 1.3731952905654907, 1.46443510055542, 1.5556749105453491, 1.6469147205352783, 1.738154411315918, 1.8293943405151367, 1.9206340312957764, 2.011873722076416, 2.1031136512756348]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 12.0, 16.0, 18.0, 28.0, 13.0, 25.0, 31.0, 25.0, 38.0, 27.0, 39.0, 35.0, 41.0, 35.0, 37.0, 37.0, 37.0, 43.0, 34.0, 46.0, 45.0, 23.0, 36.0, 31.0, 20.0, 27.0, 20.0, 18.0, 18.0, 18.0, 17.0, 9.0, 3.0, 10.0, 8.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1061121225357056, -1.0673414468765259, -1.0285708904266357, -0.989800214767456, -0.9510295391082764, -0.9122588634490967, -0.8734882473945618, -0.8347176313400269, -0.7959469556808472, -0.7571762800216675, -0.7184056639671326, -0.6796350479125977, -0.640864372253418, -0.6020936965942383, -0.5633230805397034, -0.5245524644851685, -0.48578178882598877, -0.44701114296913147, -0.40824049711227417, -0.36946985125541687, -0.33069920539855957, -0.29192855954170227, -0.25315791368484497, -0.21438726782798767, -0.17561662197113037, -0.13684597611427307, -0.09807533025741577, -0.05930468440055847, -0.020534038543701172, 0.018236607313156128, 0.05700725317001343, 0.09577789902687073, 0.13454842567443848, 0.17331907153129578, 0.21208971738815308, 0.2508603632450104, 0.2896310091018677, 0.328401654958725, 0.3671723008155823, 0.4059429466724396, 0.4447135925292969, 0.4834842383861542, 0.5222548842430115, 0.5610255002975464, 0.5997961759567261, 0.6385668516159058, 0.6773374676704407, 0.7161080837249756, 0.7548787593841553, 0.793649435043335, 0.8324200510978699, 0.8711906671524048, 0.9099613428115845, 0.9487320184707642, 0.9875026345252991, 1.026273250579834, 1.0650439262390137, 1.1038146018981934, 1.142585277557373, 1.1813558340072632, 1.2201265096664429, 1.2588971853256226, 1.2976677417755127, 1.3364384174346924, 1.375209093093872]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 1.0, 6.0, 7.0, 11.0, 15.0, 21.0, 21.0, 19.0, 27.0, 27.0, 27.0, 41.0, 38.0, 34.0, 33.0, 46.0, 39.0, 36.0, 51.0, 43.0, 54.0, 48.0, 42.0, 34.0, 46.0, 30.0, 37.0, 32.0, 22.0, 15.0, 16.0, 18.0, 12.0, 5.0, 4.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -2.994903564453125, -2.89996337890625, -2.805023193359375, -2.7100830078125, -2.615142822265625, -2.52020263671875, -2.425262451171875, -2.330322265625, -2.235382080078125, -2.14044189453125, -2.045501708984375, -1.9505615234375, -1.855621337890625, -1.76068115234375, -1.665740966796875, -1.57080078125, -1.475860595703125, -1.38092041015625, -1.285980224609375, -1.1910400390625, -1.096099853515625, -1.00115966796875, -0.906219482421875, -0.811279296875, -0.716339111328125, -0.62139892578125, -0.526458740234375, -0.4315185546875, -0.336578369140625, -0.24163818359375, -0.146697998046875, -0.0517578125, 0.043182373046875, 0.13812255859375, 0.233062744140625, 0.3280029296875, 0.422943115234375, 0.51788330078125, 0.612823486328125, 0.707763671875, 0.802703857421875, 0.89764404296875, 0.992584228515625, 1.0875244140625, 1.182464599609375, 1.27740478515625, 1.372344970703125, 1.46728515625, 1.562225341796875, 1.65716552734375, 1.752105712890625, 1.8470458984375, 1.941986083984375, 2.03692626953125, 2.131866455078125, 2.226806640625, 2.321746826171875, 2.41668701171875, 2.511627197265625, 2.6065673828125, 2.701507568359375, 2.79644775390625, 2.891387939453125, 2.986328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 16.0, 13.0, 20.0, 31.0, 38.0, 56.0, 72.0, 88.0, 150.0, 195.0, 296.0, 450.0, 668.0, 1083.0, 1888.0, 3350.0, 6361.0, 13076.0, 30335.0, 88294.0, 455232.0, 324358.0, 71486.0, 25855.0, 11640.0, 5749.0, 3004.0, 1699.0, 1050.0, 615.0, 387.0, 286.0, 191.0, 147.0, 108.0, 83.0, 44.0, 32.0, 27.0, 16.0, 13.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-5.60546875, -5.440185546875, -5.27490234375, -5.109619140625, -4.9443359375, -4.779052734375, -4.61376953125, -4.448486328125, -4.283203125, -4.117919921875, -3.95263671875, -3.787353515625, -3.6220703125, -3.456787109375, -3.29150390625, -3.126220703125, -2.9609375, -2.795654296875, -2.63037109375, -2.465087890625, -2.2998046875, -2.134521484375, -1.96923828125, -1.803955078125, -1.638671875, -1.473388671875, -1.30810546875, -1.142822265625, -0.9775390625, -0.812255859375, -0.64697265625, -0.481689453125, -0.31640625, -0.151123046875, 0.01416015625, 0.179443359375, 0.3447265625, 0.510009765625, 0.67529296875, 0.840576171875, 1.005859375, 1.171142578125, 1.33642578125, 1.501708984375, 1.6669921875, 1.832275390625, 1.99755859375, 2.162841796875, 2.328125, 2.493408203125, 2.65869140625, 2.823974609375, 2.9892578125, 3.154541015625, 3.31982421875, 3.485107421875, 3.650390625, 3.815673828125, 3.98095703125, 4.146240234375, 4.3115234375, 4.476806640625, 4.64208984375, 4.807373046875, 4.97265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 3.0, 13.0, 8.0, 14.0, 13.0, 15.0, 17.0, 21.0, 22.0, 23.0, 23.0, 34.0, 42.0, 44.0, 43.0, 66.0, 77.0, 146.0, 336.0, 1393.0, 143.0, 76.0, 65.0, 43.0, 44.0, 44.0, 43.0, 40.0, 32.0, 27.0, 17.0, 15.0, 21.0, 11.0, 2.0, 10.0, 15.0, 7.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.28125, -8.98193359375, -8.6826171875, -8.38330078125, -8.083984375, -7.78466796875, -7.4853515625, -7.18603515625, -6.88671875, -6.58740234375, -6.2880859375, -5.98876953125, -5.689453125, -5.39013671875, -5.0908203125, -4.79150390625, -4.4921875, -4.19287109375, -3.8935546875, -3.59423828125, -3.294921875, -2.99560546875, -2.6962890625, -2.39697265625, -2.09765625, -1.79833984375, -1.4990234375, -1.19970703125, -0.900390625, -0.60107421875, -0.3017578125, -0.00244140625, 0.296875, 0.59619140625, 0.8955078125, 1.19482421875, 1.494140625, 1.79345703125, 2.0927734375, 2.39208984375, 2.69140625, 2.99072265625, 3.2900390625, 3.58935546875, 3.888671875, 4.18798828125, 4.4873046875, 4.78662109375, 5.0859375, 5.38525390625, 5.6845703125, 5.98388671875, 6.283203125, 6.58251953125, 6.8818359375, 7.18115234375, 7.48046875, 7.77978515625, 8.0791015625, 8.37841796875, 8.677734375, 8.97705078125, 9.2763671875, 9.57568359375, 9.875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 10.0, 16.0, 14.0, 21.0, 38.0, 30.0, 62.0, 88.0, 111.0, 185.0, 343.0, 746.0, 2014.0, 9220.0, 126202.0, 2919810.0, 76425.0, 7107.0, 1737.0, 659.0, 292.0, 175.0, 88.0, 70.0, 63.0, 42.0, 28.0, 24.0, 17.0, 13.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.15673828125, -17.4697265625, -16.78271484375, -16.095703125, -15.40869140625, -14.7216796875, -14.03466796875, -13.34765625, -12.66064453125, -11.9736328125, -11.28662109375, -10.599609375, -9.91259765625, -9.2255859375, -8.53857421875, -7.8515625, -7.16455078125, -6.4775390625, -5.79052734375, -5.103515625, -4.41650390625, -3.7294921875, -3.04248046875, -2.35546875, -1.66845703125, -0.9814453125, -0.29443359375, 0.392578125, 1.07958984375, 1.7666015625, 2.45361328125, 3.140625, 3.82763671875, 4.5146484375, 5.20166015625, 5.888671875, 6.57568359375, 7.2626953125, 7.94970703125, 8.63671875, 9.32373046875, 10.0107421875, 10.69775390625, 11.384765625, 12.07177734375, 12.7587890625, 13.44580078125, 14.1328125, 14.81982421875, 15.5068359375, 16.19384765625, 16.880859375, 17.56787109375, 18.2548828125, 18.94189453125, 19.62890625, 20.31591796875, 21.0029296875, 21.68994140625, 22.376953125, 23.06396484375, 23.7509765625, 24.43798828125, 25.125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 34.0, 769.0, 209.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.653095245361328, -17.30721664428711, -10.961339950561523, -4.6154632568359375, 1.7304153442382812, 8.0762939453125, 14.422168731689453, 20.768047332763672, 27.11392593383789, 33.45980453491211, 39.80567932128906, 46.15155792236328, 52.4974365234375, 58.84331512451172, 65.18919372558594, 71.53506469726562, 77.88095092773438, 84.2268295288086, 90.57270812988281, 96.9185791015625, 103.26446533203125, 109.61033630371094, 115.95621490478516, 122.30209350585938, 128.64796447753906, 134.99383544921875, 141.3397216796875, 147.6855926513672, 154.03147888183594, 160.37734985351562, 166.72323608398438, 173.06910705566406, 179.41497802734375, 185.76084899902344, 192.1067352294922, 198.45260620117188, 204.79849243164062, 211.1443634033203, 217.490234375, 223.83612060546875, 230.1820068359375, 236.5278778076172, 242.87376403808594, 249.21963500976562, 255.56552124023438, 261.9114074707031, 268.25726318359375, 274.6031494140625, 280.94903564453125, 287.294921875, 293.6407775878906, 299.9866638183594, 306.3325500488281, 312.6784362792969, 319.0242919921875, 325.37017822265625, 331.7160339355469, 338.0619201660156, 344.40777587890625, 350.753662109375, 357.09954833984375, 363.4454345703125, 369.7912902832031, 376.1371765136719, 382.4830627441406]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 9.0, 7.0, 12.0, 23.0, 21.0, 23.0, 25.0, 32.0, 35.0, 27.0, 35.0, 34.0, 35.0, 45.0, 50.0, 37.0, 47.0, 39.0, 40.0, 40.0, 39.0, 37.0, 27.0, 46.0, 23.0, 30.0, 30.0, 18.0, 25.0, 19.0, 16.0, 6.0, 7.0, 11.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.468902587890625, -31.489551544189453, -30.51020050048828, -29.53084945678711, -28.551498413085938, -27.572147369384766, -26.592798233032227, -25.613447189331055, -24.634096145629883, -23.65474510192871, -22.67539405822754, -21.696043014526367, -20.716693878173828, -19.737342834472656, -18.757991790771484, -17.778640747070312, -16.79928970336914, -15.819938659667969, -14.840587615966797, -13.861237525939941, -12.88188648223877, -11.902535438537598, -10.923185348510742, -9.94383430480957, -8.964483261108398, -7.985132217407227, -7.005781650543213, -6.026431083679199, -5.047080039978027, -4.0677289962768555, -3.088378429412842, -2.109027862548828, -1.129678726196289, -0.1503279209136963, 0.8290228843688965, 1.8083736896514893, 2.787724494934082, 3.767075538635254, 4.746426105499268, 5.725776672363281, 6.705127716064453, 7.684478759765625, 8.663829803466797, 9.643179893493652, 10.622530937194824, 11.601881980895996, 12.581232070922852, 13.560583114624023, 14.539934158325195, 15.519285202026367, 16.49863624572754, 17.47798728942871, 18.45733642578125, 19.436687469482422, 20.416038513183594, 21.395389556884766, 22.374740600585938, 23.35409164428711, 24.33344268798828, 25.312793731689453, 26.292144775390625, 27.271495819091797, 28.250844955444336, 29.230195999145508, 30.20954704284668]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 7.0, 10.0, 11.0, 14.0, 12.0, 21.0, 23.0, 19.0, 25.0, 21.0, 31.0, 27.0, 29.0, 35.0, 40.0, 31.0, 32.0, 38.0, 45.0, 53.0, 54.0, 39.0, 35.0, 46.0, 28.0, 36.0, 30.0, 28.0, 25.0, 26.0, 25.0, 12.0, 14.0, 14.0, 15.0, 8.0, 14.0, 12.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.91796875, -2.821807861328125, -2.72564697265625, -2.629486083984375, -2.5333251953125, -2.437164306640625, -2.34100341796875, -2.244842529296875, -2.148681640625, -2.052520751953125, -1.95635986328125, -1.860198974609375, -1.7640380859375, -1.667877197265625, -1.57171630859375, -1.475555419921875, -1.37939453125, -1.283233642578125, -1.18707275390625, -1.090911865234375, -0.9947509765625, -0.898590087890625, -0.80242919921875, -0.706268310546875, -0.610107421875, -0.513946533203125, -0.41778564453125, -0.321624755859375, -0.2254638671875, -0.129302978515625, -0.03314208984375, 0.063018798828125, 0.1591796875, 0.255340576171875, 0.35150146484375, 0.447662353515625, 0.5438232421875, 0.639984130859375, 0.73614501953125, 0.832305908203125, 0.928466796875, 1.024627685546875, 1.12078857421875, 1.216949462890625, 1.3131103515625, 1.409271240234375, 1.50543212890625, 1.601593017578125, 1.69775390625, 1.793914794921875, 1.89007568359375, 1.986236572265625, 2.0823974609375, 2.178558349609375, 2.27471923828125, 2.370880126953125, 2.467041015625, 2.563201904296875, 2.65936279296875, 2.755523681640625, 2.8516845703125, 2.947845458984375, 3.04400634765625, 3.140167236328125, 3.236328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 3.0, 7.0, 9.0, 19.0, 25.0, 50.0, 69.0, 88.0, 148.0, 236.0, 324.0, 512.0, 777.0, 1328.0, 2218.0, 3888.0, 7189.0, 13124.0, 26238.0, 61253.0, 262474.0, 1811125.0, 1664721.0, 229785.0, 55583.0, 24292.0, 12325.0, 6724.0, 3719.0, 2227.0, 1390.0, 889.0, 527.0, 331.0, 212.0, 122.0, 112.0, 74.0, 49.0, 35.0, 24.0, 17.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96484375, -5.76580810546875, -5.5667724609375, -5.36773681640625, -5.168701171875, -4.96966552734375, -4.7706298828125, -4.57159423828125, -4.37255859375, -4.17352294921875, -3.9744873046875, -3.77545166015625, -3.576416015625, -3.37738037109375, -3.1783447265625, -2.97930908203125, -2.7802734375, -2.58123779296875, -2.3822021484375, -2.18316650390625, -1.984130859375, -1.78509521484375, -1.5860595703125, -1.38702392578125, -1.18798828125, -0.98895263671875, -0.7899169921875, -0.59088134765625, -0.391845703125, -0.19281005859375, 0.0062255859375, 0.20526123046875, 0.404296875, 0.60333251953125, 0.8023681640625, 1.00140380859375, 1.200439453125, 1.39947509765625, 1.5985107421875, 1.79754638671875, 1.99658203125, 2.19561767578125, 2.3946533203125, 2.59368896484375, 2.792724609375, 2.99176025390625, 3.1907958984375, 3.38983154296875, 3.5888671875, 3.78790283203125, 3.9869384765625, 4.18597412109375, 4.385009765625, 4.58404541015625, 4.7830810546875, 4.98211669921875, 5.18115234375, 5.38018798828125, 5.5792236328125, 5.77825927734375, 5.977294921875, 6.17633056640625, 6.3753662109375, 6.57440185546875, 6.7734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 12.0, 18.0, 26.0, 24.0, 42.0, 38.0, 51.0, 57.0, 94.0, 106.0, 207.0, 360.0, 517.0, 685.0, 590.0, 375.0, 236.0, 155.0, 85.0, 86.0, 51.0, 43.0, 46.0, 31.0, 18.0, 15.0, 15.0, 16.0, 7.0, 6.0, 2.0, 10.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86138916015625, -5.6329345703125, -5.40447998046875, -5.176025390625, -4.94757080078125, -4.7191162109375, -4.49066162109375, -4.26220703125, -4.03375244140625, -3.8052978515625, -3.57684326171875, -3.348388671875, -3.11993408203125, -2.8914794921875, -2.66302490234375, -2.4345703125, -2.20611572265625, -1.9776611328125, -1.74920654296875, -1.520751953125, -1.29229736328125, -1.0638427734375, -0.83538818359375, -0.60693359375, -0.37847900390625, -0.1500244140625, 0.07843017578125, 0.306884765625, 0.53533935546875, 0.7637939453125, 0.99224853515625, 1.220703125, 1.44915771484375, 1.6776123046875, 1.90606689453125, 2.134521484375, 2.36297607421875, 2.5914306640625, 2.81988525390625, 3.04833984375, 3.27679443359375, 3.5052490234375, 3.73370361328125, 3.962158203125, 4.19061279296875, 4.4190673828125, 4.64752197265625, 4.8759765625, 5.10443115234375, 5.3328857421875, 5.56134033203125, 5.789794921875, 6.01824951171875, 6.2467041015625, 6.47515869140625, 6.70361328125, 6.93206787109375, 7.1605224609375, 7.38897705078125, 7.617431640625, 7.84588623046875, 8.0743408203125, 8.30279541015625, 8.53125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 5.0, 1.0, 11.0, 13.0, 15.0, 15.0, 21.0, 32.0, 38.0, 57.0, 73.0, 160.0, 306.0, 952.0, 4114.0, 25760.0, 339750.0, 3681674.0, 123746.0, 13763.0, 2507.0, 611.0, 232.0, 114.0, 74.0, 50.0, 37.0, 37.0, 29.0, 13.0, 11.0, 11.0, 12.0, 3.0, 8.0, 8.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0], "bins": [-27.09375, -26.3681640625, -25.642578125, -24.9169921875, -24.19140625, -23.4658203125, -22.740234375, -22.0146484375, -21.2890625, -20.5634765625, -19.837890625, -19.1123046875, -18.38671875, -17.6611328125, -16.935546875, -16.2099609375, -15.484375, -14.7587890625, -14.033203125, -13.3076171875, -12.58203125, -11.8564453125, -11.130859375, -10.4052734375, -9.6796875, -8.9541015625, -8.228515625, -7.5029296875, -6.77734375, -6.0517578125, -5.326171875, -4.6005859375, -3.875, -3.1494140625, -2.423828125, -1.6982421875, -0.97265625, -0.2470703125, 0.478515625, 1.2041015625, 1.9296875, 2.6552734375, 3.380859375, 4.1064453125, 4.83203125, 5.5576171875, 6.283203125, 7.0087890625, 7.734375, 8.4599609375, 9.185546875, 9.9111328125, 10.63671875, 11.3623046875, 12.087890625, 12.8134765625, 13.5390625, 14.2646484375, 14.990234375, 15.7158203125, 16.44140625, 17.1669921875, 17.892578125, 18.6181640625, 19.34375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 9.0, 14.0, 30.0, 72.0, 97.0, 120.0, 172.0, 179.0, 131.0, 66.0, 47.0, 22.0, 9.0, 12.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.42725372314453, -44.872169494628906, -43.31708526611328, -41.76200485229492, -40.2069206237793, -38.65183639526367, -37.09675598144531, -35.54167175292969, -33.98658752441406, -32.43150329589844, -30.876420974731445, -29.321338653564453, -27.766254425048828, -26.211170196533203, -24.65608787536621, -23.10100555419922, -21.545921325683594, -19.99083709716797, -18.435754776000977, -16.880672454833984, -15.32558822631836, -13.77050495147705, -12.215421676635742, -10.660338401794434, -9.105255126953125, -7.550171852111816, -5.995088577270508, -4.440005302429199, -2.8849220275878906, -1.329838752746582, 0.22524452209472656, 1.7803277969360352, 3.3354110717773438, 4.890494346618652, 6.445577621459961, 8.00066089630127, 9.555744171142578, 11.110827445983887, 12.665910720825195, 14.220993995666504, 15.776077270507812, 17.331161499023438, 18.88624382019043, 20.441326141357422, 21.996410369873047, 23.551494598388672, 25.106576919555664, 26.661659240722656, 28.21674346923828, 29.771827697753906, 31.3269100189209, 32.88199234008789, 34.437076568603516, 35.99216079711914, 37.5472412109375, 39.102325439453125, 40.65740966796875, 42.212493896484375, 43.767578125, 45.32265853881836, 46.877742767333984, 48.43282699584961, 49.98790740966797, 51.542991638183594, 53.09807586669922]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 7.0, 7.0, 11.0, 13.0, 12.0, 15.0, 14.0, 26.0, 26.0, 41.0, 28.0, 36.0, 27.0, 40.0, 46.0, 54.0, 48.0, 46.0, 49.0, 30.0, 43.0, 50.0, 41.0, 40.0, 32.0, 21.0, 17.0, 30.0, 24.0, 16.0, 14.0, 16.0, 15.0, 9.0, 16.0, 5.0, 9.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.067045211791992, -24.29473876953125, -23.522430419921875, -22.750123977661133, -21.97781753540039, -21.20551109313965, -20.433202743530273, -19.66089630126953, -18.88858985900879, -18.116283416748047, -17.343975067138672, -16.57166862487793, -15.799362182617188, -15.027054786682129, -14.25474739074707, -13.482440948486328, -12.71013355255127, -11.937826156616211, -11.165519714355469, -10.39321231842041, -9.620905876159668, -8.84859848022461, -8.076292037963867, -7.303984642028809, -6.531677722930908, -5.759370803833008, -4.987063884735107, -4.214756965637207, -3.4424498081207275, -2.670142889022827, -1.8978357315063477, -1.1255288124084473, -0.3532218933105469, 0.4190850853919983, 1.1913920640945435, 1.9636991024017334, 2.736006021499634, 3.508312940597534, 4.280620098114014, 5.052927017211914, 5.8252339363098145, 6.597540855407715, 7.369847774505615, 8.142154693603516, 8.914462089538574, 9.686768531799316, 10.459075927734375, 11.231382369995117, 12.003689765930176, 12.775997161865234, 13.548303604125977, 14.320611000061035, 15.092917442321777, 15.865224838256836, 16.637531280517578, 17.409839630126953, 18.182146072387695, 18.954452514648438, 19.726760864257812, 20.499067306518555, 21.271373748779297, 22.04368019104004, 22.815988540649414, 23.588294982910156, 24.3606014251709]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 5.0, 6.0, 17.0, 10.0, 15.0, 23.0, 19.0, 26.0, 30.0, 29.0, 27.0, 27.0, 54.0, 41.0, 41.0, 51.0, 45.0, 47.0, 38.0, 42.0, 51.0, 46.0, 35.0, 33.0, 20.0, 37.0, 27.0, 27.0, 16.0, 22.0, 19.0, 15.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.171875, -3.074005126953125, -2.97613525390625, -2.878265380859375, -2.7803955078125, -2.682525634765625, -2.58465576171875, -2.486785888671875, -2.388916015625, -2.291046142578125, -2.19317626953125, -2.095306396484375, -1.9974365234375, -1.899566650390625, -1.80169677734375, -1.703826904296875, -1.60595703125, -1.508087158203125, -1.41021728515625, -1.312347412109375, -1.2144775390625, -1.116607666015625, -1.01873779296875, -0.920867919921875, -0.822998046875, -0.725128173828125, -0.62725830078125, -0.529388427734375, -0.4315185546875, -0.333648681640625, -0.23577880859375, -0.137908935546875, -0.0400390625, 0.057830810546875, 0.15570068359375, 0.253570556640625, 0.3514404296875, 0.449310302734375, 0.54718017578125, 0.645050048828125, 0.742919921875, 0.840789794921875, 0.93865966796875, 1.036529541015625, 1.1343994140625, 1.232269287109375, 1.33013916015625, 1.428009033203125, 1.52587890625, 1.623748779296875, 1.72161865234375, 1.819488525390625, 1.9173583984375, 2.015228271484375, 2.11309814453125, 2.210968017578125, 2.308837890625, 2.406707763671875, 2.50457763671875, 2.602447509765625, 2.7003173828125, 2.798187255859375, 2.89605712890625, 2.993927001953125, 3.091796875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 12.0, 19.0, 17.0, 34.0, 30.0, 58.0, 48.0, 73.0, 111.0, 130.0, 176.0, 262.0, 384.0, 531.0, 732.0, 1053.0, 1446.0, 2225.0, 3469.0, 5939.0, 13468.0, 56814.0, 526579.0, 367296.0, 40773.0, 11307.0, 5430.0, 3244.0, 2006.0, 1451.0, 962.0, 630.0, 479.0, 347.0, 277.0, 203.0, 141.0, 101.0, 72.0, 53.0, 55.0, 29.0, 16.0, 11.0, 17.0, 10.0, 7.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.30078125, -4.17010498046875, -4.0394287109375, -3.90875244140625, -3.778076171875, -3.64739990234375, -3.5167236328125, -3.38604736328125, -3.25537109375, -3.12469482421875, -2.9940185546875, -2.86334228515625, -2.732666015625, -2.60198974609375, -2.4713134765625, -2.34063720703125, -2.2099609375, -2.07928466796875, -1.9486083984375, -1.81793212890625, -1.687255859375, -1.55657958984375, -1.4259033203125, -1.29522705078125, -1.16455078125, -1.03387451171875, -0.9031982421875, -0.77252197265625, -0.641845703125, -0.51116943359375, -0.3804931640625, -0.24981689453125, -0.119140625, 0.01153564453125, 0.1422119140625, 0.27288818359375, 0.403564453125, 0.53424072265625, 0.6649169921875, 0.79559326171875, 0.92626953125, 1.05694580078125, 1.1876220703125, 1.31829833984375, 1.448974609375, 1.57965087890625, 1.7103271484375, 1.84100341796875, 1.9716796875, 2.10235595703125, 2.2330322265625, 2.36370849609375, 2.494384765625, 2.62506103515625, 2.7557373046875, 2.88641357421875, 3.01708984375, 3.14776611328125, 3.2784423828125, 3.40911865234375, 3.539794921875, 3.67047119140625, 3.8011474609375, 3.93182373046875, 4.0625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 16.0, 17.0, 26.0, 20.0, 16.0, 30.0, 42.0, 37.0, 32.0, 29.0, 48.0, 26.0, 31.0, 34.0, 1067.0, 49.0, 39.0, 37.0, 41.0, 36.0, 33.0, 32.0, 29.0, 22.0, 25.0, 18.0, 19.0, 20.0, 19.0, 20.0, 6.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.1060791015625, -2.034423828125, -1.9627685546875, -1.89111328125, -1.8194580078125, -1.747802734375, -1.6761474609375, -1.6044921875, -1.5328369140625, -1.461181640625, -1.3895263671875, -1.31787109375, -1.2462158203125, -1.174560546875, -1.1029052734375, -1.03125, -0.9595947265625, -0.887939453125, -0.8162841796875, -0.74462890625, -0.6729736328125, -0.601318359375, -0.5296630859375, -0.4580078125, -0.3863525390625, -0.314697265625, -0.2430419921875, -0.17138671875, -0.0997314453125, -0.028076171875, 0.0435791015625, 0.115234375, 0.1868896484375, 0.258544921875, 0.3302001953125, 0.40185546875, 0.4735107421875, 0.545166015625, 0.6168212890625, 0.6884765625, 0.7601318359375, 0.831787109375, 0.9034423828125, 0.97509765625, 1.0467529296875, 1.118408203125, 1.1900634765625, 1.26171875, 1.3333740234375, 1.405029296875, 1.4766845703125, 1.54833984375, 1.6199951171875, 1.691650390625, 1.7633056640625, 1.8349609375, 1.9066162109375, 1.978271484375, 2.0499267578125, 2.12158203125, 2.1932373046875, 2.264892578125, 2.3365478515625, 2.408203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 7.0, 7.0, 9.0, 6.0, 19.0, 19.0, 20.0, 27.0, 48.0, 40.0, 72.0, 89.0, 109.0, 164.0, 207.0, 262.0, 363.0, 516.0, 735.0, 1191.0, 2089.0, 4056.0, 11325.0, 85587.0, 1878081.0, 89849.0, 11968.0, 4229.0, 2040.0, 1218.0, 770.0, 541.0, 382.0, 248.0, 187.0, 160.0, 112.0, 103.0, 53.0, 59.0, 43.0, 27.0, 29.0, 18.0, 18.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-3.974609375, -3.855987548828125, -3.73736572265625, -3.618743896484375, -3.5001220703125, -3.381500244140625, -3.26287841796875, -3.144256591796875, -3.025634765625, -2.907012939453125, -2.78839111328125, -2.669769287109375, -2.5511474609375, -2.432525634765625, -2.31390380859375, -2.195281982421875, -2.07666015625, -1.958038330078125, -1.83941650390625, -1.720794677734375, -1.6021728515625, -1.483551025390625, -1.36492919921875, -1.246307373046875, -1.127685546875, -1.009063720703125, -0.89044189453125, -0.771820068359375, -0.6531982421875, -0.534576416015625, -0.41595458984375, -0.297332763671875, -0.1787109375, -0.060089111328125, 0.05853271484375, 0.177154541015625, 0.2957763671875, 0.414398193359375, 0.53302001953125, 0.651641845703125, 0.770263671875, 0.888885498046875, 1.00750732421875, 1.126129150390625, 1.2447509765625, 1.363372802734375, 1.48199462890625, 1.600616455078125, 1.71923828125, 1.837860107421875, 1.95648193359375, 2.075103759765625, 2.1937255859375, 2.312347412109375, 2.43096923828125, 2.549591064453125, 2.668212890625, 2.786834716796875, 2.90545654296875, 3.024078369140625, 3.1427001953125, 3.261322021484375, 3.37994384765625, 3.498565673828125, 3.6171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 15.0, 17.0, 10.0, 32.0, 40.0, 78.0, 132.0, 155.0, 146.0, 101.0, 77.0, 49.0, 25.0, 27.0, 21.0, 7.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.45072174072265625, -0.4365997314453125, -0.42247772216796875, -0.408355712890625, -0.39423370361328125, -0.3801116943359375, -0.36598968505859375, -0.35186767578125, -0.33774566650390625, -0.3236236572265625, -0.30950164794921875, -0.295379638671875, -0.28125762939453125, -0.2671356201171875, -0.25301361083984375, -0.2388916015625, -0.22476959228515625, -0.2106475830078125, -0.19652557373046875, -0.182403564453125, -0.16828155517578125, -0.1541595458984375, -0.14003753662109375, -0.12591552734375, -0.11179351806640625, -0.0976715087890625, -0.08354949951171875, -0.069427490234375, -0.05530548095703125, -0.0411834716796875, -0.02706146240234375, -0.012939453125, 0.00118255615234375, 0.0153045654296875, 0.02942657470703125, 0.043548583984375, 0.05767059326171875, 0.0717926025390625, 0.08591461181640625, 0.10003662109375, 0.11415863037109375, 0.1282806396484375, 0.14240264892578125, 0.156524658203125, 0.17064666748046875, 0.1847686767578125, 0.19889068603515625, 0.2130126953125, 0.22713470458984375, 0.2412567138671875, 0.25537872314453125, 0.269500732421875, 0.28362274169921875, 0.2977447509765625, 0.31186676025390625, 0.32598876953125, 0.34011077880859375, 0.3542327880859375, 0.36835479736328125, 0.382476806640625, 0.39659881591796875, 0.4107208251953125, 0.42484283447265625, 0.43896484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 13.0, 30.0, 34.0, 56.0, 111.0, 378.0, 3271.0, 188902.0, 850654.0, 4317.0, 480.0, 103.0, 56.0, 36.0, 21.0, 23.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.73291015625, -8.4423828125, -8.15185546875, -7.861328125, -7.57080078125, -7.2802734375, -6.98974609375, -6.69921875, -6.40869140625, -6.1181640625, -5.82763671875, -5.537109375, -5.24658203125, -4.9560546875, -4.66552734375, -4.375, -4.08447265625, -3.7939453125, -3.50341796875, -3.212890625, -2.92236328125, -2.6318359375, -2.34130859375, -2.05078125, -1.76025390625, -1.4697265625, -1.17919921875, -0.888671875, -0.59814453125, -0.3076171875, -0.01708984375, 0.2734375, 0.56396484375, 0.8544921875, 1.14501953125, 1.435546875, 1.72607421875, 2.0166015625, 2.30712890625, 2.59765625, 2.88818359375, 3.1787109375, 3.46923828125, 3.759765625, 4.05029296875, 4.3408203125, 4.63134765625, 4.921875, 5.21240234375, 5.5029296875, 5.79345703125, 6.083984375, 6.37451171875, 6.6650390625, 6.95556640625, 7.24609375, 7.53662109375, 7.8271484375, 8.11767578125, 8.408203125, 8.69873046875, 8.9892578125, 9.27978515625, 9.5703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 6.0, 7.0, 22.0, 51.0, 93.0, 178.0, 264.0, 224.0, 85.0, 41.0, 20.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4520385265350342, -0.4051550328731537, -0.3582715392112732, -0.3113880455493927, -0.2645045518875122, -0.2176210582256317, -0.17073756456375122, -0.12385407090187073, -0.07697057723999023, -0.03008708357810974, 0.016796410083770752, 0.06367990374565125, 0.11056339740753174, 0.15744689106941223, 0.20433038473129272, 0.2512138783931732, 0.2980973720550537, 0.3449808657169342, 0.3918643593788147, 0.4387478530406952, 0.4856313467025757, 0.5325148105621338, 0.5793983340263367, 0.6262818574905396, 0.6731653213500977, 0.7200487852096558, 0.7669323086738586, 0.8138158321380615, 0.8606992959976196, 0.9075827598571777, 0.9544662833213806, 1.0013498067855835, 1.0482332706451416, 1.0951167345046997, 1.1420001983642578, 1.1888837814331055, 1.2357672452926636, 1.2826507091522217, 1.3295342922210693, 1.3764177560806274, 1.4233012199401855, 1.4701846837997437, 1.5170681476593018, 1.5639517307281494, 1.6108351945877075, 1.6577186584472656, 1.7046022415161133, 1.7514857053756714, 1.7983691692352295, 1.8452526330947876, 1.8921360969543457, 1.9390196800231934, 1.9859031438827515, 2.0327866077423096, 2.0796701908111572, 2.126553535461426, 2.1734371185302734, 2.220320701599121, 2.2672040462493896, 2.3140876293182373, 2.360970973968506, 2.4078545570373535, 2.454738140106201, 2.5016214847564697, 2.5485050678253174]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 7.0, 2.0, 4.0, 4.0, 6.0, 14.0, 12.0, 19.0, 10.0, 18.0, 19.0, 23.0, 27.0, 29.0, 39.0, 42.0, 35.0, 40.0, 43.0, 47.0, 53.0, 55.0, 38.0, 50.0, 39.0, 32.0, 36.0, 27.0, 34.0, 27.0, 32.0, 24.0, 21.0, 18.0, 25.0, 16.0, 11.0, 6.0, 9.0, 9.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432320773601532, -0.4188823699951172, -0.40544393658638, -0.3920055329799652, -0.3785671293735504, -0.36512869596481323, -0.35169029235839844, -0.33825188875198364, -0.32481348514556885, -0.31137508153915405, -0.29793664813041687, -0.2844982445240021, -0.2710598409175873, -0.2576214075088501, -0.2441830039024353, -0.2307446002960205, -0.21730618178844452, -0.20386776328086853, -0.19042935967445374, -0.17699094116687775, -0.16355253756046295, -0.15011411905288696, -0.13667571544647217, -0.12323729693889618, -0.10979888588190079, -0.0963604748249054, -0.08292206376791, -0.06948365271091461, -0.05604523792862892, -0.04260682314634323, -0.02916841208934784, -0.015730001032352448, -0.0022915899753570557, 0.01114682201296091, 0.024585234001278877, 0.03802364692091942, 0.05146205797791481, 0.0649004727602005, 0.07833888381719589, 0.09177729487419128, 0.10521570593118668, 0.11865411698818207, 0.13209253549575806, 0.14553093910217285, 0.15896935760974884, 0.17240777611732483, 0.18584617972373962, 0.19928458333015442, 0.2127230018377304, 0.2261614203453064, 0.2395998239517212, 0.253038227558136, 0.26647666096687317, 0.27991506457328796, 0.29335346817970276, 0.30679190158843994, 0.32023030519485474, 0.33366870880126953, 0.3471071422100067, 0.3605455458164215, 0.3739839494228363, 0.3874223828315735, 0.4008607864379883, 0.4142991900444031, 0.42773759365081787]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 8.0, 8.0, 14.0, 13.0, 17.0, 13.0, 21.0, 21.0, 30.0, 27.0, 34.0, 39.0, 40.0, 41.0, 41.0, 48.0, 52.0, 43.0, 36.0, 50.0, 52.0, 49.0, 38.0, 38.0, 28.0, 37.0, 25.0, 20.0, 18.0, 25.0, 18.0, 5.0, 13.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.101531982421875, -2.99993896484375, -2.898345947265625, -2.7967529296875, -2.695159912109375, -2.59356689453125, -2.491973876953125, -2.390380859375, -2.288787841796875, -2.18719482421875, -2.085601806640625, -1.9840087890625, -1.882415771484375, -1.78082275390625, -1.679229736328125, -1.57763671875, -1.476043701171875, -1.37445068359375, -1.272857666015625, -1.1712646484375, -1.069671630859375, -0.96807861328125, -0.866485595703125, -0.764892578125, -0.663299560546875, -0.56170654296875, -0.460113525390625, -0.3585205078125, -0.256927490234375, -0.15533447265625, -0.053741455078125, 0.0478515625, 0.149444580078125, 0.25103759765625, 0.352630615234375, 0.4542236328125, 0.555816650390625, 0.65740966796875, 0.759002685546875, 0.860595703125, 0.962188720703125, 1.06378173828125, 1.165374755859375, 1.2669677734375, 1.368560791015625, 1.47015380859375, 1.571746826171875, 1.67333984375, 1.774932861328125, 1.87652587890625, 1.978118896484375, 2.0797119140625, 2.181304931640625, 2.28289794921875, 2.384490966796875, 2.486083984375, 2.587677001953125, 2.68927001953125, 2.790863037109375, 2.8924560546875, 2.994049072265625, 3.09564208984375, 3.197235107421875, 3.298828125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 6.0, 9.0, 9.0, 22.0, 20.0, 41.0, 56.0, 74.0, 90.0, 175.0, 232.0, 284.0, 471.0, 591.0, 900.0, 1295.0, 1934.0, 2830.0, 4508.0, 7087.0, 11979.0, 20823.0, 39538.0, 81988.0, 205175.0, 377068.0, 149504.0, 64158.0, 32093.0, 17405.0, 10104.0, 6228.0, 3778.0, 2568.0, 1674.0, 1174.0, 835.0, 544.0, 364.0, 286.0, 177.0, 138.0, 100.0, 70.0, 56.0, 35.0, 18.0, 18.0, 8.0, 5.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.21484375, -3.112274169921875, -3.00970458984375, -2.907135009765625, -2.8045654296875, -2.701995849609375, -2.59942626953125, -2.496856689453125, -2.394287109375, -2.291717529296875, -2.18914794921875, -2.086578369140625, -1.9840087890625, -1.881439208984375, -1.77886962890625, -1.676300048828125, -1.57373046875, -1.471160888671875, -1.36859130859375, -1.266021728515625, -1.1634521484375, -1.060882568359375, -0.95831298828125, -0.855743408203125, -0.753173828125, -0.650604248046875, -0.54803466796875, -0.445465087890625, -0.3428955078125, -0.240325927734375, -0.13775634765625, -0.035186767578125, 0.0673828125, 0.169952392578125, 0.27252197265625, 0.375091552734375, 0.4776611328125, 0.580230712890625, 0.68280029296875, 0.785369873046875, 0.887939453125, 0.990509033203125, 1.09307861328125, 1.195648193359375, 1.2982177734375, 1.400787353515625, 1.50335693359375, 1.605926513671875, 1.70849609375, 1.811065673828125, 1.91363525390625, 2.016204833984375, 2.1187744140625, 2.221343994140625, 2.32391357421875, 2.426483154296875, 2.529052734375, 2.631622314453125, 2.73419189453125, 2.836761474609375, 2.9393310546875, 3.041900634765625, 3.14447021484375, 3.247039794921875, 3.349609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 11.0, 22.0, 25.0, 14.0, 34.0, 19.0, 35.0, 35.0, 51.0, 56.0, 64.0, 90.0, 184.0, 1389.0, 300.0, 160.0, 110.0, 63.0, 58.0, 50.0, 33.0, 34.0, 25.0, 26.0, 19.0, 21.0, 12.0, 21.0, 10.0, 9.0, 9.0, 9.0, 5.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.34375, -9.998291015625, -9.65283203125, -9.307373046875, -8.9619140625, -8.616455078125, -8.27099609375, -7.925537109375, -7.580078125, -7.234619140625, -6.88916015625, -6.543701171875, -6.1982421875, -5.852783203125, -5.50732421875, -5.161865234375, -4.81640625, -4.470947265625, -4.12548828125, -3.780029296875, -3.4345703125, -3.089111328125, -2.74365234375, -2.398193359375, -2.052734375, -1.707275390625, -1.36181640625, -1.016357421875, -0.6708984375, -0.325439453125, 0.02001953125, 0.365478515625, 0.7109375, 1.056396484375, 1.40185546875, 1.747314453125, 2.0927734375, 2.438232421875, 2.78369140625, 3.129150390625, 3.474609375, 3.820068359375, 4.16552734375, 4.510986328125, 4.8564453125, 5.201904296875, 5.54736328125, 5.892822265625, 6.23828125, 6.583740234375, 6.92919921875, 7.274658203125, 7.6201171875, 7.965576171875, 8.31103515625, 8.656494140625, 9.001953125, 9.347412109375, 9.69287109375, 10.038330078125, 10.3837890625, 10.729248046875, 11.07470703125, 11.420166015625, 11.765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 11.0, 10.0, 13.0, 14.0, 26.0, 10.0, 28.0, 25.0, 42.0, 60.0, 76.0, 95.0, 114.0, 181.0, 242.0, 401.0, 939.0, 2642.0, 11768.0, 119480.0, 2786104.0, 201856.0, 15923.0, 3231.0, 1040.0, 459.0, 265.0, 168.0, 121.0, 89.0, 52.0, 50.0, 39.0, 25.0, 21.0, 18.0, 13.0, 12.0, 12.0, 7.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.28125, -18.7236328125, -18.166015625, -17.6083984375, -17.05078125, -16.4931640625, -15.935546875, -15.3779296875, -14.8203125, -14.2626953125, -13.705078125, -13.1474609375, -12.58984375, -12.0322265625, -11.474609375, -10.9169921875, -10.359375, -9.8017578125, -9.244140625, -8.6865234375, -8.12890625, -7.5712890625, -7.013671875, -6.4560546875, -5.8984375, -5.3408203125, -4.783203125, -4.2255859375, -3.66796875, -3.1103515625, -2.552734375, -1.9951171875, -1.4375, -0.8798828125, -0.322265625, 0.2353515625, 0.79296875, 1.3505859375, 1.908203125, 2.4658203125, 3.0234375, 3.5810546875, 4.138671875, 4.6962890625, 5.25390625, 5.8115234375, 6.369140625, 6.9267578125, 7.484375, 8.0419921875, 8.599609375, 9.1572265625, 9.71484375, 10.2724609375, 10.830078125, 11.3876953125, 11.9453125, 12.5029296875, 13.060546875, 13.6181640625, 14.17578125, 14.7333984375, 15.291015625, 15.8486328125, 16.40625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 618.0, 393.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2069091796875, -579.0357055664062, -568.8645629882812, -558.693359375, -548.5221557617188, -538.3510131835938, -528.1798095703125, -518.0086059570312, -507.8374328613281, -497.666259765625, -487.49505615234375, -477.3238830566406, -467.1527099609375, -456.98150634765625, -446.8103332519531, -436.63916015625, -426.46795654296875, -416.2967834472656, -406.1255798339844, -395.95440673828125, -385.783203125, -375.6120300292969, -365.44085693359375, -355.2696533203125, -345.0984802246094, -334.92730712890625, -324.756103515625, -314.5849304199219, -304.41375732421875, -294.2425537109375, -284.0713806152344, -273.90020751953125, -263.72900390625, -253.5578155517578, -243.38662719726562, -233.2154541015625, -223.0442657470703, -212.87307739257812, -202.701904296875, -192.5307159423828, -182.3595428466797, -172.1883544921875, -162.01718139648438, -151.8459930419922, -141.6748046875, -131.5036163330078, -121.33243560791016, -111.1612548828125, -100.99006652832031, -90.81887817382812, -80.64769744873047, -70.47651672363281, -60.305328369140625, -50.1341438293457, -39.96295928955078, -29.791778564453125, -19.620586395263672, -9.44940185546875, 0.7217826843261719, 10.892967224121094, 21.064151763916016, 31.235336303710938, 41.40652084350586, 51.577701568603516, 61.7488899230957]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 13.0, 20.0, 14.0, 13.0, 25.0, 34.0, 22.0, 26.0, 42.0, 31.0, 32.0, 40.0, 40.0, 51.0, 44.0, 58.0, 45.0, 44.0, 45.0, 32.0, 39.0, 32.0, 21.0, 34.0, 27.0, 29.0, 21.0, 12.0, 20.0, 12.0, 10.0, 15.0, 10.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.83502769470215, -30.820438385009766, -29.805849075317383, -28.791259765625, -27.776670455932617, -26.762081146240234, -25.747493743896484, -24.73290252685547, -23.71831512451172, -22.703725814819336, -21.689136505126953, -20.67454719543457, -19.659957885742188, -18.645368576049805, -17.630779266357422, -16.616191864013672, -15.601600646972656, -14.587011337280273, -13.57242202758789, -12.557832717895508, -11.543243408203125, -10.528654098510742, -9.514065742492676, -8.499476432800293, -7.48488712310791, -6.470297813415527, -5.4557085037231445, -4.44111967086792, -3.426530361175537, -2.4119410514831543, -1.3973522186279297, -0.3827629089355469, 0.6318283081054688, 1.646417498588562, 2.6610066890716553, 3.675595760345459, 4.690185070037842, 5.704774379730225, 6.719363212585449, 7.733952522277832, 8.748541831970215, 9.763131141662598, 10.77772045135498, 11.792308807373047, 12.80689811706543, 13.821487426757812, 14.836076736450195, 15.850666046142578, 16.86525535583496, 17.879844665527344, 18.894433975219727, 19.90902328491211, 20.923612594604492, 21.938201904296875, 22.952789306640625, 23.96738052368164, 24.98196792602539, 25.996557235717773, 27.011146545410156, 28.02573585510254, 29.040325164794922, 30.054914474487305, 31.069503784179688, 32.08409118652344, 33.09868240356445]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 10.0, 9.0, 12.0, 17.0, 23.0, 28.0, 25.0, 30.0, 27.0, 42.0, 35.0, 37.0, 53.0, 47.0, 52.0, 44.0, 51.0, 57.0, 53.0, 42.0, 42.0, 34.0, 27.0, 29.0, 24.0, 29.0, 25.0, 17.0, 14.0, 9.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5625, -3.4490966796875, -3.335693359375, -3.2222900390625, -3.10888671875, -2.9954833984375, -2.882080078125, -2.7686767578125, -2.6552734375, -2.5418701171875, -2.428466796875, -2.3150634765625, -2.20166015625, -2.0882568359375, -1.974853515625, -1.8614501953125, -1.748046875, -1.6346435546875, -1.521240234375, -1.4078369140625, -1.29443359375, -1.1810302734375, -1.067626953125, -0.9542236328125, -0.8408203125, -0.7274169921875, -0.614013671875, -0.5006103515625, -0.38720703125, -0.2738037109375, -0.160400390625, -0.0469970703125, 0.06640625, 0.1798095703125, 0.293212890625, 0.4066162109375, 0.52001953125, 0.6334228515625, 0.746826171875, 0.8602294921875, 0.9736328125, 1.0870361328125, 1.200439453125, 1.3138427734375, 1.42724609375, 1.5406494140625, 1.654052734375, 1.7674560546875, 1.880859375, 1.9942626953125, 2.107666015625, 2.2210693359375, 2.33447265625, 2.4478759765625, 2.561279296875, 2.6746826171875, 2.7880859375, 2.9014892578125, 3.014892578125, 3.1282958984375, 3.24169921875, 3.3551025390625, 3.468505859375, 3.5819091796875, 3.6953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 16.0, 26.0, 45.0, 48.0, 81.0, 112.0, 212.0, 364.0, 592.0, 929.0, 1677.0, 3071.0, 5990.0, 12374.0, 27508.0, 77017.0, 537248.0, 2880165.0, 518450.0, 75922.0, 26745.0, 12218.0, 6032.0, 3118.0, 1667.0, 1033.0, 556.0, 372.0, 223.0, 141.0, 87.0, 68.0, 48.0, 24.0, 19.0, 16.0, 12.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5, -8.2384033203125, -7.976806640625, -7.7152099609375, -7.45361328125, -7.1920166015625, -6.930419921875, -6.6688232421875, -6.4072265625, -6.1456298828125, -5.884033203125, -5.6224365234375, -5.36083984375, -5.0992431640625, -4.837646484375, -4.5760498046875, -4.314453125, -4.0528564453125, -3.791259765625, -3.5296630859375, -3.26806640625, -3.0064697265625, -2.744873046875, -2.4832763671875, -2.2216796875, -1.9600830078125, -1.698486328125, -1.4368896484375, -1.17529296875, -0.9136962890625, -0.652099609375, -0.3905029296875, -0.12890625, 0.1326904296875, 0.394287109375, 0.6558837890625, 0.91748046875, 1.1790771484375, 1.440673828125, 1.7022705078125, 1.9638671875, 2.2254638671875, 2.487060546875, 2.7486572265625, 3.01025390625, 3.2718505859375, 3.533447265625, 3.7950439453125, 4.056640625, 4.3182373046875, 4.579833984375, 4.8414306640625, 5.10302734375, 5.3646240234375, 5.626220703125, 5.8878173828125, 6.1494140625, 6.4110107421875, 6.672607421875, 6.9342041015625, 7.19580078125, 7.4573974609375, 7.718994140625, 7.9805908203125, 8.2421875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 8.0, 10.0, 23.0, 27.0, 32.0, 37.0, 48.0, 98.0, 116.0, 248.0, 431.0, 764.0, 860.0, 510.0, 277.0, 160.0, 107.0, 82.0, 54.0, 38.0, 31.0, 22.0, 18.0, 18.0, 14.0, 7.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.0137939453125, -8.715087890625, -8.4163818359375, -8.11767578125, -7.8189697265625, -7.520263671875, -7.2215576171875, -6.9228515625, -6.6241455078125, -6.325439453125, -6.0267333984375, -5.72802734375, -5.4293212890625, -5.130615234375, -4.8319091796875, -4.533203125, -4.2344970703125, -3.935791015625, -3.6370849609375, -3.33837890625, -3.0396728515625, -2.740966796875, -2.4422607421875, -2.1435546875, -1.8448486328125, -1.546142578125, -1.2474365234375, -0.94873046875, -0.6500244140625, -0.351318359375, -0.0526123046875, 0.24609375, 0.5447998046875, 0.843505859375, 1.1422119140625, 1.44091796875, 1.7396240234375, 2.038330078125, 2.3370361328125, 2.6357421875, 2.9344482421875, 3.233154296875, 3.5318603515625, 3.83056640625, 4.1292724609375, 4.427978515625, 4.7266845703125, 5.025390625, 5.3240966796875, 5.622802734375, 5.9215087890625, 6.22021484375, 6.5189208984375, 6.817626953125, 7.1163330078125, 7.4150390625, 7.7137451171875, 8.012451171875, 8.3111572265625, 8.60986328125, 8.9085693359375, 9.207275390625, 9.5059814453125, 9.8046875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 17.0, 17.0, 20.0, 28.0, 30.0, 55.0, 96.0, 168.0, 377.0, 1310.0, 7880.0, 105315.0, 3889382.0, 176450.0, 10601.0, 1636.0, 444.0, 179.0, 91.0, 48.0, 40.0, 31.0, 13.0, 12.0, 7.0, 8.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.41064453125, -30.4462890625, -29.48193359375, -28.517578125, -27.55322265625, -26.5888671875, -25.62451171875, -24.66015625, -23.69580078125, -22.7314453125, -21.76708984375, -20.802734375, -19.83837890625, -18.8740234375, -17.90966796875, -16.9453125, -15.98095703125, -15.0166015625, -14.05224609375, -13.087890625, -12.12353515625, -11.1591796875, -10.19482421875, -9.23046875, -8.26611328125, -7.3017578125, -6.33740234375, -5.373046875, -4.40869140625, -3.4443359375, -2.47998046875, -1.515625, -0.55126953125, 0.4130859375, 1.37744140625, 2.341796875, 3.30615234375, 4.2705078125, 5.23486328125, 6.19921875, 7.16357421875, 8.1279296875, 9.09228515625, 10.056640625, 11.02099609375, 11.9853515625, 12.94970703125, 13.9140625, 14.87841796875, 15.8427734375, 16.80712890625, 17.771484375, 18.73583984375, 19.7001953125, 20.66455078125, 21.62890625, 22.59326171875, 23.5576171875, 24.52197265625, 25.486328125, 26.45068359375, 27.4150390625, 28.37939453125, 29.34375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 25.0, 23.0, 22.0, 47.0, 81.0, 99.0, 131.0, 110.0, 113.0, 96.0, 83.0, 50.0, 39.0, 23.0, 18.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.63386917114258, -44.47373580932617, -43.31360626220703, -42.153472900390625, -40.99333953857422, -39.83320617675781, -38.67307662963867, -37.512943267822266, -36.352813720703125, -35.19268035888672, -34.03255081176758, -32.87241744995117, -31.712284088134766, -30.552152633666992, -29.39202117919922, -28.231887817382812, -27.071754455566406, -25.911623001098633, -24.751489639282227, -23.591358184814453, -22.431224822998047, -21.271093368530273, -20.1109619140625, -18.950828552246094, -17.79069709777832, -16.630565643310547, -15.47043228149414, -14.310300827026367, -13.150168418884277, -11.990036010742188, -10.829904556274414, -9.669772148132324, -8.509637832641602, -7.349505424499512, -6.18937349319458, -5.029241561889648, -3.8691091537475586, -2.7089767456054688, -1.548844814300537, -0.38871288299560547, 0.7714195251464844, 1.9315516948699951, 3.091683864593506, 4.2518157958984375, 5.411948204040527, 6.572080612182617, 7.732212543487549, 8.89234447479248, 10.05247688293457, 11.21260929107666, 12.37274169921875, 13.532873153686523, 14.693005561828613, 15.853137969970703, 17.013269424438477, 18.17340087890625, 19.333534240722656, 20.49366569519043, 21.653799057006836, 22.81393051147461, 23.974063873291016, 25.13419532775879, 26.294326782226562, 27.45446014404297, 28.614591598510742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 1.0, 5.0, 7.0, 10.0, 12.0, 14.0, 23.0, 36.0, 19.0, 37.0, 38.0, 26.0, 41.0, 45.0, 38.0, 47.0, 31.0, 38.0, 46.0, 50.0, 37.0, 37.0, 38.0, 34.0, 39.0, 40.0, 33.0, 36.0, 24.0, 24.0, 16.0, 13.0, 12.0, 12.0, 2.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.061450958251953, -25.286300659179688, -24.51114845275879, -23.735998153686523, -22.960847854614258, -22.18569564819336, -21.410545349121094, -20.635395050048828, -19.86024284362793, -19.085092544555664, -18.309940338134766, -17.5347900390625, -16.759639739990234, -15.984487533569336, -15.20933723449707, -14.434185981750488, -13.659035682678223, -12.88388442993164, -12.108734130859375, -11.333582878112793, -10.558431625366211, -9.783281326293945, -9.008130073547363, -8.232978820800781, -7.457828044891357, -6.682677268981934, -5.907526016235352, -5.132375240325928, -4.357224464416504, -3.582073211669922, -2.806922435760498, -2.031771183013916, -1.2566204071044922, -0.48146945238113403, 0.2936815023422241, 1.0688323974609375, 1.8439834117889404, 2.6191344261169434, 3.394285202026367, 4.169436454772949, 4.944587230682373, 5.719738006591797, 6.494889259338379, 7.270040035247803, 8.045190811157227, 8.820342063903809, 9.59549331665039, 10.370643615722656, 11.145794868469238, 11.92094612121582, 12.696096420288086, 13.471247673034668, 14.24639892578125, 15.021549224853516, 15.796700477600098, 16.57185173034668, 17.347002029418945, 18.12215232849121, 18.89730453491211, 19.672454833984375, 20.44760513305664, 21.22275733947754, 21.997907638549805, 22.773059844970703, 23.54821014404297]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 6.0, 10.0, 8.0, 12.0, 22.0, 19.0, 21.0, 37.0, 28.0, 35.0, 38.0, 25.0, 36.0, 50.0, 45.0, 44.0, 38.0, 40.0, 33.0, 50.0, 45.0, 43.0, 37.0, 40.0, 33.0, 24.0, 15.0, 17.0, 24.0, 16.0, 16.0, 17.0, 15.0, 6.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84423828125, -2.7490234375, -2.65380859375, -2.55859375, -2.46337890625, -2.3681640625, -2.27294921875, -2.177734375, -2.08251953125, -1.9873046875, -1.89208984375, -1.796875, -1.70166015625, -1.6064453125, -1.51123046875, -1.416015625, -1.32080078125, -1.2255859375, -1.13037109375, -1.03515625, -0.93994140625, -0.8447265625, -0.74951171875, -0.654296875, -0.55908203125, -0.4638671875, -0.36865234375, -0.2734375, -0.17822265625, -0.0830078125, 0.01220703125, 0.107421875, 0.20263671875, 0.2978515625, 0.39306640625, 0.48828125, 0.58349609375, 0.6787109375, 0.77392578125, 0.869140625, 0.96435546875, 1.0595703125, 1.15478515625, 1.25, 1.34521484375, 1.4404296875, 1.53564453125, 1.630859375, 1.72607421875, 1.8212890625, 1.91650390625, 2.01171875, 2.10693359375, 2.2021484375, 2.29736328125, 2.392578125, 2.48779296875, 2.5830078125, 2.67822265625, 2.7734375, 2.86865234375, 2.9638671875, 3.05908203125, 3.154296875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 19.0, 25.0, 32.0, 44.0, 67.0, 92.0, 122.0, 150.0, 219.0, 342.0, 444.0, 662.0, 944.0, 1367.0, 2170.0, 3344.0, 5537.0, 9727.0, 18761.0, 43822.0, 173242.0, 586396.0, 125218.0, 36108.0, 16694.0, 8657.0, 5020.0, 3009.0, 1966.0, 1342.0, 893.0, 626.0, 382.0, 315.0, 221.0, 158.0, 111.0, 85.0, 46.0, 42.0, 32.0, 27.0, 15.0, 16.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.296875, -5.1334228515625, -4.969970703125, -4.8065185546875, -4.64306640625, -4.4796142578125, -4.316162109375, -4.1527099609375, -3.9892578125, -3.8258056640625, -3.662353515625, -3.4989013671875, -3.33544921875, -3.1719970703125, -3.008544921875, -2.8450927734375, -2.681640625, -2.5181884765625, -2.354736328125, -2.1912841796875, -2.02783203125, -1.8643798828125, -1.700927734375, -1.5374755859375, -1.3740234375, -1.2105712890625, -1.047119140625, -0.8836669921875, -0.72021484375, -0.5567626953125, -0.393310546875, -0.2298583984375, -0.06640625, 0.0970458984375, 0.260498046875, 0.4239501953125, 0.58740234375, 0.7508544921875, 0.914306640625, 1.0777587890625, 1.2412109375, 1.4046630859375, 1.568115234375, 1.7315673828125, 1.89501953125, 2.0584716796875, 2.221923828125, 2.3853759765625, 2.548828125, 2.7122802734375, 2.875732421875, 3.0391845703125, 3.20263671875, 3.3660888671875, 3.529541015625, 3.6929931640625, 3.8564453125, 4.0198974609375, 4.183349609375, 4.3468017578125, 4.51025390625, 4.6737060546875, 4.837158203125, 5.0006103515625, 5.1640625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 22.0, 24.0, 18.0, 19.0, 31.0, 28.0, 26.0, 34.0, 37.0, 31.0, 38.0, 36.0, 34.0, 36.0, 1059.0, 39.0, 47.0, 34.0, 39.0, 34.0, 39.0, 35.0, 31.0, 41.0, 20.0, 16.0, 21.0, 14.0, 14.0, 14.0, 17.0, 7.0, 6.0, 4.0, 9.0, 3.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.423828125, -2.347747802734375, -2.27166748046875, -2.195587158203125, -2.1195068359375, -2.043426513671875, -1.96734619140625, -1.891265869140625, -1.815185546875, -1.739105224609375, -1.66302490234375, -1.586944580078125, -1.5108642578125, -1.434783935546875, -1.35870361328125, -1.282623291015625, -1.20654296875, -1.130462646484375, -1.05438232421875, -0.978302001953125, -0.9022216796875, -0.826141357421875, -0.75006103515625, -0.673980712890625, -0.597900390625, -0.521820068359375, -0.44573974609375, -0.369659423828125, -0.2935791015625, -0.217498779296875, -0.14141845703125, -0.065338134765625, 0.0107421875, 0.086822509765625, 0.16290283203125, 0.238983154296875, 0.3150634765625, 0.391143798828125, 0.46722412109375, 0.543304443359375, 0.619384765625, 0.695465087890625, 0.77154541015625, 0.847625732421875, 0.9237060546875, 0.999786376953125, 1.07586669921875, 1.151947021484375, 1.22802734375, 1.304107666015625, 1.38018798828125, 1.456268310546875, 1.5323486328125, 1.608428955078125, 1.68450927734375, 1.760589599609375, 1.836669921875, 1.912750244140625, 1.98883056640625, 2.064910888671875, 2.1409912109375, 2.217071533203125, 2.29315185546875, 2.369232177734375, 2.4453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 10.0, 13.0, 28.0, 42.0, 55.0, 86.0, 131.0, 190.0, 288.0, 466.0, 678.0, 1234.0, 2022.0, 3582.0, 6827.0, 14110.0, 36540.0, 194763.0, 1674104.0, 109512.0, 27206.0, 11628.0, 5765.0, 3125.0, 1840.0, 1099.0, 617.0, 394.0, 273.0, 155.0, 125.0, 79.0, 48.0, 37.0, 20.0, 17.0, 5.0, 9.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.2830810546875, -5.109130859375, -4.9351806640625, -4.76123046875, -4.5872802734375, -4.413330078125, -4.2393798828125, -4.0654296875, -3.8914794921875, -3.717529296875, -3.5435791015625, -3.36962890625, -3.1956787109375, -3.021728515625, -2.8477783203125, -2.673828125, -2.4998779296875, -2.325927734375, -2.1519775390625, -1.97802734375, -1.8040771484375, -1.630126953125, -1.4561767578125, -1.2822265625, -1.1082763671875, -0.934326171875, -0.7603759765625, -0.58642578125, -0.4124755859375, -0.238525390625, -0.0645751953125, 0.109375, 0.2833251953125, 0.457275390625, 0.6312255859375, 0.80517578125, 0.9791259765625, 1.153076171875, 1.3270263671875, 1.5009765625, 1.6749267578125, 1.848876953125, 2.0228271484375, 2.19677734375, 2.3707275390625, 2.544677734375, 2.7186279296875, 2.892578125, 3.0665283203125, 3.240478515625, 3.4144287109375, 3.58837890625, 3.7623291015625, 3.936279296875, 4.1102294921875, 4.2841796875, 4.4581298828125, 4.632080078125, 4.8060302734375, 4.97998046875, 5.1539306640625, 5.327880859375, 5.5018310546875, 5.67578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 28.0, 33.0, 134.0, 342.0, 238.0, 93.0, 31.0, 17.0, 20.0, 9.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9052734375, -1.8489837646484375, -1.792694091796875, -1.7364044189453125, -1.68011474609375, -1.6238250732421875, -1.567535400390625, -1.5112457275390625, -1.4549560546875, -1.3986663818359375, -1.342376708984375, -1.2860870361328125, -1.22979736328125, -1.1735076904296875, -1.117218017578125, -1.0609283447265625, -1.004638671875, -0.9483489990234375, -0.892059326171875, -0.8357696533203125, -0.77947998046875, -0.7231903076171875, -0.666900634765625, -0.6106109619140625, -0.5543212890625, -0.4980316162109375, -0.441741943359375, -0.3854522705078125, -0.32916259765625, -0.2728729248046875, -0.216583251953125, -0.1602935791015625, -0.10400390625, -0.0477142333984375, 0.008575439453125, 0.0648651123046875, 0.12115478515625, 0.1774444580078125, 0.233734130859375, 0.2900238037109375, 0.3463134765625, 0.4026031494140625, 0.458892822265625, 0.5151824951171875, 0.57147216796875, 0.6277618408203125, 0.684051513671875, 0.7403411865234375, 0.796630859375, 0.8529205322265625, 0.909210205078125, 0.9654998779296875, 1.02178955078125, 1.0780792236328125, 1.134368896484375, 1.1906585693359375, 1.2469482421875, 1.3032379150390625, 1.359527587890625, 1.4158172607421875, 1.47210693359375, 1.5283966064453125, 1.584686279296875, 1.6409759521484375, 1.697265625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 5.0, 9.0, 15.0, 37.0, 65.0, 231.0, 1412.0, 41236.0, 1002252.0, 2701.0, 411.0, 77.0, 30.0, 23.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.9375, -31.84521484375, -30.7529296875, -29.66064453125, -28.568359375, -27.47607421875, -26.3837890625, -25.29150390625, -24.19921875, -23.10693359375, -22.0146484375, -20.92236328125, -19.830078125, -18.73779296875, -17.6455078125, -16.55322265625, -15.4609375, -14.36865234375, -13.2763671875, -12.18408203125, -11.091796875, -9.99951171875, -8.9072265625, -7.81494140625, -6.72265625, -5.63037109375, -4.5380859375, -3.44580078125, -2.353515625, -1.26123046875, -0.1689453125, 0.92333984375, 2.015625, 3.10791015625, 4.2001953125, 5.29248046875, 6.384765625, 7.47705078125, 8.5693359375, 9.66162109375, 10.75390625, 11.84619140625, 12.9384765625, 14.03076171875, 15.123046875, 16.21533203125, 17.3076171875, 18.39990234375, 19.4921875, 20.58447265625, 21.6767578125, 22.76904296875, 23.861328125, 24.95361328125, 26.0458984375, 27.13818359375, 28.23046875, 29.32275390625, 30.4150390625, 31.50732421875, 32.599609375, 33.69189453125, 34.7841796875, 35.87646484375, 36.96875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 31.0, 153.0, 664.0, 141.0, 19.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.514542579650879, -1.239621877670288, -0.9647012948989868, -0.6897806525230408, -0.4148600101470947, -0.1399393081665039, 0.13498127460479736, 0.40990185737609863, 0.6848225593566895, 0.9597432017326355, 1.2346638441085815, 1.5095844268798828, 1.7845051288604736, 2.0594258308410645, 2.334346294403076, 2.609266996383667, 2.884187698364258, 3.1591084003448486, 3.4340291023254395, 3.708949565887451, 3.983870267868042, 4.258790969848633, 4.5337114334106445, 4.808631896972656, 5.083552837371826, 5.358473300933838, 5.633394241333008, 5.9083147048950195, 6.183235168457031, 6.458156108856201, 6.733076572418213, 7.007997512817383, 7.282918930053711, 7.557839393615723, 7.832760334014893, 8.107681274414062, 8.382601737976074, 8.657522201538086, 8.932442665100098, 9.20736312866211, 9.482284545898438, 9.75720500946045, 10.032125473022461, 10.307046890258789, 10.5819673538208, 10.856887817382812, 11.131808280944824, 11.406728744506836, 11.681649208068848, 11.95656967163086, 12.231490135192871, 12.5064115524292, 12.781332015991211, 13.056252479553223, 13.331172943115234, 13.606093406677246, 13.881013870239258, 14.15593433380127, 14.430854797363281, 14.70577621459961, 14.980696678161621, 15.255617141723633, 15.530537605285645, 15.805458068847656, 16.080379486083984]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 12.0, 13.0, 19.0, 11.0, 23.0, 24.0, 35.0, 21.0, 25.0, 31.0, 43.0, 32.0, 38.0, 41.0, 36.0, 48.0, 39.0, 41.0, 40.0, 41.0, 30.0, 33.0, 33.0, 32.0, 28.0, 28.0, 31.0, 12.0, 19.0, 20.0, 14.0, 14.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9238834381103516, -0.8947098255157471, -0.8655362129211426, -0.8363626003265381, -0.8071890473365784, -0.7780154347419739, -0.7488418221473694, -0.7196682095527649, -0.6904945969581604, -0.6613209843635559, -0.6321473717689514, -0.6029738187789917, -0.5738002061843872, -0.5446265935897827, -0.5154529809951782, -0.48627936840057373, -0.4571057856082916, -0.42793217301368713, -0.39875859022140503, -0.36958497762680054, -0.34041136503219604, -0.31123775243759155, -0.28206416964530945, -0.25289055705070496, -0.22371695935726166, -0.19454336166381836, -0.16536974906921387, -0.13619615137577057, -0.10702254623174667, -0.07784894108772278, -0.04867534339427948, -0.019501730799674988, 0.00967186689376831, 0.038845472037792206, 0.0680190771818161, 0.0971926748752594, 0.1263662874698639, 0.1555398851633072, 0.1847134828567505, 0.21388709545135498, 0.24306069314479828, 0.2722342908382416, 0.30140790343284607, 0.3305814862251282, 0.35975509881973267, 0.38892871141433716, 0.41810232400894165, 0.44727593660354614, 0.47644951939582825, 0.5056231021881104, 0.5347967147827148, 0.5639703273773193, 0.5931439399719238, 0.6223175525665283, 0.6514911651611328, 0.6806647777557373, 0.709838330745697, 0.7390119433403015, 0.768185555934906, 0.7973591089248657, 0.8265327215194702, 0.8557063341140747, 0.8848799467086792, 0.9140535593032837, 0.9432271718978882]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 10.0, 8.0, 11.0, 14.0, 14.0, 24.0, 24.0, 29.0, 26.0, 20.0, 29.0, 46.0, 42.0, 44.0, 35.0, 47.0, 40.0, 33.0, 38.0, 34.0, 41.0, 51.0, 43.0, 39.0, 33.0, 28.0, 18.0, 17.0, 24.0, 23.0, 11.0, 12.0, 12.0, 9.0, 6.0, 14.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.744140625, -2.653533935546875, -2.56292724609375, -2.472320556640625, -2.3817138671875, -2.291107177734375, -2.20050048828125, -2.109893798828125, -2.019287109375, -1.928680419921875, -1.83807373046875, -1.747467041015625, -1.6568603515625, -1.566253662109375, -1.47564697265625, -1.385040283203125, -1.29443359375, -1.203826904296875, -1.11322021484375, -1.022613525390625, -0.9320068359375, -0.841400146484375, -0.75079345703125, -0.660186767578125, -0.569580078125, -0.478973388671875, -0.38836669921875, -0.297760009765625, -0.2071533203125, -0.116546630859375, -0.02593994140625, 0.064666748046875, 0.1552734375, 0.245880126953125, 0.33648681640625, 0.427093505859375, 0.5177001953125, 0.608306884765625, 0.69891357421875, 0.789520263671875, 0.880126953125, 0.970733642578125, 1.06134033203125, 1.151947021484375, 1.2425537109375, 1.333160400390625, 1.42376708984375, 1.514373779296875, 1.60498046875, 1.695587158203125, 1.78619384765625, 1.876800537109375, 1.9674072265625, 2.058013916015625, 2.14862060546875, 2.239227294921875, 2.329833984375, 2.420440673828125, 2.51104736328125, 2.601654052734375, 2.6922607421875, 2.782867431640625, 2.87347412109375, 2.964080810546875, 3.0546875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 21.0, 34.0, 46.0, 55.0, 97.0, 119.0, 145.0, 231.0, 329.0, 377.0, 538.0, 872.0, 1154.0, 1658.0, 2546.0, 4133.0, 7588.0, 16394.0, 46752.0, 185822.0, 553396.0, 152198.0, 40565.0, 14680.0, 7019.0, 3844.0, 2514.0, 1601.0, 1115.0, 759.0, 550.0, 365.0, 295.0, 194.0, 171.0, 108.0, 68.0, 59.0, 44.0, 33.0, 10.0, 18.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.90679931640625, -3.7784423828125, -3.65008544921875, -3.521728515625, -3.39337158203125, -3.2650146484375, -3.13665771484375, -3.00830078125, -2.87994384765625, -2.7515869140625, -2.62322998046875, -2.494873046875, -2.36651611328125, -2.2381591796875, -2.10980224609375, -1.9814453125, -1.85308837890625, -1.7247314453125, -1.59637451171875, -1.468017578125, -1.33966064453125, -1.2113037109375, -1.08294677734375, -0.95458984375, -0.82623291015625, -0.6978759765625, -0.56951904296875, -0.441162109375, -0.31280517578125, -0.1844482421875, -0.05609130859375, 0.072265625, 0.20062255859375, 0.3289794921875, 0.45733642578125, 0.585693359375, 0.71405029296875, 0.8424072265625, 0.97076416015625, 1.09912109375, 1.22747802734375, 1.3558349609375, 1.48419189453125, 1.612548828125, 1.74090576171875, 1.8692626953125, 1.99761962890625, 2.1259765625, 2.25433349609375, 2.3826904296875, 2.51104736328125, 2.639404296875, 2.76776123046875, 2.8961181640625, 3.02447509765625, 3.15283203125, 3.28118896484375, 3.4095458984375, 3.53790283203125, 3.666259765625, 3.79461669921875, 3.9229736328125, 4.05133056640625, 4.1796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 14.0, 11.0, 18.0, 19.0, 20.0, 17.0, 21.0, 25.0, 28.0, 42.0, 36.0, 44.0, 54.0, 71.0, 86.0, 188.0, 1519.0, 252.0, 113.0, 74.0, 43.0, 40.0, 36.0, 42.0, 33.0, 26.0, 17.0, 28.0, 15.0, 18.0, 18.0, 17.0, 9.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3260498046875, -9.011474609375, -8.6968994140625, -8.38232421875, -8.0677490234375, -7.753173828125, -7.4385986328125, -7.1240234375, -6.8094482421875, -6.494873046875, -6.1802978515625, -5.86572265625, -5.5511474609375, -5.236572265625, -4.9219970703125, -4.607421875, -4.2928466796875, -3.978271484375, -3.6636962890625, -3.34912109375, -3.0345458984375, -2.719970703125, -2.4053955078125, -2.0908203125, -1.7762451171875, -1.461669921875, -1.1470947265625, -0.83251953125, -0.5179443359375, -0.203369140625, 0.1112060546875, 0.42578125, 0.7403564453125, 1.054931640625, 1.3695068359375, 1.68408203125, 1.9986572265625, 2.313232421875, 2.6278076171875, 2.9423828125, 3.2569580078125, 3.571533203125, 3.8861083984375, 4.20068359375, 4.5152587890625, 4.829833984375, 5.1444091796875, 5.458984375, 5.7735595703125, 6.088134765625, 6.4027099609375, 6.71728515625, 7.0318603515625, 7.346435546875, 7.6610107421875, 7.9755859375, 8.2901611328125, 8.604736328125, 8.9193115234375, 9.23388671875, 9.5484619140625, 9.863037109375, 10.1776123046875, 10.4921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 5.0, 1.0, 4.0, 16.0, 15.0, 13.0, 21.0, 24.0, 33.0, 51.0, 59.0, 98.0, 140.0, 264.0, 452.0, 1064.0, 3451.0, 19201.0, 2195394.0, 904992.0, 15230.0, 3020.0, 996.0, 448.0, 257.0, 128.0, 84.0, 53.0, 41.0, 24.0, 32.0, 20.0, 18.0, 11.0, 11.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.862548828125, -21.17822265625, -20.493896484375, -19.8095703125, -19.125244140625, -18.44091796875, -17.756591796875, -17.072265625, -16.387939453125, -15.70361328125, -15.019287109375, -14.3349609375, -13.650634765625, -12.96630859375, -12.281982421875, -11.59765625, -10.913330078125, -10.22900390625, -9.544677734375, -8.8603515625, -8.176025390625, -7.49169921875, -6.807373046875, -6.123046875, -5.438720703125, -4.75439453125, -4.070068359375, -3.3857421875, -2.701416015625, -2.01708984375, -1.332763671875, -0.6484375, 0.035888671875, 0.72021484375, 1.404541015625, 2.0888671875, 2.773193359375, 3.45751953125, 4.141845703125, 4.826171875, 5.510498046875, 6.19482421875, 6.879150390625, 7.5634765625, 8.247802734375, 8.93212890625, 9.616455078125, 10.30078125, 10.985107421875, 11.66943359375, 12.353759765625, 13.0380859375, 13.722412109375, 14.40673828125, 15.091064453125, 15.775390625, 16.459716796875, 17.14404296875, 17.828369140625, 18.5126953125, 19.197021484375, 19.88134765625, 20.565673828125, 21.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 18.0, 144.0, 530.0, 269.0, 47.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.36990737915039, -17.147403717041016, -14.924901962280273, -12.702398300170898, -10.47989559173584, -8.257392883300781, -6.034889221191406, -3.8123865127563477, -1.589883804321289, 0.6326191425323486, 2.8551220893859863, 5.077625274658203, 7.300127983093262, 9.52263069152832, 11.745134353637695, 13.967637062072754, 16.190139770507812, 18.412643432617188, 20.63514518737793, 22.857648849487305, 25.080150604248047, 27.302654266357422, 29.525157928466797, 31.747661590576172, 33.97016143798828, 36.192665100097656, 38.41516876220703, 40.637672424316406, 42.860172271728516, 45.08267593383789, 47.305179595947266, 49.52768325805664, 51.75018310546875, 53.972686767578125, 56.1951904296875, 58.417694091796875, 60.640193939208984, 62.86269760131836, 65.085205078125, 67.30770111083984, 69.53020477294922, 71.7527084350586, 73.97521209716797, 76.19771575927734, 78.42021942138672, 80.64271545410156, 82.86521911621094, 85.08772277832031, 87.31022644042969, 89.53273010253906, 91.75523376464844, 93.97773742675781, 96.20024108886719, 98.42274475097656, 100.64524841308594, 102.86774444580078, 105.09025573730469, 107.31275939941406, 109.53526306152344, 111.75776672363281, 113.98027038574219, 116.20277404785156, 118.42527770996094, 120.64777374267578, 122.87027740478516]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 20.0, 17.0, 36.0, 32.0, 45.0, 33.0, 41.0, 43.0, 46.0, 43.0, 32.0, 35.0, 31.0, 46.0, 34.0, 42.0, 30.0, 40.0, 31.0, 29.0, 24.0, 21.0, 22.0, 18.0, 16.0, 20.0, 6.0, 8.0, 3.0, 7.0, 8.0, 10.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.262863159179688, -22.507118225097656, -21.751375198364258, -20.995630264282227, -20.239887237548828, -19.484142303466797, -18.728397369384766, -17.972652435302734, -17.216909408569336, -16.461164474487305, -15.705421447753906, -14.949676513671875, -14.19393253326416, -13.438188552856445, -12.682443618774414, -11.9266996383667, -11.170955657958984, -10.41521167755127, -9.659467697143555, -8.903722763061523, -8.147978782653809, -7.392234802246094, -6.636490345001221, -5.880745887756348, -5.125001907348633, -4.369257926940918, -3.613513469696045, -2.857769250869751, -2.102025032043457, -1.346280813217163, -0.5905365943908691, 0.1652078628540039, 0.9209537506103516, 1.6766979694366455, 2.4324421882629395, 3.1881864070892334, 3.9439306259155273, 4.699674606323242, 5.455419063568115, 6.211163520812988, 6.966907501220703, 7.722651481628418, 8.478395462036133, 9.234140396118164, 9.989884376525879, 10.745628356933594, 11.501373291015625, 12.25711727142334, 13.012861251831055, 13.76860523223877, 14.524349212646484, 15.280094146728516, 16.035839080810547, 16.791582107543945, 17.547327041625977, 18.303070068359375, 19.058815002441406, 19.814559936523438, 20.570302963256836, 21.326047897338867, 22.081790924072266, 22.837535858154297, 23.593280792236328, 24.34902572631836, 25.104768753051758]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 9.0, 8.0, 9.0, 15.0, 20.0, 30.0, 30.0, 18.0, 27.0, 41.0, 49.0, 49.0, 41.0, 36.0, 49.0, 37.0, 55.0, 49.0, 54.0, 39.0, 39.0, 38.0, 24.0, 35.0, 34.0, 21.0, 16.0, 29.0, 16.0, 16.0, 6.0, 13.0, 4.0, 5.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.56536865234375, -3.4569091796875, -3.34844970703125, -3.239990234375, -3.13153076171875, -3.0230712890625, -2.91461181640625, -2.80615234375, -2.69769287109375, -2.5892333984375, -2.48077392578125, -2.372314453125, -2.26385498046875, -2.1553955078125, -2.04693603515625, -1.9384765625, -1.83001708984375, -1.7215576171875, -1.61309814453125, -1.504638671875, -1.39617919921875, -1.2877197265625, -1.17926025390625, -1.07080078125, -0.96234130859375, -0.8538818359375, -0.74542236328125, -0.636962890625, -0.52850341796875, -0.4200439453125, -0.31158447265625, -0.203125, -0.09466552734375, 0.0137939453125, 0.12225341796875, 0.230712890625, 0.33917236328125, 0.4476318359375, 0.55609130859375, 0.66455078125, 0.77301025390625, 0.8814697265625, 0.98992919921875, 1.098388671875, 1.20684814453125, 1.3153076171875, 1.42376708984375, 1.5322265625, 1.64068603515625, 1.7491455078125, 1.85760498046875, 1.966064453125, 2.07452392578125, 2.1829833984375, 2.29144287109375, 2.39990234375, 2.50836181640625, 2.6168212890625, 2.72528076171875, 2.833740234375, 2.94219970703125, 3.0506591796875, 3.15911865234375, 3.267578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 5.0, 12.0, 14.0, 17.0, 24.0, 63.0, 60.0, 85.0, 135.0, 167.0, 301.0, 378.0, 576.0, 896.0, 1258.0, 1973.0, 3147.0, 4918.0, 8280.0, 14262.0, 27191.0, 58618.0, 190281.0, 1178063.0, 2135071.0, 395863.0, 89187.0, 36980.0, 18682.0, 10697.0, 6093.0, 3855.0, 2438.0, 1602.0, 1006.0, 699.0, 436.0, 323.0, 187.0, 131.0, 103.0, 61.0, 50.0, 28.0, 17.0, 12.0, 15.0, 5.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.21875, -6.02569580078125, -5.8326416015625, -5.63958740234375, -5.446533203125, -5.25347900390625, -5.0604248046875, -4.86737060546875, -4.67431640625, -4.48126220703125, -4.2882080078125, -4.09515380859375, -3.902099609375, -3.70904541015625, -3.5159912109375, -3.32293701171875, -3.1298828125, -2.93682861328125, -2.7437744140625, -2.55072021484375, -2.357666015625, -2.16461181640625, -1.9715576171875, -1.77850341796875, -1.58544921875, -1.39239501953125, -1.1993408203125, -1.00628662109375, -0.813232421875, -0.62017822265625, -0.4271240234375, -0.23406982421875, -0.041015625, 0.15203857421875, 0.3450927734375, 0.53814697265625, 0.731201171875, 0.92425537109375, 1.1173095703125, 1.31036376953125, 1.50341796875, 1.69647216796875, 1.8895263671875, 2.08258056640625, 2.275634765625, 2.46868896484375, 2.6617431640625, 2.85479736328125, 3.0478515625, 3.24090576171875, 3.4339599609375, 3.62701416015625, 3.820068359375, 4.01312255859375, 4.2061767578125, 4.39923095703125, 4.59228515625, 4.78533935546875, 4.9783935546875, 5.17144775390625, 5.364501953125, 5.55755615234375, 5.7506103515625, 5.94366455078125, 6.13671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 1.0, 8.0, 7.0, 5.0, 8.0, 11.0, 13.0, 12.0, 31.0, 22.0, 37.0, 43.0, 47.0, 50.0, 58.0, 67.0, 97.0, 135.0, 215.0, 341.0, 470.0, 619.0, 471.0, 355.0, 237.0, 178.0, 116.0, 84.0, 63.0, 56.0, 32.0, 40.0, 23.0, 19.0, 16.0, 17.0, 13.0, 13.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-6.87109375, -6.67791748046875, -6.4847412109375, -6.29156494140625, -6.098388671875, -5.90521240234375, -5.7120361328125, -5.51885986328125, -5.32568359375, -5.13250732421875, -4.9393310546875, -4.74615478515625, -4.552978515625, -4.35980224609375, -4.1666259765625, -3.97344970703125, -3.7802734375, -3.58709716796875, -3.3939208984375, -3.20074462890625, -3.007568359375, -2.81439208984375, -2.6212158203125, -2.42803955078125, -2.23486328125, -2.04168701171875, -1.8485107421875, -1.65533447265625, -1.462158203125, -1.26898193359375, -1.0758056640625, -0.88262939453125, -0.689453125, -0.49627685546875, -0.3031005859375, -0.10992431640625, 0.083251953125, 0.27642822265625, 0.4696044921875, 0.66278076171875, 0.85595703125, 1.04913330078125, 1.2423095703125, 1.43548583984375, 1.628662109375, 1.82183837890625, 2.0150146484375, 2.20819091796875, 2.4013671875, 2.59454345703125, 2.7877197265625, 2.98089599609375, 3.174072265625, 3.36724853515625, 3.5604248046875, 3.75360107421875, 3.94677734375, 4.13995361328125, 4.3331298828125, 4.52630615234375, 4.719482421875, 4.91265869140625, 5.1058349609375, 5.29901123046875, 5.4921875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 20.0, 10.0, 22.0, 26.0, 38.0, 46.0, 68.0, 75.0, 134.0, 230.0, 643.0, 3621.0, 34842.0, 1746019.0, 2363851.0, 39242.0, 3875.0, 701.0, 237.0, 115.0, 57.0, 55.0, 48.0, 54.0, 39.0, 33.0, 24.0, 25.0, 8.0, 12.0, 7.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.485595703125, -23.61181640625, -22.738037109375, -21.8642578125, -20.990478515625, -20.11669921875, -19.242919921875, -18.369140625, -17.495361328125, -16.62158203125, -15.747802734375, -14.8740234375, -14.000244140625, -13.12646484375, -12.252685546875, -11.37890625, -10.505126953125, -9.63134765625, -8.757568359375, -7.8837890625, -7.010009765625, -6.13623046875, -5.262451171875, -4.388671875, -3.514892578125, -2.64111328125, -1.767333984375, -0.8935546875, -0.019775390625, 0.85400390625, 1.727783203125, 2.6015625, 3.475341796875, 4.34912109375, 5.222900390625, 6.0966796875, 6.970458984375, 7.84423828125, 8.718017578125, 9.591796875, 10.465576171875, 11.33935546875, 12.213134765625, 13.0869140625, 13.960693359375, 14.83447265625, 15.708251953125, 16.58203125, 17.455810546875, 18.32958984375, 19.203369140625, 20.0771484375, 20.950927734375, 21.82470703125, 22.698486328125, 23.572265625, 24.446044921875, 25.31982421875, 26.193603515625, 27.0673828125, 27.941162109375, 28.81494140625, 29.688720703125, 30.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 7.0, 19.0, 62.0, 177.0, 303.0, 284.0, 115.0, 35.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.066129684448242, -24.87198829650879, -21.677846908569336, -18.48370361328125, -15.289563179016113, -12.09542179107666, -8.90127944946289, -5.7071380615234375, -2.5129966735839844, 0.6811449527740479, 3.87528657913208, 7.069428443908691, 10.263569831848145, 13.457711219787598, 16.651853561401367, 19.84599494934082, 23.040136337280273, 26.234277725219727, 29.42841911315918, 32.622562408447266, 35.81670379638672, 39.01084518432617, 42.204986572265625, 45.39912796020508, 48.59326934814453, 51.787410736083984, 54.98155212402344, 58.17569351196289, 61.369834899902344, 64.56398010253906, 67.75811767578125, 70.95226287841797, 74.14640045166016, 77.34054565429688, 80.53468322753906, 83.72882843017578, 86.92296600341797, 90.11711120605469, 93.31124877929688, 96.5053939819336, 99.69953155517578, 102.8936767578125, 106.08781433105469, 109.2819595336914, 112.4760971069336, 115.67024230957031, 118.8643798828125, 122.05852508544922, 125.25267028808594, 128.44680786132812, 131.64096069335938, 134.83509826660156, 138.02923583984375, 141.22337341308594, 144.4175262451172, 147.61166381835938, 150.80580139160156, 153.99993896484375, 157.194091796875, 160.3882293701172, 163.58236694335938, 166.77650451660156, 169.9706573486328, 173.164794921875, 176.3589324951172]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 11.0, 9.0, 12.0, 13.0, 14.0, 11.0, 15.0, 17.0, 20.0, 20.0, 23.0, 27.0, 26.0, 31.0, 43.0, 41.0, 34.0, 36.0, 48.0, 41.0, 45.0, 36.0, 42.0, 41.0, 35.0, 46.0, 34.0, 35.0, 20.0, 28.0, 27.0, 20.0, 19.0, 13.0, 15.0, 13.0, 5.0, 7.0, 16.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.957801818847656, -24.247831344604492, -23.537860870361328, -22.827890396118164, -22.117919921875, -21.407947540283203, -20.69797706604004, -19.988006591796875, -19.27803611755371, -18.568065643310547, -17.858095169067383, -17.14812469482422, -16.438152313232422, -15.728182792663574, -15.018211364746094, -14.30824089050293, -13.598270416259766, -12.888299942016602, -12.178329467773438, -11.468358039855957, -10.758387565612793, -10.048417091369629, -9.338445663452148, -8.628475189208984, -7.91850471496582, -7.208534240722656, -6.498563289642334, -5.788592338562012, -5.078621864318848, -4.368651390075684, -3.6586804389953613, -2.948709487915039, -2.238740921020508, -1.5287702083587646, -0.8187994956970215, -0.10882878303527832, 0.6011419296264648, 1.311112642288208, 2.021083354949951, 2.7310543060302734, 3.4410247802734375, 4.150995254516602, 4.860966205596924, 5.570937156677246, 6.28090763092041, 6.990878105163574, 7.7008490562438965, 8.410820007324219, 9.120790481567383, 9.830760955810547, 10.540731430053711, 11.250702857971191, 11.960673332214355, 12.67064380645752, 13.380615234375, 14.090585708618164, 14.800556182861328, 15.510526657104492, 16.220497131347656, 16.93046760559082, 17.640438079833984, 18.35041046142578, 19.060380935668945, 19.77035140991211, 20.480321884155273]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 13.0, 27.0, 14.0, 14.0, 12.0, 23.0, 21.0, 22.0, 26.0, 40.0, 33.0, 34.0, 42.0, 37.0, 30.0, 46.0, 44.0, 41.0, 41.0, 40.0, 41.0, 42.0, 33.0, 29.0, 30.0, 23.0, 30.0, 25.0, 22.0, 18.0, 16.0, 9.0, 6.0, 8.0, 10.0, 14.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.693359375, -2.60345458984375, -2.5135498046875, -2.42364501953125, -2.333740234375, -2.24383544921875, -2.1539306640625, -2.06402587890625, -1.97412109375, -1.88421630859375, -1.7943115234375, -1.70440673828125, -1.614501953125, -1.52459716796875, -1.4346923828125, -1.34478759765625, -1.2548828125, -1.16497802734375, -1.0750732421875, -0.98516845703125, -0.895263671875, -0.80535888671875, -0.7154541015625, -0.62554931640625, -0.53564453125, -0.44573974609375, -0.3558349609375, -0.26593017578125, -0.176025390625, -0.08612060546875, 0.0037841796875, 0.09368896484375, 0.18359375, 0.27349853515625, 0.3634033203125, 0.45330810546875, 0.543212890625, 0.63311767578125, 0.7230224609375, 0.81292724609375, 0.90283203125, 0.99273681640625, 1.0826416015625, 1.17254638671875, 1.262451171875, 1.35235595703125, 1.4422607421875, 1.53216552734375, 1.6220703125, 1.71197509765625, 1.8018798828125, 1.89178466796875, 1.981689453125, 2.07159423828125, 2.1614990234375, 2.25140380859375, 2.34130859375, 2.43121337890625, 2.5211181640625, 2.61102294921875, 2.700927734375, 2.79083251953125, 2.8807373046875, 2.97064208984375, 3.060546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 7.0, 16.0, 16.0, 29.0, 35.0, 49.0, 69.0, 84.0, 94.0, 148.0, 224.0, 277.0, 402.0, 473.0, 677.0, 920.0, 1292.0, 1865.0, 2634.0, 3950.0, 5825.0, 9487.0, 16601.0, 37772.0, 154652.0, 583999.0, 146131.0, 36349.0, 16044.0, 9245.0, 5997.0, 3892.0, 2644.0, 1860.0, 1322.0, 929.0, 632.0, 493.0, 388.0, 282.0, 198.0, 146.0, 100.0, 83.0, 54.0, 45.0, 34.0, 26.0, 19.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.28515625, -4.1490478515625, -4.012939453125, -3.8768310546875, -3.74072265625, -3.6046142578125, -3.468505859375, -3.3323974609375, -3.1962890625, -3.0601806640625, -2.924072265625, -2.7879638671875, -2.65185546875, -2.5157470703125, -2.379638671875, -2.2435302734375, -2.107421875, -1.9713134765625, -1.835205078125, -1.6990966796875, -1.56298828125, -1.4268798828125, -1.290771484375, -1.1546630859375, -1.0185546875, -0.8824462890625, -0.746337890625, -0.6102294921875, -0.47412109375, -0.3380126953125, -0.201904296875, -0.0657958984375, 0.0703125, 0.2064208984375, 0.342529296875, 0.4786376953125, 0.61474609375, 0.7508544921875, 0.886962890625, 1.0230712890625, 1.1591796875, 1.2952880859375, 1.431396484375, 1.5675048828125, 1.70361328125, 1.8397216796875, 1.975830078125, 2.1119384765625, 2.248046875, 2.3841552734375, 2.520263671875, 2.6563720703125, 2.79248046875, 2.9285888671875, 3.064697265625, 3.2008056640625, 3.3369140625, 3.4730224609375, 3.609130859375, 3.7452392578125, 3.88134765625, 4.0174560546875, 4.153564453125, 4.2896728515625, 4.42578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 8.0, 12.0, 5.0, 5.0, 15.0, 14.0, 19.0, 17.0, 24.0, 27.0, 16.0, 19.0, 33.0, 39.0, 34.0, 46.0, 41.0, 35.0, 43.0, 53.0, 1056.0, 48.0, 26.0, 38.0, 30.0, 30.0, 34.0, 27.0, 36.0, 20.0, 22.0, 24.0, 24.0, 10.0, 16.0, 19.0, 12.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.994659423828125, -1.92291259765625, -1.851165771484375, -1.7794189453125, -1.707672119140625, -1.63592529296875, -1.564178466796875, -1.492431640625, -1.420684814453125, -1.34893798828125, -1.277191162109375, -1.2054443359375, -1.133697509765625, -1.06195068359375, -0.990203857421875, -0.91845703125, -0.846710205078125, -0.77496337890625, -0.703216552734375, -0.6314697265625, -0.559722900390625, -0.48797607421875, -0.416229248046875, -0.344482421875, -0.272735595703125, -0.20098876953125, -0.129241943359375, -0.0574951171875, 0.014251708984375, 0.08599853515625, 0.157745361328125, 0.2294921875, 0.301239013671875, 0.37298583984375, 0.444732666015625, 0.5164794921875, 0.588226318359375, 0.65997314453125, 0.731719970703125, 0.803466796875, 0.875213623046875, 0.94696044921875, 1.018707275390625, 1.0904541015625, 1.162200927734375, 1.23394775390625, 1.305694580078125, 1.37744140625, 1.449188232421875, 1.52093505859375, 1.592681884765625, 1.6644287109375, 1.736175537109375, 1.80792236328125, 1.879669189453125, 1.951416015625, 2.023162841796875, 2.09490966796875, 2.166656494140625, 2.2384033203125, 2.310150146484375, 2.38189697265625, 2.453643798828125, 2.525390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 16.0, 11.0, 33.0, 48.0, 53.0, 93.0, 132.0, 176.0, 299.0, 468.0, 711.0, 1036.0, 1813.0, 3119.0, 5679.0, 11993.0, 30723.0, 148886.0, 1647846.0, 182442.0, 34334.0, 12759.0, 5995.0, 3323.0, 1860.0, 1154.0, 713.0, 430.0, 306.0, 200.0, 133.0, 83.0, 66.0, 47.0, 32.0, 27.0, 16.0, 16.0, 11.0, 1.0, 0.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.912109375, -3.784027099609375, -3.65594482421875, -3.527862548828125, -3.3997802734375, -3.271697998046875, -3.14361572265625, -3.015533447265625, -2.887451171875, -2.759368896484375, -2.63128662109375, -2.503204345703125, -2.3751220703125, -2.247039794921875, -2.11895751953125, -1.990875244140625, -1.86279296875, -1.734710693359375, -1.60662841796875, -1.478546142578125, -1.3504638671875, -1.222381591796875, -1.09429931640625, -0.966217041015625, -0.838134765625, -0.710052490234375, -0.58197021484375, -0.453887939453125, -0.3258056640625, -0.197723388671875, -0.06964111328125, 0.058441162109375, 0.1865234375, 0.314605712890625, 0.44268798828125, 0.570770263671875, 0.6988525390625, 0.826934814453125, 0.95501708984375, 1.083099365234375, 1.211181640625, 1.339263916015625, 1.46734619140625, 1.595428466796875, 1.7235107421875, 1.851593017578125, 1.97967529296875, 2.107757568359375, 2.23583984375, 2.363922119140625, 2.49200439453125, 2.620086669921875, 2.7481689453125, 2.876251220703125, 3.00433349609375, 3.132415771484375, 3.260498046875, 3.388580322265625, 3.51666259765625, 3.644744873046875, 3.7728271484375, 3.900909423828125, 4.02899169921875, 4.157073974609375, 4.28515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 17.0, 21.0, 26.0, 55.0, 120.0, 227.0, 259.0, 106.0, 39.0, 29.0, 21.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4947509765625, -1.449462890625, -1.4041748046875, -1.35888671875, -1.3135986328125, -1.268310546875, -1.2230224609375, -1.177734375, -1.1324462890625, -1.087158203125, -1.0418701171875, -0.99658203125, -0.9512939453125, -0.906005859375, -0.8607177734375, -0.8154296875, -0.7701416015625, -0.724853515625, -0.6795654296875, -0.63427734375, -0.5889892578125, -0.543701171875, -0.4984130859375, -0.453125, -0.4078369140625, -0.362548828125, -0.3172607421875, -0.27197265625, -0.2266845703125, -0.181396484375, -0.1361083984375, -0.0908203125, -0.0455322265625, -0.000244140625, 0.0450439453125, 0.09033203125, 0.1356201171875, 0.180908203125, 0.2261962890625, 0.271484375, 0.3167724609375, 0.362060546875, 0.4073486328125, 0.45263671875, 0.4979248046875, 0.543212890625, 0.5885009765625, 0.6337890625, 0.6790771484375, 0.724365234375, 0.7696533203125, 0.81494140625, 0.8602294921875, 0.905517578125, 0.9508056640625, 0.99609375, 1.0413818359375, 1.086669921875, 1.1319580078125, 1.17724609375, 1.2225341796875, 1.267822265625, 1.3131103515625, 1.3583984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 25.0, 32.0, 68.0, 122.0, 958.0, 83425.0, 961860.0, 1660.0, 192.0, 64.0, 43.0, 23.0, 13.0, 14.0, 5.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.828125, -26.9033203125, -25.978515625, -25.0537109375, -24.12890625, -23.2041015625, -22.279296875, -21.3544921875, -20.4296875, -19.5048828125, -18.580078125, -17.6552734375, -16.73046875, -15.8056640625, -14.880859375, -13.9560546875, -13.03125, -12.1064453125, -11.181640625, -10.2568359375, -9.33203125, -8.4072265625, -7.482421875, -6.5576171875, -5.6328125, -4.7080078125, -3.783203125, -2.8583984375, -1.93359375, -1.0087890625, -0.083984375, 0.8408203125, 1.765625, 2.6904296875, 3.615234375, 4.5400390625, 5.46484375, 6.3896484375, 7.314453125, 8.2392578125, 9.1640625, 10.0888671875, 11.013671875, 11.9384765625, 12.86328125, 13.7880859375, 14.712890625, 15.6376953125, 16.5625, 17.4873046875, 18.412109375, 19.3369140625, 20.26171875, 21.1865234375, 22.111328125, 23.0361328125, 23.9609375, 24.8857421875, 25.810546875, 26.7353515625, 27.66015625, 28.5849609375, 29.509765625, 30.4345703125, 31.359375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 9.0, 12.0, 13.0, 22.0, 32.0, 60.0, 84.0, 113.0, 152.0, 157.0, 129.0, 81.0, 51.0, 38.0, 24.0, 15.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.998117208480835, -1.9491727352142334, -1.9002282619476318, -1.8512837886810303, -1.8023391962051392, -1.7533947229385376, -1.704450249671936, -1.6555057764053345, -1.6065611839294434, -1.5576167106628418, -1.5086722373962402, -1.4597277641296387, -1.4107831716537476, -1.361838698387146, -1.3128942251205444, -1.2639497518539429, -1.2150052785873413, -1.1660608053207397, -1.1171163320541382, -1.068171739578247, -1.0192272663116455, -0.970282793045044, -0.9213383197784424, -0.8723938465118408, -0.8234493136405945, -0.7745048403739929, -0.7255603075027466, -0.676615834236145, -0.6276713609695435, -0.5787268280982971, -0.5297823548316956, -0.4808378517627716, -0.4318934679031372, -0.38294896483421326, -0.3340044617652893, -0.28505998849868774, -0.2361154854297638, -0.18717098236083984, -0.13822650909423828, -0.08928200602531433, -0.04033750295639038, 0.008606992661952972, 0.057551488280296326, 0.10649597644805908, 0.15544047951698303, 0.20438498258590698, 0.25332945585250854, 0.3022739589214325, 0.35121846199035645, 0.4001629650592804, 0.44910746812820435, 0.4980519413948059, 0.5469964742660522, 0.5959409475326538, 0.6448854207992554, 0.6938298940658569, 0.7427744269371033, 0.7917189002037048, 0.8406634330749512, 0.8896079063415527, 0.9385523796081543, 0.9874969124794006, 1.0364413261413574, 1.0853859186172485, 1.13433039188385]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 17.0, 16.0, 9.0, 13.0, 21.0, 22.0, 29.0, 34.0, 40.0, 38.0, 33.0, 34.0, 44.0, 39.0, 37.0, 42.0, 38.0, 45.0, 38.0, 39.0, 42.0, 30.0, 36.0, 26.0, 27.0, 25.0, 25.0, 23.0, 24.0, 20.0, 12.0, 12.0, 10.0, 3.0, 8.0, 7.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8735390901565552, -0.8446713089942932, -0.8158035278320312, -0.7869357466697693, -0.7580679655075073, -0.7292001843452454, -0.7003324031829834, -0.6714646816253662, -0.6425968408584595, -0.6137290596961975, -0.5848612785339355, -0.5559934973716736, -0.5271257162094116, -0.49825793504714966, -0.4693901836872101, -0.4405224025249481, -0.41165465116500854, -0.3827868700027466, -0.3539190888404846, -0.32505130767822266, -0.2961835265159607, -0.26731574535369873, -0.23844799399375916, -0.2095802128314972, -0.18071243166923523, -0.15184465050697327, -0.1229768767952919, -0.09410910308361053, -0.06524132192134857, -0.03637354075908661, -0.00750577449798584, 0.021362006664276123, 0.05022972822189331, 0.07909750938415527, 0.10796528309583664, 0.136833056807518, 0.16570083796977997, 0.19456861913204193, 0.2234363853931427, 0.25230416655540466, 0.2811719477176666, 0.3100397288799286, 0.33890751004219055, 0.3677752614021301, 0.3966430425643921, 0.42551082372665405, 0.454378604888916, 0.483246386051178, 0.5121141672134399, 0.5409819483757019, 0.5698497295379639, 0.5987175107002258, 0.6275852918624878, 0.6564530730247498, 0.6853208541870117, 0.7141885757446289, 0.7430564165115356, 0.7719241976737976, 0.8007919788360596, 0.8296597599983215, 0.8585275411605835, 0.8873953223228455, 0.9162631034851074, 0.9451308250427246, 0.9739986062049866]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 9.0, 11.0, 9.0, 12.0, 20.0, 18.0, 14.0, 20.0, 29.0, 26.0, 40.0, 35.0, 35.0, 35.0, 37.0, 33.0, 37.0, 36.0, 48.0, 40.0, 41.0, 45.0, 38.0, 39.0, 26.0, 21.0, 24.0, 29.0, 26.0, 22.0, 23.0, 14.0, 13.0, 15.0, 10.0, 15.0, 6.0, 13.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.701171875, -2.612457275390625, -2.52374267578125, -2.435028076171875, -2.3463134765625, -2.257598876953125, -2.16888427734375, -2.080169677734375, -1.991455078125, -1.902740478515625, -1.81402587890625, -1.725311279296875, -1.6365966796875, -1.547882080078125, -1.45916748046875, -1.370452880859375, -1.28173828125, -1.193023681640625, -1.10430908203125, -1.015594482421875, -0.9268798828125, -0.838165283203125, -0.74945068359375, -0.660736083984375, -0.572021484375, -0.483306884765625, -0.39459228515625, -0.305877685546875, -0.2171630859375, -0.128448486328125, -0.03973388671875, 0.048980712890625, 0.1376953125, 0.226409912109375, 0.31512451171875, 0.403839111328125, 0.4925537109375, 0.581268310546875, 0.66998291015625, 0.758697509765625, 0.847412109375, 0.936126708984375, 1.02484130859375, 1.113555908203125, 1.2022705078125, 1.290985107421875, 1.37969970703125, 1.468414306640625, 1.55712890625, 1.645843505859375, 1.73455810546875, 1.823272705078125, 1.9119873046875, 2.000701904296875, 2.08941650390625, 2.178131103515625, 2.266845703125, 2.355560302734375, 2.44427490234375, 2.532989501953125, 2.6217041015625, 2.710418701171875, 2.79913330078125, 2.887847900390625, 2.9765625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 13.0, 13.0, 14.0, 31.0, 31.0, 45.0, 50.0, 88.0, 110.0, 166.0, 230.0, 340.0, 570.0, 924.0, 1490.0, 2540.0, 4654.0, 8524.0, 18114.0, 52040.0, 378990.0, 479591.0, 59370.0, 19580.0, 9064.0, 4827.0, 2697.0, 1600.0, 925.0, 635.0, 391.0, 263.0, 152.0, 102.0, 100.0, 64.0, 47.0, 34.0, 29.0, 20.0, 21.0, 11.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.828125, -5.6341552734375, -5.440185546875, -5.2462158203125, -5.05224609375, -4.8582763671875, -4.664306640625, -4.4703369140625, -4.2763671875, -4.0823974609375, -3.888427734375, -3.6944580078125, -3.50048828125, -3.3065185546875, -3.112548828125, -2.9185791015625, -2.724609375, -2.5306396484375, -2.336669921875, -2.1427001953125, -1.94873046875, -1.7547607421875, -1.560791015625, -1.3668212890625, -1.1728515625, -0.9788818359375, -0.784912109375, -0.5909423828125, -0.39697265625, -0.2030029296875, -0.009033203125, 0.1849365234375, 0.37890625, 0.5728759765625, 0.766845703125, 0.9608154296875, 1.15478515625, 1.3487548828125, 1.542724609375, 1.7366943359375, 1.9306640625, 2.1246337890625, 2.318603515625, 2.5125732421875, 2.70654296875, 2.9005126953125, 3.094482421875, 3.2884521484375, 3.482421875, 3.6763916015625, 3.870361328125, 4.0643310546875, 4.25830078125, 4.4522705078125, 4.646240234375, 4.8402099609375, 5.0341796875, 5.2281494140625, 5.422119140625, 5.6160888671875, 5.81005859375, 6.0040283203125, 6.197998046875, 6.3919677734375, 6.5859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 9.0, 24.0, 20.0, 22.0, 34.0, 26.0, 23.0, 41.0, 50.0, 44.0, 77.0, 108.0, 146.0, 1509.0, 261.0, 119.0, 90.0, 74.0, 50.0, 47.0, 35.0, 37.0, 29.0, 25.0, 18.0, 19.0, 10.0, 13.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.3359375, -11.970703125, -11.60546875, -11.240234375, -10.875, -10.509765625, -10.14453125, -9.779296875, -9.4140625, -9.048828125, -8.68359375, -8.318359375, -7.953125, -7.587890625, -7.22265625, -6.857421875, -6.4921875, -6.126953125, -5.76171875, -5.396484375, -5.03125, -4.666015625, -4.30078125, -3.935546875, -3.5703125, -3.205078125, -2.83984375, -2.474609375, -2.109375, -1.744140625, -1.37890625, -1.013671875, -0.6484375, -0.283203125, 0.08203125, 0.447265625, 0.8125, 1.177734375, 1.54296875, 1.908203125, 2.2734375, 2.638671875, 3.00390625, 3.369140625, 3.734375, 4.099609375, 4.46484375, 4.830078125, 5.1953125, 5.560546875, 5.92578125, 6.291015625, 6.65625, 7.021484375, 7.38671875, 7.751953125, 8.1171875, 8.482421875, 8.84765625, 9.212890625, 9.578125, 9.943359375, 10.30859375, 10.673828125, 11.0390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 7.0, 11.0, 15.0, 8.0, 19.0, 26.0, 32.0, 38.0, 53.0, 64.0, 74.0, 125.0, 159.0, 286.0, 828.0, 5503.0, 84324.0, 2962562.0, 84260.0, 5558.0, 833.0, 266.0, 156.0, 120.0, 95.0, 52.0, 53.0, 37.0, 28.0, 25.0, 22.0, 10.0, 13.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.182861328125, -22.39697265625, -21.611083984375, -20.8251953125, -20.039306640625, -19.25341796875, -18.467529296875, -17.681640625, -16.895751953125, -16.10986328125, -15.323974609375, -14.5380859375, -13.752197265625, -12.96630859375, -12.180419921875, -11.39453125, -10.608642578125, -9.82275390625, -9.036865234375, -8.2509765625, -7.465087890625, -6.67919921875, -5.893310546875, -5.107421875, -4.321533203125, -3.53564453125, -2.749755859375, -1.9638671875, -1.177978515625, -0.39208984375, 0.393798828125, 1.1796875, 1.965576171875, 2.75146484375, 3.537353515625, 4.3232421875, 5.109130859375, 5.89501953125, 6.680908203125, 7.466796875, 8.252685546875, 9.03857421875, 9.824462890625, 10.6103515625, 11.396240234375, 12.18212890625, 12.968017578125, 13.75390625, 14.539794921875, 15.32568359375, 16.111572265625, 16.8974609375, 17.683349609375, 18.46923828125, 19.255126953125, 20.041015625, 20.826904296875, 21.61279296875, 22.398681640625, 23.1845703125, 23.970458984375, 24.75634765625, 25.542236328125, 26.328125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 35.0, 102.0, 329.0, 366.0, 138.0, 34.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.385540008544922, -27.14822769165039, -24.91091537475586, -22.673603057861328, -20.436290740966797, -18.198978424072266, -15.961664199829102, -13.72435188293457, -11.487039566040039, -9.249727249145508, -7.012414455413818, -4.775101661682129, -2.5377893447875977, -0.3004770278930664, 1.9368362426757812, 4.1741485595703125, 6.411460876464844, 8.648773193359375, 10.886085510253906, 13.123398780822754, 15.360711097717285, 17.5980224609375, 19.835336685180664, 22.072649002075195, 24.309961318969727, 26.547273635864258, 28.78458595275879, 31.021900177001953, 33.259212493896484, 35.496524810791016, 37.73383712768555, 39.97114944458008, 42.208457946777344, 44.445770263671875, 46.683082580566406, 48.92039489746094, 51.15770721435547, 53.39501953125, 55.63233184814453, 57.86964416503906, 60.106956481933594, 62.344268798828125, 64.58158111572266, 66.81889343261719, 69.05620574951172, 71.29351806640625, 73.53083038330078, 75.76814270019531, 78.00546264648438, 80.2427749633789, 82.48008728027344, 84.71739959716797, 86.9547119140625, 89.19202423095703, 91.42933654785156, 93.6666488647461, 95.90396118164062, 98.14127349853516, 100.37858581542969, 102.61589813232422, 104.85321044921875, 107.09052276611328, 109.32783508300781, 111.56514739990234, 113.80245971679688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 4.0, 6.0, 7.0, 7.0, 11.0, 14.0, 7.0, 14.0, 21.0, 18.0, 16.0, 28.0, 30.0, 24.0, 34.0, 35.0, 38.0, 44.0, 33.0, 48.0, 43.0, 47.0, 40.0, 43.0, 43.0, 33.0, 40.0, 40.0, 31.0, 41.0, 43.0, 19.0, 12.0, 16.0, 10.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.859025955200195, -28.9013614654541, -27.94369888305664, -26.986034393310547, -26.028371810913086, -25.070707321166992, -24.11304473876953, -23.155380249023438, -22.197715759277344, -21.24005126953125, -20.28238868713379, -19.324724197387695, -18.367061614990234, -17.40939712524414, -16.451732635498047, -15.494070053100586, -14.536407470703125, -13.578743934631348, -12.62108039855957, -11.663415908813477, -10.705753326416016, -9.748088836669922, -8.790425300598145, -7.832761764526367, -6.87509822845459, -5.9174346923828125, -4.959771156311035, -4.0021071434021, -3.0444436073303223, -2.086780071258545, -1.1291160583496094, -0.17145252227783203, 0.7862110137939453, 1.7438746690750122, 2.701538324356079, 3.6592020988464355, 4.616865634918213, 5.57452917098999, 6.532193183898926, 7.489856719970703, 8.44752025604248, 9.405183792114258, 10.362847328186035, 11.320510864257812, 12.278175354003906, 13.235837936401367, 14.193502426147461, 15.151165962219238, 16.108829498291016, 17.06649398803711, 18.02415657043457, 18.981821060180664, 19.939483642578125, 20.89714813232422, 21.854812622070312, 22.812475204467773, 23.770137786865234, 24.727802276611328, 25.68546485900879, 26.643129348754883, 27.600791931152344, 28.558456420898438, 29.51612091064453, 30.473783493041992, 31.431447982788086]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 7.0, 11.0, 13.0, 14.0, 17.0, 15.0, 19.0, 23.0, 27.0, 22.0, 23.0, 38.0, 34.0, 32.0, 35.0, 40.0, 32.0, 39.0, 53.0, 34.0, 43.0, 56.0, 47.0, 29.0, 21.0, 36.0, 22.0, 34.0, 27.0, 24.0, 21.0, 23.0, 13.0, 15.0, 12.0, 10.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.938720703125, -2.83642578125, -2.734130859375, -2.6318359375, -2.529541015625, -2.42724609375, -2.324951171875, -2.22265625, -2.120361328125, -2.01806640625, -1.915771484375, -1.8134765625, -1.711181640625, -1.60888671875, -1.506591796875, -1.404296875, -1.302001953125, -1.19970703125, -1.097412109375, -0.9951171875, -0.892822265625, -0.79052734375, -0.688232421875, -0.5859375, -0.483642578125, -0.38134765625, -0.279052734375, -0.1767578125, -0.074462890625, 0.02783203125, 0.130126953125, 0.232421875, 0.334716796875, 0.43701171875, 0.539306640625, 0.6416015625, 0.743896484375, 0.84619140625, 0.948486328125, 1.05078125, 1.153076171875, 1.25537109375, 1.357666015625, 1.4599609375, 1.562255859375, 1.66455078125, 1.766845703125, 1.869140625, 1.971435546875, 2.07373046875, 2.176025390625, 2.2783203125, 2.380615234375, 2.48291015625, 2.585205078125, 2.6875, 2.789794921875, 2.89208984375, 2.994384765625, 3.0966796875, 3.198974609375, 3.30126953125, 3.403564453125, 3.505859375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 6.0, 9.0, 11.0, 11.0, 15.0, 30.0, 34.0, 63.0, 83.0, 111.0, 136.0, 191.0, 298.0, 420.0, 735.0, 1224.0, 2267.0, 4365.0, 9227.0, 21311.0, 62264.0, 451353.0, 2985198.0, 542965.0, 68253.0, 23040.0, 9962.0, 4723.0, 2315.0, 1304.0, 761.0, 502.0, 311.0, 232.0, 153.0, 93.0, 74.0, 61.0, 37.0, 32.0, 30.0, 12.0, 17.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.2109375, -8.9188232421875, -8.626708984375, -8.3345947265625, -8.04248046875, -7.7503662109375, -7.458251953125, -7.1661376953125, -6.8740234375, -6.5819091796875, -6.289794921875, -5.9976806640625, -5.70556640625, -5.4134521484375, -5.121337890625, -4.8292236328125, -4.537109375, -4.2449951171875, -3.952880859375, -3.6607666015625, -3.36865234375, -3.0765380859375, -2.784423828125, -2.4923095703125, -2.2001953125, -1.9080810546875, -1.615966796875, -1.3238525390625, -1.03173828125, -0.7396240234375, -0.447509765625, -0.1553955078125, 0.13671875, 0.4288330078125, 0.720947265625, 1.0130615234375, 1.30517578125, 1.5972900390625, 1.889404296875, 2.1815185546875, 2.4736328125, 2.7657470703125, 3.057861328125, 3.3499755859375, 3.64208984375, 3.9342041015625, 4.226318359375, 4.5184326171875, 4.810546875, 5.1026611328125, 5.394775390625, 5.6868896484375, 5.97900390625, 6.2711181640625, 6.563232421875, 6.8553466796875, 7.1474609375, 7.4395751953125, 7.731689453125, 8.0238037109375, 8.31591796875, 8.6080322265625, 8.900146484375, 9.1922607421875, 9.484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 4.0, 4.0, 8.0, 13.0, 22.0, 27.0, 25.0, 26.0, 43.0, 67.0, 79.0, 81.0, 148.0, 200.0, 350.0, 557.0, 701.0, 543.0, 343.0, 241.0, 125.0, 100.0, 76.0, 64.0, 47.0, 41.0, 31.0, 18.0, 16.0, 9.0, 14.0, 9.0, 10.0, 11.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.15203857421875, -6.9251708984375, -6.69830322265625, -6.471435546875, -6.24456787109375, -6.0177001953125, -5.79083251953125, -5.56396484375, -5.33709716796875, -5.1102294921875, -4.88336181640625, -4.656494140625, -4.42962646484375, -4.2027587890625, -3.97589111328125, -3.7490234375, -3.52215576171875, -3.2952880859375, -3.06842041015625, -2.841552734375, -2.61468505859375, -2.3878173828125, -2.16094970703125, -1.93408203125, -1.70721435546875, -1.4803466796875, -1.25347900390625, -1.026611328125, -0.79974365234375, -0.5728759765625, -0.34600830078125, -0.119140625, 0.10772705078125, 0.3345947265625, 0.56146240234375, 0.788330078125, 1.01519775390625, 1.2420654296875, 1.46893310546875, 1.69580078125, 1.92266845703125, 2.1495361328125, 2.37640380859375, 2.603271484375, 2.83013916015625, 3.0570068359375, 3.28387451171875, 3.5107421875, 3.73760986328125, 3.9644775390625, 4.19134521484375, 4.418212890625, 4.64508056640625, 4.8719482421875, 5.09881591796875, 5.32568359375, 5.55255126953125, 5.7794189453125, 6.00628662109375, 6.233154296875, 6.46002197265625, 6.6868896484375, 6.91375732421875, 7.140625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 9.0, 16.0, 8.0, 21.0, 20.0, 28.0, 41.0, 50.0, 70.0, 71.0, 136.0, 256.0, 854.0, 5022.0, 82183.0, 3880748.0, 213433.0, 9246.0, 1175.0, 328.0, 144.0, 107.0, 80.0, 43.0, 35.0, 27.0, 21.0, 24.0, 23.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.90625, -29.928955078125, -28.95166015625, -27.974365234375, -26.9970703125, -26.019775390625, -25.04248046875, -24.065185546875, -23.087890625, -22.110595703125, -21.13330078125, -20.156005859375, -19.1787109375, -18.201416015625, -17.22412109375, -16.246826171875, -15.26953125, -14.292236328125, -13.31494140625, -12.337646484375, -11.3603515625, -10.383056640625, -9.40576171875, -8.428466796875, -7.451171875, -6.473876953125, -5.49658203125, -4.519287109375, -3.5419921875, -2.564697265625, -1.58740234375, -0.610107421875, 0.3671875, 1.344482421875, 2.32177734375, 3.299072265625, 4.2763671875, 5.253662109375, 6.23095703125, 7.208251953125, 8.185546875, 9.162841796875, 10.14013671875, 11.117431640625, 12.0947265625, 13.072021484375, 14.04931640625, 15.026611328125, 16.00390625, 16.981201171875, 17.95849609375, 18.935791015625, 19.9130859375, 20.890380859375, 21.86767578125, 22.844970703125, 23.822265625, 24.799560546875, 25.77685546875, 26.754150390625, 27.7314453125, 28.708740234375, 29.68603515625, 30.663330078125, 31.640625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 13.0, 21.0, 39.0, 74.0, 139.0, 213.0, 209.0, 130.0, 80.0, 40.0, 23.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62064743041992, -52.782440185546875, -50.944236755371094, -49.10602951049805, -47.267822265625, -45.42961883544922, -43.59141159057617, -41.753204345703125, -39.915000915527344, -38.0767936706543, -36.238590240478516, -34.40038299560547, -32.56217575073242, -30.723970413208008, -28.885765075683594, -27.047557830810547, -25.2093505859375, -23.371145248413086, -21.53293800354004, -19.694732666015625, -17.856525421142578, -16.018320083618164, -14.18011474609375, -12.34190845489502, -10.503702163696289, -8.665495872497559, -6.827290058135986, -4.989084243774414, -3.1508779525756836, -1.3126716613769531, 0.5255336761474609, 2.3637399673461914, 4.201946258544922, 6.040152549743652, 7.878358364105225, 9.716564178466797, 11.554770469665527, 13.392976760864258, 15.231182098388672, 17.06938934326172, 18.907594680786133, 20.745800018310547, 22.584007263183594, 24.422212600708008, 26.260417938232422, 28.09862518310547, 29.936830520629883, 31.775035858154297, 33.613243103027344, 35.45145034790039, 37.28965377807617, 39.12786102294922, 40.966068267822266, 42.80427551269531, 44.642478942871094, 46.48068618774414, 48.31889343261719, 50.157100677490234, 51.995304107666016, 53.83351135253906, 55.67171859741211, 57.509925842285156, 59.34812927246094, 61.186336517333984, 63.024539947509766]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 12.0, 10.0, 17.0, 20.0, 15.0, 24.0, 34.0, 34.0, 42.0, 27.0, 27.0, 44.0, 56.0, 37.0, 39.0, 48.0, 42.0, 37.0, 39.0, 38.0, 33.0, 30.0, 34.0, 30.0, 32.0, 25.0, 15.0, 24.0, 22.0, 19.0, 9.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.095863342285156, -21.375322341918945, -20.6547794342041, -19.93423843383789, -19.213695526123047, -18.493154525756836, -17.772613525390625, -17.05207061767578, -16.33152961730957, -15.610987663269043, -14.890445709228516, -14.169904708862305, -13.449362754821777, -12.72882080078125, -12.008279800415039, -11.287737846374512, -10.567195892333984, -9.846653938293457, -9.12611198425293, -8.405570983886719, -7.685029029846191, -6.964487075805664, -6.243945598602295, -5.523404121398926, -4.802862167358398, -4.082320213317871, -3.361778736114502, -2.6412370204925537, -1.9206953048706055, -1.2001535892486572, -0.479611873626709, 0.24092960357666016, 0.9614734649658203, 1.6820151805877686, 2.402556896209717, 3.123098611831665, 3.8436403274536133, 4.564182281494141, 5.28472375869751, 6.005265235900879, 6.725807189941406, 7.446349143981934, 8.166891098022461, 8.887432098388672, 9.6079740524292, 10.328516006469727, 11.049057006835938, 11.769598960876465, 12.490140914916992, 13.21068286895752, 13.931224822998047, 14.651765823364258, 15.372307777404785, 16.092849731445312, 16.813390731811523, 17.533931732177734, 18.254474639892578, 18.97501564025879, 19.695558547973633, 20.416099548339844, 21.136642456054688, 21.8571834564209, 22.57772445678711, 23.298267364501953, 24.018808364868164]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 4.0, 9.0, 10.0, 16.0, 14.0, 13.0, 14.0, 21.0, 22.0, 25.0, 25.0, 29.0, 33.0, 46.0, 39.0, 49.0, 36.0, 40.0, 42.0, 46.0, 26.0, 52.0, 63.0, 37.0, 35.0, 31.0, 21.0, 20.0, 24.0, 39.0, 16.0, 13.0, 25.0, 9.0, 16.0, 12.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.835906982421875, -2.73040771484375, -2.624908447265625, -2.5194091796875, -2.413909912109375, -2.30841064453125, -2.202911376953125, -2.097412109375, -1.991912841796875, -1.88641357421875, -1.780914306640625, -1.6754150390625, -1.569915771484375, -1.46441650390625, -1.358917236328125, -1.25341796875, -1.147918701171875, -1.04241943359375, -0.936920166015625, -0.8314208984375, -0.725921630859375, -0.62042236328125, -0.514923095703125, -0.409423828125, -0.303924560546875, -0.19842529296875, -0.092926025390625, 0.0125732421875, 0.118072509765625, 0.22357177734375, 0.329071044921875, 0.4345703125, 0.540069580078125, 0.64556884765625, 0.751068115234375, 0.8565673828125, 0.962066650390625, 1.06756591796875, 1.173065185546875, 1.278564453125, 1.384063720703125, 1.48956298828125, 1.595062255859375, 1.7005615234375, 1.806060791015625, 1.91156005859375, 2.017059326171875, 2.12255859375, 2.228057861328125, 2.33355712890625, 2.439056396484375, 2.5445556640625, 2.650054931640625, 2.75555419921875, 2.861053466796875, 2.966552734375, 3.072052001953125, 3.17755126953125, 3.283050537109375, 3.3885498046875, 3.494049072265625, 3.59954833984375, 3.705047607421875, 3.810546875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 20.0, 13.0, 29.0, 70.0, 156.0, 308.0, 610.0, 1424.0, 3555.0, 11157.0, 76747.0, 815142.0, 118219.0, 14017.0, 4024.0, 1623.0, 756.0, 309.0, 157.0, 87.0, 46.0, 24.0, 11.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.44921875, -4.32415771484375, -4.1990966796875, -4.07403564453125, -3.948974609375, -3.82391357421875, -3.6988525390625, -3.57379150390625, -3.44873046875, -3.32366943359375, -3.1986083984375, -3.07354736328125, -2.948486328125, -2.82342529296875, -2.6983642578125, -2.57330322265625, -2.4482421875, -2.32318115234375, -2.1981201171875, -2.07305908203125, -1.947998046875, -1.82293701171875, -1.6978759765625, -1.57281494140625, -1.44775390625, -1.32269287109375, -1.1976318359375, -1.07257080078125, -0.947509765625, -0.82244873046875, -0.6973876953125, -0.57232666015625, -0.447265625, -0.32220458984375, -0.1971435546875, -0.07208251953125, 0.052978515625, 0.17803955078125, 0.3031005859375, 0.42816162109375, 0.55322265625, 0.67828369140625, 0.8033447265625, 0.92840576171875, 1.053466796875, 1.17852783203125, 1.3035888671875, 1.42864990234375, 1.5537109375, 1.67877197265625, 1.8038330078125, 1.92889404296875, 2.053955078125, 2.17901611328125, 2.3040771484375, 2.42913818359375, 2.55419921875, 2.67926025390625, 2.8043212890625, 2.92938232421875, 3.054443359375, 3.17950439453125, 3.3045654296875, 3.42962646484375, 3.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 10.0, 9.0, 11.0, 17.0, 11.0, 16.0, 15.0, 26.0, 21.0, 24.0, 33.0, 24.0, 35.0, 38.0, 25.0, 37.0, 47.0, 1066.0, 34.0, 41.0, 46.0, 45.0, 44.0, 35.0, 31.0, 35.0, 33.0, 25.0, 34.0, 13.0, 18.0, 16.0, 22.0, 10.0, 5.0, 12.0, 7.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.44921875, -2.370208740234375, -2.29119873046875, -2.212188720703125, -2.1331787109375, -2.054168701171875, -1.97515869140625, -1.896148681640625, -1.817138671875, -1.738128662109375, -1.65911865234375, -1.580108642578125, -1.5010986328125, -1.422088623046875, -1.34307861328125, -1.264068603515625, -1.18505859375, -1.106048583984375, -1.02703857421875, -0.948028564453125, -0.8690185546875, -0.790008544921875, -0.71099853515625, -0.631988525390625, -0.552978515625, -0.473968505859375, -0.39495849609375, -0.315948486328125, -0.2369384765625, -0.157928466796875, -0.07891845703125, 9.1552734375e-05, 0.0791015625, 0.158111572265625, 0.23712158203125, 0.316131591796875, 0.3951416015625, 0.474151611328125, 0.55316162109375, 0.632171630859375, 0.711181640625, 0.790191650390625, 0.86920166015625, 0.948211669921875, 1.0272216796875, 1.106231689453125, 1.18524169921875, 1.264251708984375, 1.34326171875, 1.422271728515625, 1.50128173828125, 1.580291748046875, 1.6593017578125, 1.738311767578125, 1.81732177734375, 1.896331787109375, 1.975341796875, 2.054351806640625, 2.13336181640625, 2.212371826171875, 2.2913818359375, 2.370391845703125, 2.44940185546875, 2.528411865234375, 2.607421875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 3.0, 6.0, 5.0, 17.0, 33.0, 48.0, 56.0, 103.0, 131.0, 244.0, 379.0, 569.0, 999.0, 1877.0, 3985.0, 12042.0, 74235.0, 1792372.0, 180284.0, 18799.0, 5510.0, 2288.0, 1223.0, 754.0, 432.0, 248.0, 177.0, 102.0, 71.0, 41.0, 31.0, 20.0, 7.0, 10.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.505859375, -2.4374847412109375, -2.369110107421875, -2.3007354736328125, -2.23236083984375, -2.1639862060546875, -2.095611572265625, -2.0272369384765625, -1.9588623046875, -1.8904876708984375, -1.822113037109375, -1.7537384033203125, -1.68536376953125, -1.6169891357421875, -1.548614501953125, -1.4802398681640625, -1.411865234375, -1.3434906005859375, -1.275115966796875, -1.2067413330078125, -1.13836669921875, -1.0699920654296875, -1.001617431640625, -0.9332427978515625, -0.8648681640625, -0.7964935302734375, -0.728118896484375, -0.6597442626953125, -0.59136962890625, -0.5229949951171875, -0.454620361328125, -0.3862457275390625, -0.31787109375, -0.2494964599609375, -0.181121826171875, -0.1127471923828125, -0.04437255859375, 0.0240020751953125, 0.092376708984375, 0.1607513427734375, 0.2291259765625, 0.2975006103515625, 0.365875244140625, 0.4342498779296875, 0.50262451171875, 0.5709991455078125, 0.639373779296875, 0.7077484130859375, 0.776123046875, 0.8444976806640625, 0.912872314453125, 0.9812469482421875, 1.04962158203125, 1.1179962158203125, 1.186370849609375, 1.2547454833984375, 1.3231201171875, 1.3914947509765625, 1.459869384765625, 1.5282440185546875, 1.59661865234375, 1.6649932861328125, 1.733367919921875, 1.8017425537109375, 1.8701171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 30.0, 37.0, 77.0, 94.0, 207.0, 206.0, 137.0, 72.0, 55.0, 19.0, 25.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4054222106933594, -0.39238739013671875, -0.3793525695800781, -0.3663177490234375, -0.3532829284667969, -0.34024810791015625, -0.3272132873535156, -0.314178466796875, -0.3011436462402344, -0.28810882568359375, -0.2750740051269531, -0.2620391845703125, -0.24900436401367188, -0.23596954345703125, -0.22293472290039062, -0.20989990234375, -0.19686508178710938, -0.18383026123046875, -0.17079544067382812, -0.1577606201171875, -0.14472579956054688, -0.13169097900390625, -0.11865615844726562, -0.105621337890625, -0.09258651733398438, -0.07955169677734375, -0.06651687622070312, -0.0534820556640625, -0.040447235107421875, -0.02741241455078125, -0.014377593994140625, -0.0013427734375, 0.011692047119140625, 0.02472686767578125, 0.037761688232421875, 0.0507965087890625, 0.06383132934570312, 0.07686614990234375, 0.08990097045898438, 0.102935791015625, 0.11597061157226562, 0.12900543212890625, 0.14204025268554688, 0.1550750732421875, 0.16810989379882812, 0.18114471435546875, 0.19417953491210938, 0.20721435546875, 0.22024917602539062, 0.23328399658203125, 0.24631881713867188, 0.2593536376953125, 0.2723884582519531, 0.28542327880859375, 0.2984580993652344, 0.311492919921875, 0.3245277404785156, 0.33756256103515625, 0.3505973815917969, 0.3636322021484375, 0.3766670227050781, 0.38970184326171875, 0.4027366638183594, 0.415771484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 27.0, 36.0, 85.0, 170.0, 1145.0, 226177.0, 819212.0, 1348.0, 162.0, 67.0, 45.0, 21.0, 9.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.62060546875, -8.3427734375, -8.06494140625, -7.787109375, -7.50927734375, -7.2314453125, -6.95361328125, -6.67578125, -6.39794921875, -6.1201171875, -5.84228515625, -5.564453125, -5.28662109375, -5.0087890625, -4.73095703125, -4.453125, -4.17529296875, -3.8974609375, -3.61962890625, -3.341796875, -3.06396484375, -2.7861328125, -2.50830078125, -2.23046875, -1.95263671875, -1.6748046875, -1.39697265625, -1.119140625, -0.84130859375, -0.5634765625, -0.28564453125, -0.0078125, 0.27001953125, 0.5478515625, 0.82568359375, 1.103515625, 1.38134765625, 1.6591796875, 1.93701171875, 2.21484375, 2.49267578125, 2.7705078125, 3.04833984375, 3.326171875, 3.60400390625, 3.8818359375, 4.15966796875, 4.4375, 4.71533203125, 4.9931640625, 5.27099609375, 5.548828125, 5.82666015625, 6.1044921875, 6.38232421875, 6.66015625, 6.93798828125, 7.2158203125, 7.49365234375, 7.771484375, 8.04931640625, 8.3271484375, 8.60498046875, 8.8828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 22.0, 28.0, 23.0, 52.0, 79.0, 121.0, 136.0, 161.0, 99.0, 82.0, 54.0, 41.0, 26.0, 22.0, 14.0, 14.0, 8.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18939897418022156, -0.1777198165655136, -0.16604065895080566, -0.1543615162372589, -0.14268234372138977, -0.13100320100784302, -0.11932404339313507, -0.10764488577842712, -0.09596572816371918, -0.08428657054901123, -0.07260741293430328, -0.060928262770175934, -0.04924910515546799, -0.03756994754076004, -0.02589079737663269, -0.014211639761924744, -0.002532482147216797, 0.009146673604846, 0.020825829356908798, 0.03250498324632645, 0.04418414086103439, 0.05586329847574234, 0.06754244863986969, 0.07922160625457764, 0.09090076386928558, 0.10257992148399353, 0.11425907909870148, 0.12593823671340942, 0.13761737942695618, 0.14929655194282532, 0.16097569465637207, 0.17265485227108002, 0.18433398008346558, 0.19601313769817352, 0.20769229531288147, 0.21937143802642822, 0.23105061054229736, 0.24272975325584412, 0.25440889596939087, 0.26608806848526, 0.27776724100112915, 0.2894463837146759, 0.30112555623054504, 0.3128046989440918, 0.32448387145996094, 0.3361630141735077, 0.34784215688705444, 0.3595213294029236, 0.37120047211647034, 0.3828796148300171, 0.39455878734588623, 0.406237930059433, 0.4179171025753021, 0.4295962452888489, 0.441275417804718, 0.45295456051826477, 0.4646337032318115, 0.4763128459453583, 0.4879920184612274, 0.49967116117477417, 0.5113503336906433, 0.5230295062065125, 0.5347086191177368, 0.546387791633606, 0.5580669641494751]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 4.0, 14.0, 16.0, 18.0, 16.0, 22.0, 30.0, 17.0, 28.0, 29.0, 29.0, 31.0, 40.0, 38.0, 39.0, 39.0, 44.0, 44.0, 34.0, 37.0, 31.0, 35.0, 29.0, 28.0, 38.0, 34.0, 21.0, 21.0, 21.0, 18.0, 19.0, 14.0, 14.0, 15.0, 11.0, 7.0, 12.0, 5.0, 2.0, 1.0, 4.0, 9.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.17023152112960815, -0.16418780386447906, -0.15814407169818878, -0.1521003544330597, -0.1460566222667694, -0.14001290500164032, -0.13396918773651123, -0.12792545557022095, -0.12188173830509186, -0.11583801358938217, -0.10979428887367249, -0.1037505716085434, -0.09770684689283371, -0.09166312217712402, -0.08561940491199493, -0.07957568019628525, -0.07353195548057556, -0.06748823076486588, -0.06144450977444649, -0.0554007887840271, -0.04935706406831741, -0.04331333935260773, -0.03726961836218834, -0.03122589737176895, -0.025182172656059265, -0.019138449802994728, -0.013094726949930191, -0.007051004096865654, -0.001007281243801117, 0.00503644160926342, 0.011080164462327957, 0.017123885452747345, 0.02316761016845703, 0.02921133302152157, 0.035255055874586105, 0.04129877686500549, 0.04734250158071518, 0.053386226296424866, 0.059429947286844254, 0.06547366827726364, 0.07151739299297333, 0.07756111770868301, 0.0836048424243927, 0.08964855968952179, 0.09569228440523148, 0.10173600912094116, 0.10777972638607025, 0.11382345110177994, 0.11986717581748962, 0.1259108930826187, 0.131954625248909, 0.13799834251403809, 0.14404207468032837, 0.15008579194545746, 0.15612950921058655, 0.16217324137687683, 0.16821695864200592, 0.174260675907135, 0.1803044080734253, 0.18634812533855438, 0.19239184260368347, 0.19843557476997375, 0.20447929203510284, 0.21052300930023193, 0.21656674146652222]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 5.0, 7.0, 11.0, 10.0, 20.0, 20.0, 16.0, 22.0, 27.0, 29.0, 28.0, 34.0, 44.0, 32.0, 39.0, 40.0, 36.0, 35.0, 43.0, 43.0, 48.0, 46.0, 35.0, 33.0, 35.0, 29.0, 34.0, 30.0, 20.0, 10.0, 25.0, 21.0, 15.0, 18.0, 9.0, 8.0, 5.0, 6.0, 2.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.061492919921875, -2.96087646484375, -2.860260009765625, -2.7596435546875, -2.659027099609375, -2.55841064453125, -2.457794189453125, -2.357177734375, -2.256561279296875, -2.15594482421875, -2.055328369140625, -1.9547119140625, -1.854095458984375, -1.75347900390625, -1.652862548828125, -1.55224609375, -1.451629638671875, -1.35101318359375, -1.250396728515625, -1.1497802734375, -1.049163818359375, -0.94854736328125, -0.847930908203125, -0.747314453125, -0.646697998046875, -0.54608154296875, -0.445465087890625, -0.3448486328125, -0.244232177734375, -0.14361572265625, -0.042999267578125, 0.0576171875, 0.158233642578125, 0.25885009765625, 0.359466552734375, 0.4600830078125, 0.560699462890625, 0.66131591796875, 0.761932373046875, 0.862548828125, 0.963165283203125, 1.06378173828125, 1.164398193359375, 1.2650146484375, 1.365631103515625, 1.46624755859375, 1.566864013671875, 1.66748046875, 1.768096923828125, 1.86871337890625, 1.969329833984375, 2.0699462890625, 2.170562744140625, 2.27117919921875, 2.371795654296875, 2.472412109375, 2.573028564453125, 2.67364501953125, 2.774261474609375, 2.8748779296875, 2.975494384765625, 3.07611083984375, 3.176727294921875, 3.27734375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 11.0, 15.0, 25.0, 42.0, 59.0, 87.0, 157.0, 204.0, 301.0, 446.0, 727.0, 1149.0, 1844.0, 2985.0, 4821.0, 8380.0, 14807.0, 28000.0, 58374.0, 166206.0, 493608.0, 150768.0, 54672.0, 26346.0, 14061.0, 7995.0, 4713.0, 2917.0, 1746.0, 1043.0, 730.0, 451.0, 283.0, 202.0, 118.0, 98.0, 47.0, 31.0, 18.0, 16.0, 16.0, 13.0, 12.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.18878173828125, -5.0064697265625, -4.82415771484375, -4.641845703125, -4.45953369140625, -4.2772216796875, -4.09490966796875, -3.91259765625, -3.73028564453125, -3.5479736328125, -3.36566162109375, -3.183349609375, -3.00103759765625, -2.8187255859375, -2.63641357421875, -2.4541015625, -2.27178955078125, -2.0894775390625, -1.90716552734375, -1.724853515625, -1.54254150390625, -1.3602294921875, -1.17791748046875, -0.99560546875, -0.81329345703125, -0.6309814453125, -0.44866943359375, -0.266357421875, -0.08404541015625, 0.0982666015625, 0.28057861328125, 0.462890625, 0.64520263671875, 0.8275146484375, 1.00982666015625, 1.192138671875, 1.37445068359375, 1.5567626953125, 1.73907470703125, 1.92138671875, 2.10369873046875, 2.2860107421875, 2.46832275390625, 2.650634765625, 2.83294677734375, 3.0152587890625, 3.19757080078125, 3.3798828125, 3.56219482421875, 3.7445068359375, 3.92681884765625, 4.109130859375, 4.29144287109375, 4.4737548828125, 4.65606689453125, 4.83837890625, 5.02069091796875, 5.2030029296875, 5.38531494140625, 5.567626953125, 5.74993896484375, 5.9322509765625, 6.11456298828125, 6.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 4.0, 4.0, 4.0, 10.0, 7.0, 16.0, 17.0, 16.0, 17.0, 19.0, 29.0, 29.0, 33.0, 39.0, 45.0, 52.0, 48.0, 84.0, 131.0, 241.0, 1467.0, 196.0, 94.0, 68.0, 60.0, 38.0, 39.0, 28.0, 31.0, 27.0, 29.0, 20.0, 11.0, 11.0, 13.0, 13.0, 10.0, 9.0, 5.0, 8.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.1171875, -9.8043212890625, -9.491455078125, -9.1785888671875, -8.86572265625, -8.5528564453125, -8.239990234375, -7.9271240234375, -7.6142578125, -7.3013916015625, -6.988525390625, -6.6756591796875, -6.36279296875, -6.0499267578125, -5.737060546875, -5.4241943359375, -5.111328125, -4.7984619140625, -4.485595703125, -4.1727294921875, -3.85986328125, -3.5469970703125, -3.234130859375, -2.9212646484375, -2.6083984375, -2.2955322265625, -1.982666015625, -1.6697998046875, -1.35693359375, -1.0440673828125, -0.731201171875, -0.4183349609375, -0.10546875, 0.2073974609375, 0.520263671875, 0.8331298828125, 1.14599609375, 1.4588623046875, 1.771728515625, 2.0845947265625, 2.3974609375, 2.7103271484375, 3.023193359375, 3.3360595703125, 3.64892578125, 3.9617919921875, 4.274658203125, 4.5875244140625, 4.900390625, 5.2132568359375, 5.526123046875, 5.8389892578125, 6.15185546875, 6.4647216796875, 6.777587890625, 7.0904541015625, 7.4033203125, 7.7161865234375, 8.029052734375, 8.3419189453125, 8.65478515625, 8.9676513671875, 9.280517578125, 9.5933837890625, 9.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 10.0, 23.0, 13.0, 32.0, 36.0, 41.0, 75.0, 125.0, 184.0, 313.0, 862.0, 4628.0, 59142.0, 2921844.0, 148044.0, 7972.0, 1324.0, 381.0, 209.0, 125.0, 82.0, 70.0, 45.0, 30.0, 25.0, 14.0, 12.0, 11.0, 10.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.63818359375, -17.7763671875, -16.91455078125, -16.052734375, -15.19091796875, -14.3291015625, -13.46728515625, -12.60546875, -11.74365234375, -10.8818359375, -10.02001953125, -9.158203125, -8.29638671875, -7.4345703125, -6.57275390625, -5.7109375, -4.84912109375, -3.9873046875, -3.12548828125, -2.263671875, -1.40185546875, -0.5400390625, 0.32177734375, 1.18359375, 2.04541015625, 2.9072265625, 3.76904296875, 4.630859375, 5.49267578125, 6.3544921875, 7.21630859375, 8.078125, 8.93994140625, 9.8017578125, 10.66357421875, 11.525390625, 12.38720703125, 13.2490234375, 14.11083984375, 14.97265625, 15.83447265625, 16.6962890625, 17.55810546875, 18.419921875, 19.28173828125, 20.1435546875, 21.00537109375, 21.8671875, 22.72900390625, 23.5908203125, 24.45263671875, 25.314453125, 26.17626953125, 27.0380859375, 27.89990234375, 28.76171875, 29.62353515625, 30.4853515625, 31.34716796875, 32.208984375, 33.07080078125, 33.9326171875, 34.79443359375, 35.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 200.0, 716.0, 91.0, 0.0, 2.0], "bins": [-305.0229797363281, -299.96630859375, -294.90960693359375, -289.8529357910156, -284.7962646484375, -279.73956298828125, -274.6828918457031, -269.626220703125, -264.56951904296875, -259.5128479003906, -254.45616149902344, -249.39947509765625, -244.34278869628906, -239.28610229492188, -234.22943115234375, -229.17274475097656, -224.11605834960938, -219.0593719482422, -214.00270080566406, -208.94601440429688, -203.8893280029297, -198.8326416015625, -193.77597045898438, -188.7192840576172, -183.66261291503906, -178.60592651367188, -173.54925537109375, -168.49256896972656, -163.43588256835938, -158.3791961669922, -153.32252502441406, -148.26583862304688, -143.2091522216797, -138.1524658203125, -133.09579467773438, -128.0391082763672, -122.982421875, -117.92574310302734, -112.86906433105469, -107.8123779296875, -102.75569152832031, -97.69901275634766, -92.64232635498047, -87.58564758300781, -82.52896118164062, -77.47228240966797, -72.41560363769531, -67.35891723632812, -62.30223846435547, -57.24555587768555, -52.188873291015625, -47.13219451904297, -42.07550811767578, -37.018829345703125, -31.962146759033203, -26.90546417236328, -21.84878158569336, -16.792098999023438, -11.735417366027832, -6.678735733032227, -1.6220531463623047, 3.434629440307617, 8.491310119628906, 13.547992706298828, 18.60467529296875]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 11.0, 13.0, 11.0, 8.0, 14.0, 18.0, 18.0, 14.0, 29.0, 28.0, 30.0, 38.0, 39.0, 43.0, 52.0, 47.0, 46.0, 42.0, 48.0, 38.0, 42.0, 34.0, 42.0, 38.0, 32.0, 38.0, 31.0, 25.0, 15.0, 25.0, 20.0, 17.0, 18.0, 8.0, 6.0, 6.0, 8.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.94982147216797, -27.997146606445312, -27.04447364807129, -26.091798782348633, -25.139123916625977, -24.186450958251953, -23.233776092529297, -22.28110122680664, -21.328428268432617, -20.37575340270996, -19.423080444335938, -18.47040557861328, -17.517730712890625, -16.5650577545166, -15.612382888793945, -14.659708976745605, -13.70703411102295, -12.75436019897461, -11.801685333251953, -10.849011421203613, -9.896337509155273, -8.943662643432617, -7.990988731384277, -7.0383148193359375, -6.0856404304504395, -5.132966041564941, -4.180292129516602, -3.2276177406311035, -2.2749435901641846, -1.3222694396972656, -0.3695950508117676, 0.5830788612365723, 1.5357532501220703, 2.4884274005889893, 3.441101551055908, 4.393775939941406, 5.346449851989746, 6.299124240875244, 7.251798629760742, 8.204472541809082, 9.157146453857422, 10.109820365905762, 11.062495231628418, 12.015169143676758, 12.967843055725098, 13.920516967773438, 14.873191833496094, 15.825865745544434, 16.778541564941406, 17.731216430664062, 18.683889389038086, 19.636564254760742, 20.5892391204834, 21.541912078857422, 22.494586944580078, 23.447261810302734, 24.399934768676758, 25.352609634399414, 26.305282592773438, 27.257957458496094, 28.21063232421875, 29.163305282592773, 30.11598014831543, 31.068653106689453, 32.02132797241211]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 13.0, 7.0, 9.0, 14.0, 18.0, 21.0, 16.0, 25.0, 39.0, 43.0, 25.0, 45.0, 42.0, 37.0, 52.0, 39.0, 65.0, 50.0, 43.0, 48.0, 38.0, 40.0, 33.0, 31.0, 27.0, 26.0, 24.0, 17.0, 28.0, 17.0, 10.0, 16.0, 3.0, 7.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.2890625, -4.16485595703125, -4.0406494140625, -3.91644287109375, -3.792236328125, -3.66802978515625, -3.5438232421875, -3.41961669921875, -3.29541015625, -3.17120361328125, -3.0469970703125, -2.92279052734375, -2.798583984375, -2.67437744140625, -2.5501708984375, -2.42596435546875, -2.3017578125, -2.17755126953125, -2.0533447265625, -1.92913818359375, -1.804931640625, -1.68072509765625, -1.5565185546875, -1.43231201171875, -1.30810546875, -1.18389892578125, -1.0596923828125, -0.93548583984375, -0.811279296875, -0.68707275390625, -0.5628662109375, -0.43865966796875, -0.314453125, -0.19024658203125, -0.0660400390625, 0.05816650390625, 0.182373046875, 0.30657958984375, 0.4307861328125, 0.55499267578125, 0.67919921875, 0.80340576171875, 0.9276123046875, 1.05181884765625, 1.176025390625, 1.30023193359375, 1.4244384765625, 1.54864501953125, 1.6728515625, 1.79705810546875, 1.9212646484375, 2.04547119140625, 2.169677734375, 2.29388427734375, 2.4180908203125, 2.54229736328125, 2.66650390625, 2.79071044921875, 2.9149169921875, 3.03912353515625, 3.163330078125, 3.28753662109375, 3.4117431640625, 3.53594970703125, 3.66015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 11.0, 15.0, 16.0, 26.0, 26.0, 40.0, 65.0, 111.0, 145.0, 224.0, 346.0, 637.0, 1069.0, 1867.0, 3475.0, 6897.0, 15332.0, 39470.0, 173760.0, 1586846.0, 2057125.0, 227335.0, 45902.0, 16956.0, 7757.0, 3805.0, 2019.0, 1164.0, 678.0, 410.0, 255.0, 170.0, 100.0, 60.0, 47.0, 33.0, 24.0, 16.0, 14.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-8.8125, -8.56817626953125, -8.3238525390625, -8.07952880859375, -7.835205078125, -7.59088134765625, -7.3465576171875, -7.10223388671875, -6.85791015625, -6.61358642578125, -6.3692626953125, -6.12493896484375, -5.880615234375, -5.63629150390625, -5.3919677734375, -5.14764404296875, -4.9033203125, -4.65899658203125, -4.4146728515625, -4.17034912109375, -3.926025390625, -3.68170166015625, -3.4373779296875, -3.19305419921875, -2.94873046875, -2.70440673828125, -2.4600830078125, -2.21575927734375, -1.971435546875, -1.72711181640625, -1.4827880859375, -1.23846435546875, -0.994140625, -0.74981689453125, -0.5054931640625, -0.26116943359375, -0.016845703125, 0.22747802734375, 0.4718017578125, 0.71612548828125, 0.96044921875, 1.20477294921875, 1.4490966796875, 1.69342041015625, 1.937744140625, 2.18206787109375, 2.4263916015625, 2.67071533203125, 2.9150390625, 3.15936279296875, 3.4036865234375, 3.64801025390625, 3.892333984375, 4.13665771484375, 4.3809814453125, 4.62530517578125, 4.86962890625, 5.11395263671875, 5.3582763671875, 5.60260009765625, 5.846923828125, 6.09124755859375, 6.3355712890625, 6.57989501953125, 6.82421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 9.0, 6.0, 12.0, 14.0, 23.0, 34.0, 34.0, 39.0, 47.0, 75.0, 83.0, 139.0, 251.0, 398.0, 590.0, 774.0, 524.0, 347.0, 201.0, 123.0, 79.0, 84.0, 38.0, 31.0, 32.0, 20.0, 15.0, 11.0, 3.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.6162109375, -7.373046875, -7.1298828125, -6.88671875, -6.6435546875, -6.400390625, -6.1572265625, -5.9140625, -5.6708984375, -5.427734375, -5.1845703125, -4.94140625, -4.6982421875, -4.455078125, -4.2119140625, -3.96875, -3.7255859375, -3.482421875, -3.2392578125, -2.99609375, -2.7529296875, -2.509765625, -2.2666015625, -2.0234375, -1.7802734375, -1.537109375, -1.2939453125, -1.05078125, -0.8076171875, -0.564453125, -0.3212890625, -0.078125, 0.1650390625, 0.408203125, 0.6513671875, 0.89453125, 1.1376953125, 1.380859375, 1.6240234375, 1.8671875, 2.1103515625, 2.353515625, 2.5966796875, 2.83984375, 3.0830078125, 3.326171875, 3.5693359375, 3.8125, 4.0556640625, 4.298828125, 4.5419921875, 4.78515625, 5.0283203125, 5.271484375, 5.5146484375, 5.7578125, 6.0009765625, 6.244140625, 6.4873046875, 6.73046875, 6.9736328125, 7.216796875, 7.4599609375, 7.703125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 2.0, 10.0, 16.0, 20.0, 38.0, 17.0, 31.0, 74.0, 92.0, 100.0, 227.0, 707.0, 6785.0, 465423.0, 3699645.0, 18995.0, 1284.0, 288.0, 136.0, 82.0, 63.0, 51.0, 35.0, 33.0, 28.0, 22.0, 15.0, 9.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.53125, -39.27099609375, -38.0107421875, -36.75048828125, -35.490234375, -34.22998046875, -32.9697265625, -31.70947265625, -30.44921875, -29.18896484375, -27.9287109375, -26.66845703125, -25.408203125, -24.14794921875, -22.8876953125, -21.62744140625, -20.3671875, -19.10693359375, -17.8466796875, -16.58642578125, -15.326171875, -14.06591796875, -12.8056640625, -11.54541015625, -10.28515625, -9.02490234375, -7.7646484375, -6.50439453125, -5.244140625, -3.98388671875, -2.7236328125, -1.46337890625, -0.203125, 1.05712890625, 2.3173828125, 3.57763671875, 4.837890625, 6.09814453125, 7.3583984375, 8.61865234375, 9.87890625, 11.13916015625, 12.3994140625, 13.65966796875, 14.919921875, 16.18017578125, 17.4404296875, 18.70068359375, 19.9609375, 21.22119140625, 22.4814453125, 23.74169921875, 25.001953125, 26.26220703125, 27.5224609375, 28.78271484375, 30.04296875, 31.30322265625, 32.5634765625, 33.82373046875, 35.083984375, 36.34423828125, 37.6044921875, 38.86474609375, 40.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 17.0, 17.0, 56.0, 83.0, 131.0, 173.0, 182.0, 145.0, 101.0, 53.0, 24.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.73108673095703, -54.26681137084961, -52.80253982543945, -51.33826446533203, -49.873992919921875, -48.40971755981445, -46.94544219970703, -45.481170654296875, -44.01689910888672, -42.5526237487793, -41.08835220336914, -39.62407684326172, -38.15980529785156, -36.69552993774414, -35.23125457763672, -33.76698303222656, -32.30270767211914, -30.83843421936035, -29.374160766601562, -27.90988540649414, -26.445613861083984, -24.981338500976562, -23.517065048217773, -22.052791595458984, -20.588518142700195, -19.124244689941406, -17.659971237182617, -16.195697784423828, -14.731423377990723, -13.267149925231934, -11.802875518798828, -10.338602066040039, -8.874324798583984, -7.410051345825195, -5.945777416229248, -4.481503486633301, -3.0172300338745117, -1.5529565811157227, -0.08868217468261719, 1.3755912780761719, 2.839864730834961, 4.30413818359375, 5.768412113189697, 7.2326860427856445, 8.696959495544434, 10.161232948303223, 11.625507354736328, 13.089780807495117, 14.554054260253906, 16.018327713012695, 17.482601165771484, 18.946876525878906, 20.411148071289062, 21.875423431396484, 23.339696884155273, 24.803970336914062, 26.26824378967285, 27.73251724243164, 29.19679069519043, 30.66106414794922, 32.12533950805664, 33.5896110534668, 35.05388641357422, 36.518157958984375, 37.9824333190918]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 5.0, 8.0, 20.0, 11.0, 19.0, 15.0, 17.0, 18.0, 32.0, 46.0, 41.0, 41.0, 34.0, 36.0, 37.0, 54.0, 42.0, 46.0, 40.0, 42.0, 43.0, 40.0, 32.0, 39.0, 26.0, 25.0, 21.0, 30.0, 14.0, 20.0, 19.0, 7.0, 20.0, 15.0, 6.0, 5.0, 9.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.172319412231445, -21.4759464263916, -20.77957534790039, -20.083202362060547, -19.386831283569336, -18.690458297729492, -17.99408721923828, -17.297714233398438, -16.601341247558594, -15.904969215393066, -15.208597183227539, -14.512224197387695, -13.815853118896484, -13.11948013305664, -12.423108100891113, -11.726736068725586, -11.030364990234375, -10.333992958068848, -9.63762092590332, -8.941247940063477, -8.244876861572266, -7.54850435256958, -6.8521318435668945, -6.155759811401367, -5.45938777923584, -4.7630157470703125, -4.066643714904785, -3.3702712059020996, -2.6738991737365723, -1.977527141571045, -1.2811546325683594, -0.584782600402832, 0.11159133911132812, 0.807963490486145, 1.504335641860962, 2.2007079124450684, 2.8970799446105957, 3.593451976776123, 4.289824485778809, 4.986196517944336, 5.682568550109863, 6.378940582275391, 7.075312614440918, 7.7716851234436035, 8.468057632446289, 9.1644287109375, 9.860801696777344, 10.557173728942871, 11.253545761108398, 11.949917793273926, 12.646289825439453, 13.342662811279297, 14.039033889770508, 14.735406875610352, 15.431778907775879, 16.128150939941406, 16.82452392578125, 17.520896911621094, 18.217267990112305, 18.91364097595215, 19.61001205444336, 20.306385040283203, 21.002758026123047, 21.699129104614258, 22.39550018310547]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 17.0, 6.0, 18.0, 16.0, 16.0, 28.0, 31.0, 33.0, 31.0, 34.0, 40.0, 39.0, 35.0, 39.0, 54.0, 39.0, 42.0, 36.0, 58.0, 38.0, 48.0, 33.0, 39.0, 28.0, 23.0, 28.0, 20.0, 18.0, 14.0, 11.0, 12.0, 7.0, 12.0, 6.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.23089599609375, -3.1180419921875, -3.00518798828125, -2.892333984375, -2.77947998046875, -2.6666259765625, -2.55377197265625, -2.44091796875, -2.32806396484375, -2.2152099609375, -2.10235595703125, -1.989501953125, -1.87664794921875, -1.7637939453125, -1.65093994140625, -1.5380859375, -1.42523193359375, -1.3123779296875, -1.19952392578125, -1.086669921875, -0.97381591796875, -0.8609619140625, -0.74810791015625, -0.63525390625, -0.52239990234375, -0.4095458984375, -0.29669189453125, -0.183837890625, -0.07098388671875, 0.0418701171875, 0.15472412109375, 0.267578125, 0.38043212890625, 0.4932861328125, 0.60614013671875, 0.718994140625, 0.83184814453125, 0.9447021484375, 1.05755615234375, 1.17041015625, 1.28326416015625, 1.3961181640625, 1.50897216796875, 1.621826171875, 1.73468017578125, 1.8475341796875, 1.96038818359375, 2.0732421875, 2.18609619140625, 2.2989501953125, 2.41180419921875, 2.524658203125, 2.63751220703125, 2.7503662109375, 2.86322021484375, 2.97607421875, 3.08892822265625, 3.2017822265625, 3.31463623046875, 3.427490234375, 3.54034423828125, 3.6531982421875, 3.76605224609375, 3.87890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 13.0, 13.0, 33.0, 47.0, 107.0, 213.0, 442.0, 950.0, 2286.0, 6374.0, 27335.0, 222177.0, 690795.0, 77704.0, 13288.0, 3932.0, 1534.0, 697.0, 303.0, 154.0, 68.0, 37.0, 23.0, 13.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.55487060546875, -4.4417724609375, -4.32867431640625, -4.215576171875, -4.10247802734375, -3.9893798828125, -3.87628173828125, -3.76318359375, -3.65008544921875, -3.5369873046875, -3.42388916015625, -3.310791015625, -3.19769287109375, -3.0845947265625, -2.97149658203125, -2.8583984375, -2.74530029296875, -2.6322021484375, -2.51910400390625, -2.406005859375, -2.29290771484375, -2.1798095703125, -2.06671142578125, -1.95361328125, -1.84051513671875, -1.7274169921875, -1.61431884765625, -1.501220703125, -1.38812255859375, -1.2750244140625, -1.16192626953125, -1.048828125, -0.93572998046875, -0.8226318359375, -0.70953369140625, -0.596435546875, -0.48333740234375, -0.3702392578125, -0.25714111328125, -0.14404296875, -0.03094482421875, 0.0821533203125, 0.19525146484375, 0.308349609375, 0.42144775390625, 0.5345458984375, 0.64764404296875, 0.7607421875, 0.87384033203125, 0.9869384765625, 1.10003662109375, 1.213134765625, 1.32623291015625, 1.4393310546875, 1.55242919921875, 1.66552734375, 1.77862548828125, 1.8917236328125, 2.00482177734375, 2.117919921875, 2.23101806640625, 2.3441162109375, 2.45721435546875, 2.5703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 10.0, 17.0, 9.0, 12.0, 12.0, 16.0, 29.0, 22.0, 26.0, 28.0, 28.0, 26.0, 40.0, 44.0, 36.0, 49.0, 35.0, 31.0, 1063.0, 44.0, 32.0, 33.0, 37.0, 33.0, 27.0, 31.0, 29.0, 27.0, 21.0, 31.0, 20.0, 12.0, 14.0, 19.0, 10.0, 4.0, 3.0, 9.0, 9.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.720703125, -2.641082763671875, -2.56146240234375, -2.481842041015625, -2.4022216796875, -2.322601318359375, -2.24298095703125, -2.163360595703125, -2.083740234375, -2.004119873046875, -1.92449951171875, -1.844879150390625, -1.7652587890625, -1.685638427734375, -1.60601806640625, -1.526397705078125, -1.44677734375, -1.367156982421875, -1.28753662109375, -1.207916259765625, -1.1282958984375, -1.048675537109375, -0.96905517578125, -0.889434814453125, -0.809814453125, -0.730194091796875, -0.65057373046875, -0.570953369140625, -0.4913330078125, -0.411712646484375, -0.33209228515625, -0.252471923828125, -0.1728515625, -0.093231201171875, -0.01361083984375, 0.066009521484375, 0.1456298828125, 0.225250244140625, 0.30487060546875, 0.384490966796875, 0.464111328125, 0.543731689453125, 0.62335205078125, 0.702972412109375, 0.7825927734375, 0.862213134765625, 0.94183349609375, 1.021453857421875, 1.10107421875, 1.180694580078125, 1.26031494140625, 1.339935302734375, 1.4195556640625, 1.499176025390625, 1.57879638671875, 1.658416748046875, 1.738037109375, 1.817657470703125, 1.89727783203125, 1.976898193359375, 2.0565185546875, 2.136138916015625, 2.21575927734375, 2.295379638671875, 2.375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 12.0, 11.0, 13.0, 17.0, 32.0, 55.0, 62.0, 81.0, 107.0, 160.0, 261.0, 394.0, 611.0, 938.0, 1681.0, 2806.0, 5719.0, 12732.0, 36895.0, 166233.0, 1503100.0, 283130.0, 50761.0, 16300.0, 6913.0, 3321.0, 1746.0, 1034.0, 676.0, 437.0, 287.0, 199.0, 124.0, 77.0, 51.0, 42.0, 28.0, 16.0, 12.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5556640625, -1.5093994140625, -1.463134765625, -1.4168701171875, -1.37060546875, -1.3243408203125, -1.278076171875, -1.2318115234375, -1.185546875, -1.1392822265625, -1.093017578125, -1.0467529296875, -1.00048828125, -0.9542236328125, -0.907958984375, -0.8616943359375, -0.8154296875, -0.7691650390625, -0.722900390625, -0.6766357421875, -0.63037109375, -0.5841064453125, -0.537841796875, -0.4915771484375, -0.4453125, -0.3990478515625, -0.352783203125, -0.3065185546875, -0.26025390625, -0.2139892578125, -0.167724609375, -0.1214599609375, -0.0751953125, -0.0289306640625, 0.017333984375, 0.0635986328125, 0.10986328125, 0.1561279296875, 0.202392578125, 0.2486572265625, 0.294921875, 0.3411865234375, 0.387451171875, 0.4337158203125, 0.47998046875, 0.5262451171875, 0.572509765625, 0.6187744140625, 0.6650390625, 0.7113037109375, 0.757568359375, 0.8038330078125, 0.85009765625, 0.8963623046875, 0.942626953125, 0.9888916015625, 1.03515625, 1.0814208984375, 1.127685546875, 1.1739501953125, 1.22021484375, 1.2664794921875, 1.312744140625, 1.3590087890625, 1.4052734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 8.0, 7.0, 3.0, 13.0, 7.0, 13.0, 15.0, 31.0, 78.0, 171.0, 311.0, 147.0, 71.0, 28.0, 25.0, 17.0, 12.0, 7.0, 3.0, 10.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5035934448242188, -0.4852142333984375, -0.46683502197265625, -0.448455810546875, -0.43007659912109375, -0.4116973876953125, -0.39331817626953125, -0.37493896484375, -0.35655975341796875, -0.3381805419921875, -0.31980133056640625, -0.301422119140625, -0.28304290771484375, -0.2646636962890625, -0.24628448486328125, -0.2279052734375, -0.20952606201171875, -0.1911468505859375, -0.17276763916015625, -0.154388427734375, -0.13600921630859375, -0.1176300048828125, -0.09925079345703125, -0.08087158203125, -0.06249237060546875, -0.0441131591796875, -0.02573394775390625, -0.007354736328125, 0.01102447509765625, 0.0294036865234375, 0.04778289794921875, 0.066162109375, 0.08454132080078125, 0.1029205322265625, 0.12129974365234375, 0.139678955078125, 0.15805816650390625, 0.1764373779296875, 0.19481658935546875, 0.21319580078125, 0.23157501220703125, 0.2499542236328125, 0.26833343505859375, 0.286712646484375, 0.30509185791015625, 0.3234710693359375, 0.34185028076171875, 0.3602294921875, 0.37860870361328125, 0.3969879150390625, 0.41536712646484375, 0.433746337890625, 0.45212554931640625, 0.4705047607421875, 0.48888397216796875, 0.50726318359375, 0.5256423950195312, 0.5440216064453125, 0.5624008178710938, 0.580780029296875, 0.5991592407226562, 0.6175384521484375, 0.6359176635742188, 0.654296875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 6.0, 20.0, 24.0, 40.0, 71.0, 183.0, 2126.0, 992771.0, 52037.0, 941.0, 128.0, 65.0, 32.0, 21.0, 16.0, 8.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.921875, -13.5225830078125, -13.123291015625, -12.7239990234375, -12.32470703125, -11.9254150390625, -11.526123046875, -11.1268310546875, -10.7275390625, -10.3282470703125, -9.928955078125, -9.5296630859375, -9.13037109375, -8.7310791015625, -8.331787109375, -7.9324951171875, -7.533203125, -7.1339111328125, -6.734619140625, -6.3353271484375, -5.93603515625, -5.5367431640625, -5.137451171875, -4.7381591796875, -4.3388671875, -3.9395751953125, -3.540283203125, -3.1409912109375, -2.74169921875, -2.3424072265625, -1.943115234375, -1.5438232421875, -1.14453125, -0.7452392578125, -0.345947265625, 0.0533447265625, 0.45263671875, 0.8519287109375, 1.251220703125, 1.6505126953125, 2.0498046875, 2.4490966796875, 2.848388671875, 3.2476806640625, 3.64697265625, 4.0462646484375, 4.445556640625, 4.8448486328125, 5.244140625, 5.6434326171875, 6.042724609375, 6.4420166015625, 6.84130859375, 7.2406005859375, 7.639892578125, 8.0391845703125, 8.4384765625, 8.8377685546875, 9.237060546875, 9.6363525390625, 10.03564453125, 10.4349365234375, 10.834228515625, 11.2335205078125, 11.6328125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 6.0, 3.0, 10.0, 23.0, 26.0, 63.0, 93.0, 157.0, 172.0, 169.0, 117.0, 66.0, 31.0, 30.0, 13.0, 10.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41232261061668396, -0.38766157627105713, -0.3630005717277527, -0.33833953738212585, -0.313678503036499, -0.2890174984931946, -0.26435646414756775, -0.2396954447031021, -0.21503442525863647, -0.19037340581417084, -0.1657123863697052, -0.14105135202407837, -0.11639033257961273, -0.0917293131351471, -0.06706827878952026, -0.042407259345054626, -0.01774623990058899, 0.006914783269166946, 0.03157580643892288, 0.056236833333969116, 0.08089785277843475, 0.10555887222290039, 0.13021990656852722, 0.15488092601299286, 0.1795419454574585, 0.20420296490192413, 0.22886398434638977, 0.2535250186920166, 0.27818602323532104, 0.3028470575809479, 0.3275080919265747, 0.35216909646987915, 0.3768301010131836, 0.4014911353588104, 0.42615213990211487, 0.4508131742477417, 0.47547417879104614, 0.5001351833343506, 0.5247962474822998, 0.5494572520256042, 0.5741182565689087, 0.5987792611122131, 0.6234403252601624, 0.6481013298034668, 0.6727623343467712, 0.6974233388900757, 0.7220844030380249, 0.7467454075813293, 0.7714064717292786, 0.796067476272583, 0.8207285404205322, 0.8453895449638367, 0.8700505495071411, 0.8947116136550903, 0.9193726181983948, 0.9440336227416992, 0.9686946868896484, 0.9933556914329529, 1.0180166959762573, 1.0426777601242065, 1.0673388242721558, 1.0919997692108154, 1.1166608333587646, 1.1413218975067139, 1.1659828424453735]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 4.0, 9.0, 6.0, 14.0, 11.0, 16.0, 15.0, 22.0, 29.0, 19.0, 32.0, 35.0, 26.0, 28.0, 35.0, 46.0, 39.0, 41.0, 36.0, 40.0, 41.0, 35.0, 41.0, 28.0, 44.0, 41.0, 36.0, 30.0, 21.0, 28.0, 19.0, 16.0, 20.0, 19.0, 14.0, 9.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.3948132395744324, -0.383027046918869, -0.37124085426330566, -0.3594546616077423, -0.34766846895217896, -0.3358822464942932, -0.32409605383872986, -0.3123098611831665, -0.30052366852760315, -0.2887374758720398, -0.27695128321647644, -0.2651650905609131, -0.25337886810302734, -0.24159269034862518, -0.22980648279190063, -0.21802029013633728, -0.20623409748077393, -0.19444790482521057, -0.18266171216964722, -0.17087550461292267, -0.15908931195735931, -0.14730311930179596, -0.1355169117450714, -0.12373071908950806, -0.1119445264339447, -0.10015833377838135, -0.0883721336722374, -0.07658593356609344, -0.06479974091053009, -0.05301354452967644, -0.041227348148822784, -0.029441148042678833, -0.01765495538711548, -0.0058687590062618256, 0.005917437374591827, 0.01770363375544548, 0.029489830136299133, 0.041276026517152786, 0.05306222289800644, 0.06484842300415039, 0.07663461565971375, 0.0884208083152771, 0.10020700842142105, 0.111993208527565, 0.12377940118312836, 0.1355655938386917, 0.14735180139541626, 0.15913799405097961, 0.17092418670654297, 0.18271037936210632, 0.19449657201766968, 0.20628277957439423, 0.21806897222995758, 0.22985516488552094, 0.24164137244224548, 0.25342756509780884, 0.2652137577533722, 0.27699995040893555, 0.2887861430644989, 0.30057233572006226, 0.312358558177948, 0.32414475083351135, 0.3359309434890747, 0.34771713614463806, 0.3595033288002014]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 14.0, 11.0, 11.0, 17.0, 20.0, 19.0, 25.0, 25.0, 24.0, 26.0, 28.0, 38.0, 35.0, 28.0, 41.0, 30.0, 51.0, 44.0, 42.0, 45.0, 29.0, 45.0, 34.0, 30.0, 47.0, 31.0, 25.0, 26.0, 14.0, 20.0, 20.0, 10.0, 10.0, 11.0, 10.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.98828125, -2.88323974609375, -2.7781982421875, -2.67315673828125, -2.568115234375, -2.46307373046875, -2.3580322265625, -2.25299072265625, -2.14794921875, -2.04290771484375, -1.9378662109375, -1.83282470703125, -1.727783203125, -1.62274169921875, -1.5177001953125, -1.41265869140625, -1.3076171875, -1.20257568359375, -1.0975341796875, -0.99249267578125, -0.887451171875, -0.78240966796875, -0.6773681640625, -0.57232666015625, -0.46728515625, -0.36224365234375, -0.2572021484375, -0.15216064453125, -0.047119140625, 0.05792236328125, 0.1629638671875, 0.26800537109375, 0.373046875, 0.47808837890625, 0.5831298828125, 0.68817138671875, 0.793212890625, 0.89825439453125, 1.0032958984375, 1.10833740234375, 1.21337890625, 1.31842041015625, 1.4234619140625, 1.52850341796875, 1.633544921875, 1.73858642578125, 1.8436279296875, 1.94866943359375, 2.0537109375, 2.15875244140625, 2.2637939453125, 2.36883544921875, 2.473876953125, 2.57891845703125, 2.6839599609375, 2.78900146484375, 2.89404296875, 2.99908447265625, 3.1041259765625, 3.20916748046875, 3.314208984375, 3.41925048828125, 3.5242919921875, 3.62933349609375, 3.734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 10.0, 22.0, 27.0, 31.0, 58.0, 85.0, 107.0, 172.0, 279.0, 407.0, 611.0, 1036.0, 1718.0, 3095.0, 5687.0, 11369.0, 26765.0, 77764.0, 433051.0, 368740.0, 69230.0, 24608.0, 10827.0, 5469.0, 2932.0, 1718.0, 964.0, 629.0, 370.0, 254.0, 162.0, 112.0, 70.0, 61.0, 31.0, 21.0, 20.0, 10.0, 4.0, 8.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.8046875, -5.64324951171875, -5.4818115234375, -5.32037353515625, -5.158935546875, -4.99749755859375, -4.8360595703125, -4.67462158203125, -4.51318359375, -4.35174560546875, -4.1903076171875, -4.02886962890625, -3.867431640625, -3.70599365234375, -3.5445556640625, -3.38311767578125, -3.2216796875, -3.06024169921875, -2.8988037109375, -2.73736572265625, -2.575927734375, -2.41448974609375, -2.2530517578125, -2.09161376953125, -1.93017578125, -1.76873779296875, -1.6072998046875, -1.44586181640625, -1.284423828125, -1.12298583984375, -0.9615478515625, -0.80010986328125, -0.638671875, -0.47723388671875, -0.3157958984375, -0.15435791015625, 0.007080078125, 0.16851806640625, 0.3299560546875, 0.49139404296875, 0.65283203125, 0.81427001953125, 0.9757080078125, 1.13714599609375, 1.298583984375, 1.46002197265625, 1.6214599609375, 1.78289794921875, 1.9443359375, 2.10577392578125, 2.2672119140625, 2.42864990234375, 2.590087890625, 2.75152587890625, 2.9129638671875, 3.07440185546875, 3.23583984375, 3.39727783203125, 3.5587158203125, 3.72015380859375, 3.881591796875, 4.04302978515625, 4.2044677734375, 4.36590576171875, 4.52734375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 21.0, 26.0, 31.0, 39.0, 39.0, 39.0, 39.0, 46.0, 63.0, 93.0, 236.0, 1624.0, 208.0, 100.0, 58.0, 47.0, 39.0, 43.0, 32.0, 34.0, 20.0, 22.0, 19.0, 16.0, 9.0, 14.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -10.9981689453125, -10.582275390625, -10.1663818359375, -9.75048828125, -9.3345947265625, -8.918701171875, -8.5028076171875, -8.0869140625, -7.6710205078125, -7.255126953125, -6.8392333984375, -6.42333984375, -6.0074462890625, -5.591552734375, -5.1756591796875, -4.759765625, -4.3438720703125, -3.927978515625, -3.5120849609375, -3.09619140625, -2.6802978515625, -2.264404296875, -1.8485107421875, -1.4326171875, -1.0167236328125, -0.600830078125, -0.1849365234375, 0.23095703125, 0.6468505859375, 1.062744140625, 1.4786376953125, 1.89453125, 2.3104248046875, 2.726318359375, 3.1422119140625, 3.55810546875, 3.9739990234375, 4.389892578125, 4.8057861328125, 5.2216796875, 5.6375732421875, 6.053466796875, 6.4693603515625, 6.88525390625, 7.3011474609375, 7.717041015625, 8.1329345703125, 8.548828125, 8.9647216796875, 9.380615234375, 9.7965087890625, 10.21240234375, 10.6282958984375, 11.044189453125, 11.4600830078125, 11.8759765625, 12.2918701171875, 12.707763671875, 13.1236572265625, 13.53955078125, 13.9554443359375, 14.371337890625, 14.7872314453125, 15.203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 11.0, 24.0, 20.0, 22.0, 22.0, 33.0, 49.0, 79.0, 102.0, 179.0, 493.0, 1866.0, 12365.0, 568579.0, 2538229.0, 19847.0, 2492.0, 607.0, 200.0, 111.0, 76.0, 56.0, 48.0, 36.0, 30.0, 24.0, 17.0, 12.0, 18.0, 7.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.779052734375, -26.96435546875, -26.149658203125, -25.3349609375, -24.520263671875, -23.70556640625, -22.890869140625, -22.076171875, -21.261474609375, -20.44677734375, -19.632080078125, -18.8173828125, -18.002685546875, -17.18798828125, -16.373291015625, -15.55859375, -14.743896484375, -13.92919921875, -13.114501953125, -12.2998046875, -11.485107421875, -10.67041015625, -9.855712890625, -9.041015625, -8.226318359375, -7.41162109375, -6.596923828125, -5.7822265625, -4.967529296875, -4.15283203125, -3.338134765625, -2.5234375, -1.708740234375, -0.89404296875, -0.079345703125, 0.7353515625, 1.550048828125, 2.36474609375, 3.179443359375, 3.994140625, 4.808837890625, 5.62353515625, 6.438232421875, 7.2529296875, 8.067626953125, 8.88232421875, 9.697021484375, 10.51171875, 11.326416015625, 12.14111328125, 12.955810546875, 13.7705078125, 14.585205078125, 15.39990234375, 16.214599609375, 17.029296875, 17.843994140625, 18.65869140625, 19.473388671875, 20.2880859375, 21.102783203125, 21.91748046875, 22.732177734375, 23.546875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [3.0, 8.0, 17.0, 51.0, 139.0, 240.0, 267.0, 175.0, 66.0, 34.0, 15.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.217764377593994, -6.045231819152832, -4.872698783874512, -3.7001659870147705, -2.5276331901550293, -1.355100154876709, -0.18256759643554688, 0.9899649620056152, 2.1624979972839355, 3.3350307941436768, 4.507563591003418, 5.680096626281738, 6.8526291847229, 8.025161743164062, 9.197694778442383, 10.370227813720703, 11.542760848999023, 12.715293884277344, 13.887826919555664, 15.060359001159668, 16.232891082763672, 17.405426025390625, 18.577957153320312, 19.750490188598633, 20.923023223876953, 22.095556259155273, 23.268089294433594, 24.440622329711914, 25.613155364990234, 26.785686492919922, 27.958219528198242, 29.130752563476562, 30.30328369140625, 31.47581672668457, 32.64834976196289, 33.82088088989258, 34.99341583251953, 36.16594696044922, 37.33848190307617, 38.51101303100586, 39.68354797363281, 40.8560791015625, 42.02861404418945, 43.20114517211914, 44.373680114746094, 45.54621124267578, 46.718746185302734, 47.89127731323242, 49.06380844116211, 50.2363395690918, 51.40887451171875, 52.58140563964844, 53.75394058227539, 54.92647171020508, 56.09900665283203, 57.27153778076172, 58.444068908691406, 59.616600036621094, 60.78913497924805, 61.961666107177734, 63.13420104980469, 64.30673217773438, 65.47926330566406, 66.65179443359375, 67.82433319091797]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 9.0, 6.0, 6.0, 8.0, 11.0, 10.0, 18.0, 18.0, 15.0, 21.0, 27.0, 36.0, 28.0, 26.0, 33.0, 36.0, 36.0, 40.0, 40.0, 38.0, 54.0, 37.0, 56.0, 31.0, 38.0, 31.0, 39.0, 25.0, 28.0, 25.0, 22.0, 32.0, 24.0, 12.0, 20.0, 10.0, 5.0, 7.0, 10.0, 11.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-39.971099853515625, -38.82118606567383, -37.67127227783203, -36.5213623046875, -35.3714485168457, -34.221534729003906, -33.07162094116211, -31.921707153320312, -30.77179527282715, -29.62188148498535, -28.471969604492188, -27.32205581665039, -26.172142028808594, -25.02223014831543, -23.872316360473633, -22.72240447998047, -21.572490692138672, -20.422576904296875, -19.27266502380371, -18.122751235961914, -16.97283935546875, -15.822925567626953, -14.673011779785156, -13.523098945617676, -12.373186111450195, -11.223273277282715, -10.073360443115234, -8.923446655273438, -7.773533821105957, -6.623620986938477, -5.473707675933838, -4.323794364929199, -3.173877716064453, -2.0239646434783936, -0.874051570892334, 0.2758615016937256, 1.4257745742797852, 2.5756874084472656, 3.7256007194519043, 4.875514030456543, 6.025426864624023, 7.175339698791504, 8.325252532958984, 9.475166320800781, 10.625079154968262, 11.774991989135742, 12.924905776977539, 14.07481861114502, 15.2247314453125, 16.374645233154297, 17.52455711364746, 18.674470901489258, 19.824382781982422, 20.97429656982422, 22.124210357666016, 23.274124145507812, 24.424036026000977, 25.573949813842773, 26.723861694335938, 27.873775482177734, 29.02368927001953, 30.173601150512695, 31.323514938354492, 32.473426818847656, 33.62334060668945]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 13.0, 8.0, 14.0, 20.0, 24.0, 17.0, 20.0, 25.0, 33.0, 34.0, 28.0, 38.0, 37.0, 30.0, 40.0, 36.0, 41.0, 40.0, 42.0, 45.0, 45.0, 40.0, 39.0, 32.0, 31.0, 28.0, 36.0, 26.0, 13.0, 15.0, 19.0, 14.0, 10.0, 7.0, 11.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.71484375, -3.595703125, -3.4765625, -3.357421875, -3.23828125, -3.119140625, -3.0, -2.880859375, -2.76171875, -2.642578125, -2.5234375, -2.404296875, -2.28515625, -2.166015625, -2.046875, -1.927734375, -1.80859375, -1.689453125, -1.5703125, -1.451171875, -1.33203125, -1.212890625, -1.09375, -0.974609375, -0.85546875, -0.736328125, -0.6171875, -0.498046875, -0.37890625, -0.259765625, -0.140625, -0.021484375, 0.09765625, 0.216796875, 0.3359375, 0.455078125, 0.57421875, 0.693359375, 0.8125, 0.931640625, 1.05078125, 1.169921875, 1.2890625, 1.408203125, 1.52734375, 1.646484375, 1.765625, 1.884765625, 2.00390625, 2.123046875, 2.2421875, 2.361328125, 2.48046875, 2.599609375, 2.71875, 2.837890625, 2.95703125, 3.076171875, 3.1953125, 3.314453125, 3.43359375, 3.552734375, 3.671875, 3.791015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 7.0, 12.0, 18.0, 30.0, 36.0, 58.0, 96.0, 149.0, 232.0, 347.0, 512.0, 887.0, 1247.0, 1871.0, 2994.0, 4831.0, 7747.0, 13456.0, 24074.0, 50770.0, 138139.0, 514330.0, 1583751.0, 1286502.0, 368674.0, 102099.0, 40680.0, 20229.0, 11446.0, 6858.0, 4240.0, 2727.0, 1823.0, 1136.0, 769.0, 505.0, 313.0, 222.0, 146.0, 85.0, 69.0, 62.0, 28.0, 14.0, 13.0, 11.0, 4.0, 8.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.90625, -4.7523193359375, -4.598388671875, -4.4444580078125, -4.29052734375, -4.1365966796875, -3.982666015625, -3.8287353515625, -3.6748046875, -3.5208740234375, -3.366943359375, -3.2130126953125, -3.05908203125, -2.9051513671875, -2.751220703125, -2.5972900390625, -2.443359375, -2.2894287109375, -2.135498046875, -1.9815673828125, -1.82763671875, -1.6737060546875, -1.519775390625, -1.3658447265625, -1.2119140625, -1.0579833984375, -0.904052734375, -0.7501220703125, -0.59619140625, -0.4422607421875, -0.288330078125, -0.1343994140625, 0.01953125, 0.1734619140625, 0.327392578125, 0.4813232421875, 0.63525390625, 0.7891845703125, 0.943115234375, 1.0970458984375, 1.2509765625, 1.4049072265625, 1.558837890625, 1.7127685546875, 1.86669921875, 2.0206298828125, 2.174560546875, 2.3284912109375, 2.482421875, 2.6363525390625, 2.790283203125, 2.9442138671875, 3.09814453125, 3.2520751953125, 3.406005859375, 3.5599365234375, 3.7138671875, 3.8677978515625, 4.021728515625, 4.1756591796875, 4.32958984375, 4.4835205078125, 4.637451171875, 4.7913818359375, 4.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 11.0, 12.0, 19.0, 25.0, 35.0, 50.0, 53.0, 80.0, 97.0, 165.0, 232.0, 387.0, 594.0, 698.0, 533.0, 365.0, 206.0, 143.0, 102.0, 77.0, 40.0, 37.0, 31.0, 20.0, 15.0, 8.0, 6.0, 3.0, 4.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3580322265625, -8.083251953125, -7.8084716796875, -7.53369140625, -7.2589111328125, -6.984130859375, -6.7093505859375, -6.4345703125, -6.1597900390625, -5.885009765625, -5.6102294921875, -5.33544921875, -5.0606689453125, -4.785888671875, -4.5111083984375, -4.236328125, -3.9615478515625, -3.686767578125, -3.4119873046875, -3.13720703125, -2.8624267578125, -2.587646484375, -2.3128662109375, -2.0380859375, -1.7633056640625, -1.488525390625, -1.2137451171875, -0.93896484375, -0.6641845703125, -0.389404296875, -0.1146240234375, 0.16015625, 0.4349365234375, 0.709716796875, 0.9844970703125, 1.25927734375, 1.5340576171875, 1.808837890625, 2.0836181640625, 2.3583984375, 2.6331787109375, 2.907958984375, 3.1827392578125, 3.45751953125, 3.7322998046875, 4.007080078125, 4.2818603515625, 4.556640625, 4.8314208984375, 5.106201171875, 5.3809814453125, 5.65576171875, 5.9305419921875, 6.205322265625, 6.4801025390625, 6.7548828125, 7.0296630859375, 7.304443359375, 7.5792236328125, 7.85400390625, 8.1287841796875, 8.403564453125, 8.6783447265625, 8.953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 4.0, 2.0, 11.0, 9.0, 19.0, 29.0, 38.0, 34.0, 83.0, 123.0, 229.0, 478.0, 1680.0, 13166.0, 797864.0, 3349702.0, 26944.0, 2529.0, 631.0, 265.0, 131.0, 88.0, 55.0, 53.0, 26.0, 24.0, 18.0, 15.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.396484375, -31.35546875, -30.314453125, -29.2734375, -28.232421875, -27.19140625, -26.150390625, -25.109375, -24.068359375, -23.02734375, -21.986328125, -20.9453125, -19.904296875, -18.86328125, -17.822265625, -16.78125, -15.740234375, -14.69921875, -13.658203125, -12.6171875, -11.576171875, -10.53515625, -9.494140625, -8.453125, -7.412109375, -6.37109375, -5.330078125, -4.2890625, -3.248046875, -2.20703125, -1.166015625, -0.125, 0.916015625, 1.95703125, 2.998046875, 4.0390625, 5.080078125, 6.12109375, 7.162109375, 8.203125, 9.244140625, 10.28515625, 11.326171875, 12.3671875, 13.408203125, 14.44921875, 15.490234375, 16.53125, 17.572265625, 18.61328125, 19.654296875, 20.6953125, 21.736328125, 22.77734375, 23.818359375, 24.859375, 25.900390625, 26.94140625, 27.982421875, 29.0234375, 30.064453125, 31.10546875, 32.146484375, 33.1875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 18.0, 80.0, 230.0, 373.0, 238.0, 44.0, 21.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.60581970214844, -123.48200225830078, -120.3581771850586, -117.23435974121094, -114.11053466796875, -110.9867172241211, -107.86289978027344, -104.73907470703125, -101.61524963378906, -98.4914321899414, -95.36760711669922, -92.24378967285156, -89.11996459960938, -85.99614715576172, -82.87232971191406, -79.74850463867188, -76.62468719482422, -73.50086975097656, -70.37704467773438, -67.25322723388672, -64.12940216064453, -61.005584716796875, -57.88176345825195, -54.75794219970703, -51.63412094116211, -48.51029968261719, -45.386478424072266, -42.262657165527344, -39.13883972167969, -36.0150146484375, -32.891197204589844, -29.767375946044922, -26.64354705810547, -23.519725799560547, -20.395904541015625, -17.272085189819336, -14.148263931274414, -11.024442672729492, -7.900623321533203, -4.776802062988281, -1.6529808044433594, 1.4708399772644043, 4.594660758972168, 7.718481063842773, 10.842302322387695, 13.966123580932617, 17.089942932128906, 20.213764190673828, 23.33758544921875, 26.461406707763672, 29.585227966308594, 32.70904541015625, 35.83287048339844, 38.956687927246094, 42.080509185791016, 45.20433044433594, 48.32815170288086, 51.45197296142578, 54.5757942199707, 57.699615478515625, 60.82343292236328, 63.94725799560547, 67.07107543945312, 70.19490051269531, 73.31871795654297]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 1.0, 8.0, 7.0, 19.0, 14.0, 17.0, 23.0, 19.0, 34.0, 19.0, 32.0, 25.0, 39.0, 43.0, 33.0, 42.0, 43.0, 33.0, 45.0, 45.0, 49.0, 43.0, 53.0, 40.0, 34.0, 29.0, 23.0, 29.0, 24.0, 21.0, 17.0, 19.0, 8.0, 8.0, 7.0, 7.0, 4.0, 6.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.01807403564453, -20.24705696105957, -19.476041793823242, -18.70502471923828, -17.934009552001953, -17.162992477416992, -16.39197540283203, -15.620959281921387, -14.849943161010742, -14.078927040100098, -13.307910919189453, -12.536893844604492, -11.765877723693848, -10.994861602783203, -10.223844528198242, -9.452828407287598, -8.681812286376953, -7.910796165466309, -7.139779567718506, -6.368762969970703, -5.597746849060059, -4.826730728149414, -4.055714130401611, -3.2846975326538086, -2.513681411743164, -1.7426650524139404, -0.9716486930847168, -0.20063233375549316, 0.5703840255737305, 1.341400384902954, 2.1124167442321777, 2.8834333419799805, 3.654449462890625, 4.4254655838012695, 5.196482181549072, 5.967498779296875, 6.7385149002075195, 7.509531021118164, 8.280548095703125, 9.05156421661377, 9.822580337524414, 10.593596458435059, 11.364612579345703, 12.135629653930664, 12.906645774841309, 13.677661895751953, 14.448678970336914, 15.219695091247559, 15.990711212158203, 16.761728286743164, 17.532743453979492, 18.303760528564453, 19.07477569580078, 19.845792770385742, 20.616809844970703, 21.38782501220703, 22.158842086791992, 22.929859161376953, 23.70087432861328, 24.471891403198242, 25.242908477783203, 26.01392364501953, 26.784940719604492, 27.555957794189453, 28.32697296142578]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 15.0, 14.0, 9.0, 27.0, 23.0, 24.0, 28.0, 24.0, 18.0, 39.0, 43.0, 41.0, 30.0, 36.0, 49.0, 52.0, 50.0, 44.0, 47.0, 35.0, 43.0, 34.0, 34.0, 26.0, 20.0, 25.0, 21.0, 18.0, 25.0, 15.0, 17.0, 14.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.666748046875, -3.55224609375, -3.437744140625, -3.3232421875, -3.208740234375, -3.09423828125, -2.979736328125, -2.865234375, -2.750732421875, -2.63623046875, -2.521728515625, -2.4072265625, -2.292724609375, -2.17822265625, -2.063720703125, -1.94921875, -1.834716796875, -1.72021484375, -1.605712890625, -1.4912109375, -1.376708984375, -1.26220703125, -1.147705078125, -1.033203125, -0.918701171875, -0.80419921875, -0.689697265625, -0.5751953125, -0.460693359375, -0.34619140625, -0.231689453125, -0.1171875, -0.002685546875, 0.11181640625, 0.226318359375, 0.3408203125, 0.455322265625, 0.56982421875, 0.684326171875, 0.798828125, 0.913330078125, 1.02783203125, 1.142333984375, 1.2568359375, 1.371337890625, 1.48583984375, 1.600341796875, 1.71484375, 1.829345703125, 1.94384765625, 2.058349609375, 2.1728515625, 2.287353515625, 2.40185546875, 2.516357421875, 2.630859375, 2.745361328125, 2.85986328125, 2.974365234375, 3.0888671875, 3.203369140625, 3.31787109375, 3.432373046875, 3.546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 12.0, 24.0, 36.0, 42.0, 45.0, 82.0, 137.0, 273.0, 338.0, 591.0, 1079.0, 2083.0, 4417.0, 10657.0, 31108.0, 147097.0, 640125.0, 157377.0, 32733.0, 10800.0, 4573.0, 2128.0, 1121.0, 634.0, 362.0, 234.0, 137.0, 86.0, 73.0, 41.0, 31.0, 21.0, 12.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.200408935546875, -3.10198974609375, -3.003570556640625, -2.9051513671875, -2.806732177734375, -2.70831298828125, -2.609893798828125, -2.511474609375, -2.413055419921875, -2.31463623046875, -2.216217041015625, -2.1177978515625, -2.019378662109375, -1.92095947265625, -1.822540283203125, -1.72412109375, -1.625701904296875, -1.52728271484375, -1.428863525390625, -1.3304443359375, -1.232025146484375, -1.13360595703125, -1.035186767578125, -0.936767578125, -0.838348388671875, -0.73992919921875, -0.641510009765625, -0.5430908203125, -0.444671630859375, -0.34625244140625, -0.247833251953125, -0.1494140625, -0.050994873046875, 0.04742431640625, 0.145843505859375, 0.2442626953125, 0.342681884765625, 0.44110107421875, 0.539520263671875, 0.637939453125, 0.736358642578125, 0.83477783203125, 0.933197021484375, 1.0316162109375, 1.130035400390625, 1.22845458984375, 1.326873779296875, 1.42529296875, 1.523712158203125, 1.62213134765625, 1.720550537109375, 1.8189697265625, 1.917388916015625, 2.01580810546875, 2.114227294921875, 2.212646484375, 2.311065673828125, 2.40948486328125, 2.507904052734375, 2.6063232421875, 2.704742431640625, 2.80316162109375, 2.901580810546875, 3.0]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 11.0, 10.0, 16.0, 13.0, 20.0, 17.0, 25.0, 21.0, 22.0, 30.0, 33.0, 24.0, 27.0, 44.0, 34.0, 39.0, 1058.0, 46.0, 54.0, 33.0, 36.0, 35.0, 39.0, 36.0, 45.0, 37.0, 25.0, 21.0, 23.0, 17.0, 24.0, 15.0, 11.0, 10.0, 10.0, 7.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.111602783203125, -2.02984619140625, -1.948089599609375, -1.8663330078125, -1.784576416015625, -1.70281982421875, -1.621063232421875, -1.539306640625, -1.457550048828125, -1.37579345703125, -1.294036865234375, -1.2122802734375, -1.130523681640625, -1.04876708984375, -0.967010498046875, -0.88525390625, -0.803497314453125, -0.72174072265625, -0.639984130859375, -0.5582275390625, -0.476470947265625, -0.39471435546875, -0.312957763671875, -0.231201171875, -0.149444580078125, -0.06768798828125, 0.014068603515625, 0.0958251953125, 0.177581787109375, 0.25933837890625, 0.341094970703125, 0.4228515625, 0.504608154296875, 0.58636474609375, 0.668121337890625, 0.7498779296875, 0.831634521484375, 0.91339111328125, 0.995147705078125, 1.076904296875, 1.158660888671875, 1.24041748046875, 1.322174072265625, 1.4039306640625, 1.485687255859375, 1.56744384765625, 1.649200439453125, 1.73095703125, 1.812713623046875, 1.89447021484375, 1.976226806640625, 2.0579833984375, 2.139739990234375, 2.22149658203125, 2.303253173828125, 2.385009765625, 2.466766357421875, 2.54852294921875, 2.630279541015625, 2.7120361328125, 2.793792724609375, 2.87554931640625, 2.957305908203125, 3.0390625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 18.0, 16.0, 27.0, 36.0, 52.0, 52.0, 84.0, 141.0, 234.0, 335.0, 525.0, 901.0, 1542.0, 2788.0, 5153.0, 10731.0, 26888.0, 103292.0, 1543672.0, 320409.0, 47713.0, 16172.0, 7414.0, 3759.0, 2083.0, 1150.0, 700.0, 413.0, 258.0, 186.0, 113.0, 86.0, 47.0, 51.0, 29.0, 11.0, 18.0, 6.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.948394775390625, -1.88702392578125, -1.825653076171875, -1.7642822265625, -1.702911376953125, -1.64154052734375, -1.580169677734375, -1.518798828125, -1.457427978515625, -1.39605712890625, -1.334686279296875, -1.2733154296875, -1.211944580078125, -1.15057373046875, -1.089202880859375, -1.02783203125, -0.966461181640625, -0.90509033203125, -0.843719482421875, -0.7823486328125, -0.720977783203125, -0.65960693359375, -0.598236083984375, -0.536865234375, -0.475494384765625, -0.41412353515625, -0.352752685546875, -0.2913818359375, -0.230010986328125, -0.16864013671875, -0.107269287109375, -0.0458984375, 0.015472412109375, 0.07684326171875, 0.138214111328125, 0.1995849609375, 0.260955810546875, 0.32232666015625, 0.383697509765625, 0.445068359375, 0.506439208984375, 0.56781005859375, 0.629180908203125, 0.6905517578125, 0.751922607421875, 0.81329345703125, 0.874664306640625, 0.93603515625, 0.997406005859375, 1.05877685546875, 1.120147705078125, 1.1815185546875, 1.242889404296875, 1.30426025390625, 1.365631103515625, 1.427001953125, 1.488372802734375, 1.54974365234375, 1.611114501953125, 1.6724853515625, 1.733856201171875, 1.79522705078125, 1.856597900390625, 1.91796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 7.0, 4.0, 14.0, 20.0, 47.0, 99.0, 277.0, 276.0, 117.0, 36.0, 23.0, 15.0, 12.0, 5.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.662109375, -0.6426773071289062, -0.6232452392578125, -0.6038131713867188, -0.584381103515625, -0.5649490356445312, -0.5455169677734375, -0.5260848999023438, -0.50665283203125, -0.48722076416015625, -0.4677886962890625, -0.44835662841796875, -0.428924560546875, -0.40949249267578125, -0.3900604248046875, -0.37062835693359375, -0.3511962890625, -0.33176422119140625, -0.3123321533203125, -0.29290008544921875, -0.273468017578125, -0.25403594970703125, -0.2346038818359375, -0.21517181396484375, -0.19573974609375, -0.17630767822265625, -0.1568756103515625, -0.13744354248046875, -0.118011474609375, -0.09857940673828125, -0.0791473388671875, -0.05971527099609375, -0.040283203125, -0.02085113525390625, -0.0014190673828125, 0.01801300048828125, 0.037445068359375, 0.05687713623046875, 0.0763092041015625, 0.09574127197265625, 0.11517333984375, 0.13460540771484375, 0.1540374755859375, 0.17346954345703125, 0.192901611328125, 0.21233367919921875, 0.2317657470703125, 0.25119781494140625, 0.2706298828125, 0.29006195068359375, 0.3094940185546875, 0.32892608642578125, 0.348358154296875, 0.36779022216796875, 0.3872222900390625, 0.40665435791015625, 0.42608642578125, 0.44551849365234375, 0.4649505615234375, 0.48438262939453125, 0.503814697265625, 0.5232467651367188, 0.5426788330078125, 0.5621109008789062, 0.58154296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 2.0, 8.0, 13.0, 10.0, 24.0, 31.0, 44.0, 143.0, 639.0, 3580.0, 875802.0, 164320.0, 3118.0, 567.0, 105.0, 44.0, 25.0, 18.0, 8.0, 6.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.03125, -10.6630859375, -10.294921875, -9.9267578125, -9.55859375, -9.1904296875, -8.822265625, -8.4541015625, -8.0859375, -7.7177734375, -7.349609375, -6.9814453125, -6.61328125, -6.2451171875, -5.876953125, -5.5087890625, -5.140625, -4.7724609375, -4.404296875, -4.0361328125, -3.66796875, -3.2998046875, -2.931640625, -2.5634765625, -2.1953125, -1.8271484375, -1.458984375, -1.0908203125, -0.72265625, -0.3544921875, 0.013671875, 0.3818359375, 0.75, 1.1181640625, 1.486328125, 1.8544921875, 2.22265625, 2.5908203125, 2.958984375, 3.3271484375, 3.6953125, 4.0634765625, 4.431640625, 4.7998046875, 5.16796875, 5.5361328125, 5.904296875, 6.2724609375, 6.640625, 7.0087890625, 7.376953125, 7.7451171875, 8.11328125, 8.4814453125, 8.849609375, 9.2177734375, 9.5859375, 9.9541015625, 10.322265625, 10.6904296875, 11.05859375, 11.4267578125, 11.794921875, 12.1630859375, 12.53125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 10.0, 13.0, 15.0, 39.0, 52.0, 111.0, 211.0, 257.0, 144.0, 61.0, 44.0, 24.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6177295446395874, -0.5797190070152283, -0.5417084693908691, -0.50369793176651, -0.4656873941421509, -0.42767685651779175, -0.3896663188934326, -0.3516557812690735, -0.31364524364471436, -0.2756347060203552, -0.2376241683959961, -0.19961363077163696, -0.16160309314727783, -0.1235925555229187, -0.08558201789855957, -0.04757148027420044, -0.009560942649841309, 0.028449594974517822, 0.06646013259887695, 0.10447067022323608, 0.14248120784759521, 0.18049174547195435, 0.21850228309631348, 0.2565128207206726, 0.29452335834503174, 0.33253389596939087, 0.37054443359375, 0.40855497121810913, 0.44656550884246826, 0.4845760464668274, 0.5225865840911865, 0.5605971217155457, 0.5986077785491943, 0.6366183161735535, 0.6746288537979126, 0.7126393914222717, 0.7506499290466309, 0.78866046667099, 0.8266710042953491, 0.8646815419197083, 0.9026920795440674, 0.9407026171684265, 0.9787131547927856, 1.0167236328125, 1.054734230041504, 1.0927448272705078, 1.1307553052902222, 1.1687657833099365, 1.2067763805389404, 1.2447869777679443, 1.2827974557876587, 1.320807933807373, 1.358818531036377, 1.3968291282653809, 1.4348396062850952, 1.4728500843048096, 1.5108606815338135, 1.5488712787628174, 1.5868817567825317, 1.624892234802246, 1.66290283203125, 1.700913429260254, 1.7389239072799683, 1.7769343852996826, 1.8149449825286865]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 8.0, 8.0, 8.0, 12.0, 19.0, 19.0, 24.0, 19.0, 20.0, 23.0, 16.0, 31.0, 40.0, 30.0, 35.0, 35.0, 33.0, 41.0, 36.0, 38.0, 35.0, 37.0, 39.0, 37.0, 33.0, 30.0, 28.0, 24.0, 28.0, 15.0, 17.0, 26.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 8.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35305070877075195, -0.3404378592967987, -0.32782498002052307, -0.3152121305465698, -0.3025992512702942, -0.28998640179634094, -0.2773735225200653, -0.26476067304611206, -0.2521477937698364, -0.23953492939472198, -0.22692206501960754, -0.2143092006444931, -0.20169633626937866, -0.18908348679542542, -0.17647060751914978, -0.16385775804519653, -0.1512448936700821, -0.13863202929496765, -0.1260191649198532, -0.11340630054473877, -0.10079343616962433, -0.08818057924509048, -0.07556771486997604, -0.0629548504948616, -0.05034198611974716, -0.03772912174463272, -0.02511625923216343, -0.012503396719694138, 0.00010946765542030334, 0.012722328305244446, 0.025335192680358887, 0.03794805705547333, 0.05056092143058777, 0.06317378580570221, 0.07578665018081665, 0.08839951455593109, 0.10101237893104553, 0.11362523585557938, 0.12623810768127441, 0.13885095715522766, 0.1514638364315033, 0.16407670080661774, 0.17668956518173218, 0.18930242955684662, 0.20191529393196106, 0.2145281434059143, 0.22714102268218994, 0.2397538721561432, 0.25236672163009644, 0.2649795711040497, 0.2775924503803253, 0.29020529985427856, 0.3028181791305542, 0.31543102860450745, 0.3280439078807831, 0.34065675735473633, 0.35326963663101196, 0.3658824861049652, 0.37849536538124084, 0.3911082148551941, 0.4037210941314697, 0.416333943605423, 0.4289468228816986, 0.44155967235565186, 0.4541725516319275]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 10.0, 19.0, 11.0, 22.0, 20.0, 18.0, 25.0, 18.0, 30.0, 31.0, 32.0, 39.0, 38.0, 43.0, 30.0, 44.0, 37.0, 40.0, 47.0, 45.0, 52.0, 46.0, 34.0, 21.0, 25.0, 26.0, 16.0, 30.0, 24.0, 18.0, 14.0, 12.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.541015625, -3.43310546875, -3.3251953125, -3.21728515625, -3.109375, -3.00146484375, -2.8935546875, -2.78564453125, -2.677734375, -2.56982421875, -2.4619140625, -2.35400390625, -2.24609375, -2.13818359375, -2.0302734375, -1.92236328125, -1.814453125, -1.70654296875, -1.5986328125, -1.49072265625, -1.3828125, -1.27490234375, -1.1669921875, -1.05908203125, -0.951171875, -0.84326171875, -0.7353515625, -0.62744140625, -0.51953125, -0.41162109375, -0.3037109375, -0.19580078125, -0.087890625, 0.02001953125, 0.1279296875, 0.23583984375, 0.34375, 0.45166015625, 0.5595703125, 0.66748046875, 0.775390625, 0.88330078125, 0.9912109375, 1.09912109375, 1.20703125, 1.31494140625, 1.4228515625, 1.53076171875, 1.638671875, 1.74658203125, 1.8544921875, 1.96240234375, 2.0703125, 2.17822265625, 2.2861328125, 2.39404296875, 2.501953125, 2.60986328125, 2.7177734375, 2.82568359375, 2.93359375, 3.04150390625, 3.1494140625, 3.25732421875, 3.365234375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 7.0, 11.0, 27.0, 34.0, 55.0, 84.0, 159.0, 205.0, 320.0, 483.0, 753.0, 1251.0, 2051.0, 3504.0, 5985.0, 10574.0, 20265.0, 45513.0, 140850.0, 456701.0, 235080.0, 66329.0, 26841.0, 13250.0, 7390.0, 4140.0, 2566.0, 1489.0, 954.0, 587.0, 354.0, 250.0, 150.0, 90.0, 67.0, 46.0, 43.0, 27.0, 9.0, 15.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.94921875, -5.7672119140625, -5.585205078125, -5.4031982421875, -5.22119140625, -5.0391845703125, -4.857177734375, -4.6751708984375, -4.4931640625, -4.3111572265625, -4.129150390625, -3.9471435546875, -3.76513671875, -3.5831298828125, -3.401123046875, -3.2191162109375, -3.037109375, -2.8551025390625, -2.673095703125, -2.4910888671875, -2.30908203125, -2.1270751953125, -1.945068359375, -1.7630615234375, -1.5810546875, -1.3990478515625, -1.217041015625, -1.0350341796875, -0.85302734375, -0.6710205078125, -0.489013671875, -0.3070068359375, -0.125, 0.0570068359375, 0.239013671875, 0.4210205078125, 0.60302734375, 0.7850341796875, 0.967041015625, 1.1490478515625, 1.3310546875, 1.5130615234375, 1.695068359375, 1.8770751953125, 2.05908203125, 2.2410888671875, 2.423095703125, 2.6051025390625, 2.787109375, 2.9691162109375, 3.151123046875, 3.3331298828125, 3.51513671875, 3.6971435546875, 3.879150390625, 4.0611572265625, 4.2431640625, 4.4251708984375, 4.607177734375, 4.7891845703125, 4.97119140625, 5.1531982421875, 5.335205078125, 5.5172119140625, 5.69921875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 12.0, 14.0, 30.0, 34.0, 35.0, 37.0, 36.0, 63.0, 52.0, 67.0, 88.0, 227.0, 1577.0, 248.0, 89.0, 63.0, 63.0, 49.0, 41.0, 35.0, 30.0, 25.0, 17.0, 23.0, 12.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8851318359375, -11.418701171875, -10.9522705078125, -10.48583984375, -10.0194091796875, -9.552978515625, -9.0865478515625, -8.6201171875, -8.1536865234375, -7.687255859375, -7.2208251953125, -6.75439453125, -6.2879638671875, -5.821533203125, -5.3551025390625, -4.888671875, -4.4222412109375, -3.955810546875, -3.4893798828125, -3.02294921875, -2.5565185546875, -2.090087890625, -1.6236572265625, -1.1572265625, -0.6907958984375, -0.224365234375, 0.2420654296875, 0.70849609375, 1.1749267578125, 1.641357421875, 2.1077880859375, 2.57421875, 3.0406494140625, 3.507080078125, 3.9735107421875, 4.43994140625, 4.9063720703125, 5.372802734375, 5.8392333984375, 6.3056640625, 6.7720947265625, 7.238525390625, 7.7049560546875, 8.17138671875, 8.6378173828125, 9.104248046875, 9.5706787109375, 10.037109375, 10.5035400390625, 10.969970703125, 11.4364013671875, 11.90283203125, 12.3692626953125, 12.835693359375, 13.3021240234375, 13.7685546875, 14.2349853515625, 14.701416015625, 15.1678466796875, 15.63427734375, 16.1007080078125, 16.567138671875, 17.0335693359375, 17.5]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 20.0, 28.0, 28.0, 42.0, 73.0, 86.0, 139.0, 263.0, 542.0, 1650.0, 6831.0, 48085.0, 2506483.0, 550360.0, 24668.0, 4179.0, 1086.0, 448.0, 197.0, 139.0, 87.0, 74.0, 51.0, 27.0, 18.0, 22.0, 9.0, 9.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.03125, -22.40625, -21.78125, -21.15625, -20.53125, -19.90625, -19.28125, -18.65625, -18.03125, -17.40625, -16.78125, -16.15625, -15.53125, -14.90625, -14.28125, -13.65625, -13.03125, -12.40625, -11.78125, -11.15625, -10.53125, -9.90625, -9.28125, -8.65625, -8.03125, -7.40625, -6.78125, -6.15625, -5.53125, -4.90625, -4.28125, -3.65625, -3.03125, -2.40625, -1.78125, -1.15625, -0.53125, 0.09375, 0.71875, 1.34375, 1.96875, 2.59375, 3.21875, 3.84375, 4.46875, 5.09375, 5.71875, 6.34375, 6.96875, 7.59375, 8.21875, 8.84375, 9.46875, 10.09375, 10.71875, 11.34375, 11.96875, 12.59375, 13.21875, 13.84375, 14.46875, 15.09375, 15.71875, 16.34375, 16.96875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 15.0, 59.0, 185.0, 314.0, 251.0, 106.0, 50.0, 14.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46574020385742, -60.84966278076172, -59.23358154296875, -57.61750411987305, -56.00142288208008, -54.385345458984375, -52.769264221191406, -51.1531867980957, -49.537105560302734, -47.92102813720703, -46.30494689941406, -44.68886947631836, -43.07278823852539, -41.45671081542969, -39.84062957763672, -38.224552154541016, -36.60847473144531, -34.99239730834961, -33.37631607055664, -31.760236740112305, -30.14415740966797, -28.528079986572266, -26.911998748779297, -25.295921325683594, -23.679840087890625, -22.06376075744629, -20.447681427001953, -18.831602096557617, -17.21552276611328, -15.599444389343262, -13.983365058898926, -12.36728572845459, -10.751205444335938, -9.135126113891602, -7.519046783447266, -5.902967929840088, -4.286888599395752, -2.670809745788574, -1.0547304153442383, 0.5613489151000977, 2.1774282455444336, 3.7935075759887695, 5.4095869064331055, 7.025665760040283, 8.641744613647461, 10.257823944091797, 11.873903274536133, 13.489982604980469, 15.106061935424805, 16.72214126586914, 18.338220596313477, 19.954299926757812, 21.57037925720215, 23.186458587646484, 24.802536010742188, 26.418617248535156, 28.03469467163086, 29.650774002075195, 31.26685333251953, 32.882930755615234, 34.4990119934082, 36.115089416503906, 37.731170654296875, 39.34724807739258, 40.96332931518555]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 6.0, 10.0, 8.0, 14.0, 11.0, 20.0, 15.0, 11.0, 13.0, 23.0, 23.0, 15.0, 25.0, 30.0, 28.0, 40.0, 37.0, 32.0, 41.0, 46.0, 39.0, 34.0, 34.0, 28.0, 33.0, 34.0, 24.0, 40.0, 29.0, 36.0, 17.0, 29.0, 15.0, 28.0, 22.0, 14.0, 18.0, 12.0, 16.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-30.805992126464844, -29.864938735961914, -28.923887252807617, -27.982833862304688, -27.04178237915039, -26.10072898864746, -25.159677505493164, -24.218624114990234, -23.277572631835938, -22.336519241333008, -21.39546775817871, -20.45441436767578, -19.513362884521484, -18.572309494018555, -17.631258010864258, -16.690204620361328, -15.749152183532715, -14.808099746704102, -13.867047309875488, -12.925994873046875, -11.984942436218262, -11.043889999389648, -10.102836608886719, -9.161785125732422, -8.220731735229492, -7.279679298400879, -6.338626861572266, -5.397574424743652, -4.456521987915039, -3.5154690742492676, -2.5744166374206543, -1.633364200592041, -0.6923122406005859, 0.24874025583267212, 1.1897927522659302, 2.130845308303833, 3.0718977451324463, 4.012950420379639, 4.954002857208252, 5.895055294036865, 6.8361077308654785, 7.777160167694092, 8.718213081359863, 9.659265518188477, 10.60031795501709, 11.541370391845703, 12.482422828674316, 13.42347526550293, 14.364527702331543, 15.305580139160156, 16.246633529663086, 17.187685012817383, 18.128738403320312, 19.06978988647461, 20.01084327697754, 20.951894760131836, 21.892948150634766, 22.834001541137695, 23.775053024291992, 24.716106414794922, 25.65715789794922, 26.59821128845215, 27.539262771606445, 28.480316162109375, 29.421367645263672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 10.0, 6.0, 8.0, 9.0, 11.0, 14.0, 15.0, 15.0, 18.0, 26.0, 29.0, 20.0, 31.0, 20.0, 37.0, 34.0, 45.0, 43.0, 51.0, 49.0, 50.0, 39.0, 37.0, 35.0, 43.0, 39.0, 27.0, 33.0, 29.0, 27.0, 26.0, 16.0, 22.0, 11.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.822265625, -3.706298828125, -3.59033203125, -3.474365234375, -3.3583984375, -3.242431640625, -3.12646484375, -3.010498046875, -2.89453125, -2.778564453125, -2.66259765625, -2.546630859375, -2.4306640625, -2.314697265625, -2.19873046875, -2.082763671875, -1.966796875, -1.850830078125, -1.73486328125, -1.618896484375, -1.5029296875, -1.386962890625, -1.27099609375, -1.155029296875, -1.0390625, -0.923095703125, -0.80712890625, -0.691162109375, -0.5751953125, -0.459228515625, -0.34326171875, -0.227294921875, -0.111328125, 0.004638671875, 0.12060546875, 0.236572265625, 0.3525390625, 0.468505859375, 0.58447265625, 0.700439453125, 0.81640625, 0.932373046875, 1.04833984375, 1.164306640625, 1.2802734375, 1.396240234375, 1.51220703125, 1.628173828125, 1.744140625, 1.860107421875, 1.97607421875, 2.092041015625, 2.2080078125, 2.323974609375, 2.43994140625, 2.555908203125, 2.671875, 2.787841796875, 2.90380859375, 3.019775390625, 3.1357421875, 3.251708984375, 3.36767578125, 3.483642578125, 3.599609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 12.0, 12.0, 21.0, 39.0, 50.0, 72.0, 96.0, 122.0, 206.0, 304.0, 416.0, 626.0, 1091.0, 1907.0, 3450.0, 7515.0, 16705.0, 43227.0, 177252.0, 1437154.0, 2130138.0, 280435.0, 55451.0, 19836.0, 8627.0, 3962.0, 2136.0, 1225.0, 726.0, 469.0, 291.0, 194.0, 148.0, 120.0, 62.0, 46.0, 36.0, 30.0, 14.0, 10.0, 9.0, 11.0, 11.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.3936767578125, -6.166259765625, -5.9388427734375, -5.71142578125, -5.4840087890625, -5.256591796875, -5.0291748046875, -4.8017578125, -4.5743408203125, -4.346923828125, -4.1195068359375, -3.89208984375, -3.6646728515625, -3.437255859375, -3.2098388671875, -2.982421875, -2.7550048828125, -2.527587890625, -2.3001708984375, -2.07275390625, -1.8453369140625, -1.617919921875, -1.3905029296875, -1.1630859375, -0.9356689453125, -0.708251953125, -0.4808349609375, -0.25341796875, -0.0260009765625, 0.201416015625, 0.4288330078125, 0.65625, 0.8836669921875, 1.111083984375, 1.3385009765625, 1.56591796875, 1.7933349609375, 2.020751953125, 2.2481689453125, 2.4755859375, 2.7030029296875, 2.930419921875, 3.1578369140625, 3.38525390625, 3.6126708984375, 3.840087890625, 4.0675048828125, 4.294921875, 4.5223388671875, 4.749755859375, 4.9771728515625, 5.20458984375, 5.4320068359375, 5.659423828125, 5.8868408203125, 6.1142578125, 6.3416748046875, 6.569091796875, 6.7965087890625, 7.02392578125, 7.2513427734375, 7.478759765625, 7.7061767578125, 7.93359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 11.0, 7.0, 7.0, 12.0, 9.0, 19.0, 24.0, 29.0, 25.0, 42.0, 58.0, 90.0, 90.0, 106.0, 163.0, 221.0, 410.0, 564.0, 614.0, 476.0, 290.0, 218.0, 156.0, 106.0, 71.0, 55.0, 46.0, 43.0, 23.0, 24.0, 11.0, 10.0, 7.0, 5.0, 3.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.84765625, -7.64752197265625, -7.4473876953125, -7.24725341796875, -7.047119140625, -6.84698486328125, -6.6468505859375, -6.44671630859375, -6.24658203125, -6.04644775390625, -5.8463134765625, -5.64617919921875, -5.446044921875, -5.24591064453125, -5.0457763671875, -4.84564208984375, -4.6455078125, -4.44537353515625, -4.2452392578125, -4.04510498046875, -3.844970703125, -3.64483642578125, -3.4447021484375, -3.24456787109375, -3.04443359375, -2.84429931640625, -2.6441650390625, -2.44403076171875, -2.243896484375, -2.04376220703125, -1.8436279296875, -1.64349365234375, -1.443359375, -1.24322509765625, -1.0430908203125, -0.84295654296875, -0.642822265625, -0.44268798828125, -0.2425537109375, -0.04241943359375, 0.15771484375, 0.35784912109375, 0.5579833984375, 0.75811767578125, 0.958251953125, 1.15838623046875, 1.3585205078125, 1.55865478515625, 1.7587890625, 1.95892333984375, 2.1590576171875, 2.35919189453125, 2.559326171875, 2.75946044921875, 2.9595947265625, 3.15972900390625, 3.35986328125, 3.55999755859375, 3.7601318359375, 3.96026611328125, 4.160400390625, 4.36053466796875, 4.5606689453125, 4.76080322265625, 4.9609375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 9.0, 12.0, 17.0, 24.0, 37.0, 50.0, 66.0, 113.0, 130.0, 249.0, 523.0, 2178.0, 15399.0, 269974.0, 3772044.0, 121885.0, 9031.0, 1373.0, 425.0, 207.0, 142.0, 108.0, 58.0, 49.0, 32.0, 27.0, 23.0, 17.0, 13.0, 8.0, 4.0, 12.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.236572265625, -17.48876953125, -16.740966796875, -15.9931640625, -15.245361328125, -14.49755859375, -13.749755859375, -13.001953125, -12.254150390625, -11.50634765625, -10.758544921875, -10.0107421875, -9.262939453125, -8.51513671875, -7.767333984375, -7.01953125, -6.271728515625, -5.52392578125, -4.776123046875, -4.0283203125, -3.280517578125, -2.53271484375, -1.784912109375, -1.037109375, -0.289306640625, 0.45849609375, 1.206298828125, 1.9541015625, 2.701904296875, 3.44970703125, 4.197509765625, 4.9453125, 5.693115234375, 6.44091796875, 7.188720703125, 7.9365234375, 8.684326171875, 9.43212890625, 10.179931640625, 10.927734375, 11.675537109375, 12.42333984375, 13.171142578125, 13.9189453125, 14.666748046875, 15.41455078125, 16.162353515625, 16.91015625, 17.657958984375, 18.40576171875, 19.153564453125, 19.9013671875, 20.649169921875, 21.39697265625, 22.144775390625, 22.892578125, 23.640380859375, 24.38818359375, 25.135986328125, 25.8837890625, 26.631591796875, 27.37939453125, 28.127197265625, 28.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 32.0, 97.0, 250.0, 348.0, 201.0, 66.0, 11.0, 6.0], "bins": [-150.67547607421875, -148.13961791992188, -145.603759765625, -143.0679168701172, -140.5320587158203, -137.99620056152344, -135.46034240722656, -132.9244842529297, -130.38864135742188, -127.852783203125, -125.31693267822266, -122.78107452392578, -120.24522399902344, -117.70936584472656, -115.17350769042969, -112.63765716552734, -110.10179138183594, -107.56593322753906, -105.03008270263672, -102.49422454833984, -99.9583740234375, -97.42251586914062, -94.88665771484375, -92.3508071899414, -89.81495666503906, -87.27909851074219, -84.74324798583984, -82.20738983154297, -79.67153930664062, -77.13568115234375, -74.59982299804688, -72.06397247314453, -69.52810668945312, -66.99224853515625, -64.4563980102539, -61.92053985595703, -59.38468551635742, -56.84883117675781, -54.3129768371582, -51.777122497558594, -49.24127197265625, -46.70541763305664, -44.16956329345703, -41.633705139160156, -39.09785079956055, -36.56199645996094, -34.02614212036133, -31.490285873413086, -28.954429626464844, -26.418575286865234, -23.882719039916992, -21.346864700317383, -18.81100845336914, -16.27515411376953, -13.739299774169922, -11.20344352722168, -8.66758918762207, -6.1317338943481445, -3.595879077911377, -1.0600242614746094, 1.4758310317993164, 4.011686325073242, 6.547540664672852, 9.083396911621094, 11.619251251220703]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 7.0, 5.0, 11.0, 13.0, 22.0, 19.0, 29.0, 30.0, 22.0, 31.0, 44.0, 43.0, 33.0, 38.0, 42.0, 44.0, 38.0, 31.0, 50.0, 47.0, 38.0, 45.0, 40.0, 27.0, 34.0, 25.0, 33.0, 21.0, 25.0, 19.0, 26.0, 12.0, 14.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.054899215698242, -26.296161651611328, -25.537424087524414, -24.7786865234375, -24.019948959350586, -23.261211395263672, -22.502471923828125, -21.74373435974121, -20.984996795654297, -20.226259231567383, -19.46752166748047, -18.708784103393555, -17.95004653930664, -17.191307067871094, -16.432571411132812, -15.673831939697266, -14.915095329284668, -14.156357765197754, -13.39762020111084, -12.63888168334961, -11.880144119262695, -11.121406555175781, -10.362668991088867, -9.603931427001953, -8.845193862915039, -8.086456298828125, -7.327718257904053, -6.568980693817139, -5.810242652893066, -5.051505088806152, -4.292767524719238, -3.534029483795166, -2.7752914428710938, -2.0165536403656006, -1.257815957069397, -0.49907827377319336, 0.2596595287322998, 1.018397331237793, 1.777134895324707, 2.5358729362487793, 3.2946105003356934, 4.053348064422607, 4.81208610534668, 5.570823669433594, 6.329561233520508, 7.08829927444458, 7.847036838531494, 8.605774879455566, 9.36451244354248, 10.123250007629395, 10.881987571716309, 11.640726089477539, 12.399463653564453, 13.158201217651367, 13.916938781738281, 14.675676345825195, 15.43441390991211, 16.193151473999023, 16.951889038085938, 17.71062660217285, 18.469364166259766, 19.228103637695312, 19.986839294433594, 20.74557876586914, 21.504316329956055]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 2.0, 6.0, 4.0, 13.0, 14.0, 11.0, 11.0, 17.0, 20.0, 20.0, 35.0, 25.0, 18.0, 34.0, 27.0, 42.0, 35.0, 47.0, 35.0, 58.0, 48.0, 38.0, 43.0, 43.0, 43.0, 31.0, 35.0, 32.0, 35.0, 23.0, 25.0, 23.0, 21.0, 15.0, 9.0, 7.0, 7.0, 8.0, 4.0, 5.0, 6.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.453125, -3.338043212890625, -3.22296142578125, -3.107879638671875, -2.9927978515625, -2.877716064453125, -2.76263427734375, -2.647552490234375, -2.532470703125, -2.417388916015625, -2.30230712890625, -2.187225341796875, -2.0721435546875, -1.957061767578125, -1.84197998046875, -1.726898193359375, -1.61181640625, -1.496734619140625, -1.38165283203125, -1.266571044921875, -1.1514892578125, -1.036407470703125, -0.92132568359375, -0.806243896484375, -0.691162109375, -0.576080322265625, -0.46099853515625, -0.345916748046875, -0.2308349609375, -0.115753173828125, -0.00067138671875, 0.114410400390625, 0.2294921875, 0.344573974609375, 0.45965576171875, 0.574737548828125, 0.6898193359375, 0.804901123046875, 0.91998291015625, 1.035064697265625, 1.150146484375, 1.265228271484375, 1.38031005859375, 1.495391845703125, 1.6104736328125, 1.725555419921875, 1.84063720703125, 1.955718994140625, 2.07080078125, 2.185882568359375, 2.30096435546875, 2.416046142578125, 2.5311279296875, 2.646209716796875, 2.76129150390625, 2.876373291015625, 2.991455078125, 3.106536865234375, 3.22161865234375, 3.336700439453125, 3.4517822265625, 3.566864013671875, 3.68194580078125, 3.797027587890625, 3.912109375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 16.0, 24.0, 28.0, 42.0, 56.0, 61.0, 101.0, 128.0, 204.0, 262.0, 306.0, 483.0, 659.0, 959.0, 1494.0, 2259.0, 4016.0, 9393.0, 41793.0, 493535.0, 435727.0, 37489.0, 8716.0, 3872.0, 2259.0, 1336.0, 967.0, 653.0, 469.0, 312.0, 250.0, 170.0, 127.0, 96.0, 60.0, 59.0, 42.0, 36.0, 22.0, 16.0, 14.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.58984375, -2.5062255859375, -2.422607421875, -2.3389892578125, -2.25537109375, -2.1717529296875, -2.088134765625, -2.0045166015625, -1.9208984375, -1.8372802734375, -1.753662109375, -1.6700439453125, -1.58642578125, -1.5028076171875, -1.419189453125, -1.3355712890625, -1.251953125, -1.1683349609375, -1.084716796875, -1.0010986328125, -0.91748046875, -0.8338623046875, -0.750244140625, -0.6666259765625, -0.5830078125, -0.4993896484375, -0.415771484375, -0.3321533203125, -0.24853515625, -0.1649169921875, -0.081298828125, 0.0023193359375, 0.0859375, 0.1695556640625, 0.253173828125, 0.3367919921875, 0.42041015625, 0.5040283203125, 0.587646484375, 0.6712646484375, 0.7548828125, 0.8385009765625, 0.922119140625, 1.0057373046875, 1.08935546875, 1.1729736328125, 1.256591796875, 1.3402099609375, 1.423828125, 1.5074462890625, 1.591064453125, 1.6746826171875, 1.75830078125, 1.8419189453125, 1.925537109375, 2.0091552734375, 2.0927734375, 2.1763916015625, 2.260009765625, 2.3436279296875, 2.42724609375, 2.5108642578125, 2.594482421875, 2.6781005859375, 2.76171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 11.0, 4.0, 13.0, 12.0, 14.0, 16.0, 16.0, 29.0, 25.0, 21.0, 40.0, 35.0, 19.0, 41.0, 49.0, 43.0, 43.0, 43.0, 1069.0, 50.0, 35.0, 43.0, 32.0, 45.0, 35.0, 41.0, 23.0, 33.0, 22.0, 23.0, 18.0, 15.0, 18.0, 14.0, 7.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.090667724609375, -2.99774169921875, -2.904815673828125, -2.8118896484375, -2.718963623046875, -2.62603759765625, -2.533111572265625, -2.440185546875, -2.347259521484375, -2.25433349609375, -2.161407470703125, -2.0684814453125, -1.975555419921875, -1.88262939453125, -1.789703369140625, -1.69677734375, -1.603851318359375, -1.51092529296875, -1.417999267578125, -1.3250732421875, -1.232147216796875, -1.13922119140625, -1.046295166015625, -0.953369140625, -0.860443115234375, -0.76751708984375, -0.674591064453125, -0.5816650390625, -0.488739013671875, -0.39581298828125, -0.302886962890625, -0.2099609375, -0.117034912109375, -0.02410888671875, 0.068817138671875, 0.1617431640625, 0.254669189453125, 0.34759521484375, 0.440521240234375, 0.533447265625, 0.626373291015625, 0.71929931640625, 0.812225341796875, 0.9051513671875, 0.998077392578125, 1.09100341796875, 1.183929443359375, 1.27685546875, 1.369781494140625, 1.46270751953125, 1.555633544921875, 1.6485595703125, 1.741485595703125, 1.83441162109375, 1.927337646484375, 2.020263671875, 2.113189697265625, 2.20611572265625, 2.299041748046875, 2.3919677734375, 2.484893798828125, 2.57781982421875, 2.670745849609375, 2.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 6.0, 5.0, 5.0, 11.0, 11.0, 13.0, 14.0, 26.0, 38.0, 42.0, 67.0, 92.0, 150.0, 136.0, 228.0, 331.0, 567.0, 938.0, 1635.0, 3623.0, 12454.0, 162782.0, 1847369.0, 52739.0, 7625.0, 2724.0, 1342.0, 751.0, 409.0, 270.0, 200.0, 127.0, 94.0, 87.0, 49.0, 46.0, 26.0, 22.0, 18.0, 7.0, 11.0, 6.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-2.658203125, -2.580780029296875, -2.50335693359375, -2.425933837890625, -2.3485107421875, -2.271087646484375, -2.19366455078125, -2.116241455078125, -2.038818359375, -1.961395263671875, -1.88397216796875, -1.806549072265625, -1.7291259765625, -1.651702880859375, -1.57427978515625, -1.496856689453125, -1.41943359375, -1.342010498046875, -1.26458740234375, -1.187164306640625, -1.1097412109375, -1.032318115234375, -0.95489501953125, -0.877471923828125, -0.800048828125, -0.722625732421875, -0.64520263671875, -0.567779541015625, -0.4903564453125, -0.412933349609375, -0.33551025390625, -0.258087158203125, -0.1806640625, -0.103240966796875, -0.02581787109375, 0.051605224609375, 0.1290283203125, 0.206451416015625, 0.28387451171875, 0.361297607421875, 0.438720703125, 0.516143798828125, 0.59356689453125, 0.670989990234375, 0.7484130859375, 0.825836181640625, 0.90325927734375, 0.980682373046875, 1.05810546875, 1.135528564453125, 1.21295166015625, 1.290374755859375, 1.3677978515625, 1.445220947265625, 1.52264404296875, 1.600067138671875, 1.677490234375, 1.754913330078125, 1.83233642578125, 1.909759521484375, 1.9871826171875, 2.064605712890625, 2.14202880859375, 2.219451904296875, 2.296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 11.0, 34.0, 51.0, 125.0, 224.0, 244.0, 135.0, 66.0, 27.0, 14.0, 18.0, 9.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.34619140625, -0.33469390869140625, -0.3231964111328125, -0.31169891357421875, -0.300201416015625, -0.28870391845703125, -0.2772064208984375, -0.26570892333984375, -0.25421142578125, -0.24271392822265625, -0.2312164306640625, -0.21971893310546875, -0.208221435546875, -0.19672393798828125, -0.1852264404296875, -0.17372894287109375, -0.1622314453125, -0.15073394775390625, -0.1392364501953125, -0.12773895263671875, -0.116241455078125, -0.10474395751953125, -0.0932464599609375, -0.08174896240234375, -0.07025146484375, -0.05875396728515625, -0.0472564697265625, -0.03575897216796875, -0.024261474609375, -0.01276397705078125, -0.0012664794921875, 0.01023101806640625, 0.021728515625, 0.03322601318359375, 0.0447235107421875, 0.05622100830078125, 0.067718505859375, 0.07921600341796875, 0.0907135009765625, 0.10221099853515625, 0.11370849609375, 0.12520599365234375, 0.1367034912109375, 0.14820098876953125, 0.159698486328125, 0.17119598388671875, 0.1826934814453125, 0.19419097900390625, 0.2056884765625, 0.21718597412109375, 0.2286834716796875, 0.24018096923828125, 0.251678466796875, 0.26317596435546875, 0.2746734619140625, 0.28617095947265625, 0.29766845703125, 0.30916595458984375, 0.3206634521484375, 0.33216094970703125, 0.343658447265625, 0.35515594482421875, 0.3666534423828125, 0.37815093994140625, 0.3896484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 21.0, 12.0, 29.0, 39.0, 92.0, 264.0, 2707.0, 1031748.0, 12615.0, 712.0, 125.0, 62.0, 43.0, 22.0, 7.0, 9.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.10400390625, -7.8564453125, -7.60888671875, -7.361328125, -7.11376953125, -6.8662109375, -6.61865234375, -6.37109375, -6.12353515625, -5.8759765625, -5.62841796875, -5.380859375, -5.13330078125, -4.8857421875, -4.63818359375, -4.390625, -4.14306640625, -3.8955078125, -3.64794921875, -3.400390625, -3.15283203125, -2.9052734375, -2.65771484375, -2.41015625, -2.16259765625, -1.9150390625, -1.66748046875, -1.419921875, -1.17236328125, -0.9248046875, -0.67724609375, -0.4296875, -0.18212890625, 0.0654296875, 0.31298828125, 0.560546875, 0.80810546875, 1.0556640625, 1.30322265625, 1.55078125, 1.79833984375, 2.0458984375, 2.29345703125, 2.541015625, 2.78857421875, 3.0361328125, 3.28369140625, 3.53125, 3.77880859375, 4.0263671875, 4.27392578125, 4.521484375, 4.76904296875, 5.0166015625, 5.26416015625, 5.51171875, 5.75927734375, 6.0068359375, 6.25439453125, 6.501953125, 6.74951171875, 6.9970703125, 7.24462890625, 7.4921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 26.0, 227.0, 667.0, 76.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296105146408081, -3.2330474853515625, -3.169989824295044, -3.1069321632385254, -3.043874502182007, -2.9808168411254883, -2.9177591800689697, -2.854701519012451, -2.7916440963745117, -2.728586435317993, -2.6655287742614746, -2.602471113204956, -2.5394134521484375, -2.476355791091919, -2.4132981300354004, -2.350240707397461, -2.2871828079223633, -2.2241251468658447, -2.161067485809326, -2.0980098247528076, -2.034952163696289, -1.9718945026397705, -1.9088369607925415, -1.845779299736023, -1.7827216386795044, -1.7196639776229858, -1.6566063165664673, -1.5935486555099487, -1.5304911136627197, -1.4674334526062012, -1.4043757915496826, -1.341318130493164, -1.2782602310180664, -1.2152025699615479, -1.1521449089050293, -1.0890872478485107, -1.0260295867919922, -0.9629719853401184, -0.8999143838882446, -0.8368567228317261, -0.7737990617752075, -0.710741400718689, -0.6476837396621704, -0.5846261382102966, -0.5215684771537781, -0.4585108160972595, -0.39545318484306335, -0.3323955535888672, -0.26933789253234863, -0.20628024637699127, -0.1432226002216339, -0.08016495406627655, -0.01710730791091919, 0.045950353145599365, 0.10900798439979553, 0.1720656156539917, 0.23512327671051025, 0.2981809377670288, 0.361238569021225, 0.42429620027542114, 0.4873538613319397, 0.5504115223884583, 0.613469123840332, 0.6765267848968506, 0.7395844459533691]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 13.0, 15.0, 10.0, 16.0, 15.0, 23.0, 27.0, 26.0, 21.0, 30.0, 32.0, 37.0, 42.0, 34.0, 42.0, 53.0, 47.0, 33.0, 38.0, 37.0, 51.0, 41.0, 34.0, 33.0, 26.0, 34.0, 24.0, 22.0, 28.0, 17.0, 8.0, 18.0, 14.0, 4.0, 8.0, 4.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2493683099746704, -0.2419174164533615, -0.2344665229320526, -0.2270156294107437, -0.21956473588943481, -0.21211384236812592, -0.20466294884681702, -0.19721205532550812, -0.18976116180419922, -0.18231026828289032, -0.17485937476158142, -0.16740848124027252, -0.15995758771896362, -0.15250669419765472, -0.14505580067634583, -0.13760490715503693, -0.13015401363372803, -0.12270312011241913, -0.11525222659111023, -0.10780133306980133, -0.10035043954849243, -0.09289954602718353, -0.08544865250587463, -0.07799775898456573, -0.07054686546325684, -0.06309597194194794, -0.05564507842063904, -0.04819418489933014, -0.04074329137802124, -0.03329239785671234, -0.025841504335403442, -0.018390610814094543, -0.010939717292785645, -0.0034888237714767456, 0.003962069749832153, 0.011412963271141052, 0.01886385679244995, 0.02631475031375885, 0.03376564383506775, 0.04121653735637665, 0.04866743087768555, 0.056118324398994446, 0.06356921792030334, 0.07102011144161224, 0.07847100496292114, 0.08592189848423004, 0.09337279200553894, 0.10082368552684784, 0.10827457904815674, 0.11572547256946564, 0.12317636609077454, 0.13062725961208344, 0.13807815313339233, 0.14552904665470123, 0.15297994017601013, 0.16043083369731903, 0.16788172721862793, 0.17533262073993683, 0.18278351426124573, 0.19023440778255463, 0.19768530130386353, 0.20513619482517242, 0.21258708834648132, 0.22003798186779022, 0.22748887538909912]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 7.0, 8.0, 7.0, 7.0, 13.0, 14.0, 19.0, 15.0, 24.0, 26.0, 21.0, 33.0, 35.0, 31.0, 40.0, 56.0, 42.0, 38.0, 55.0, 60.0, 49.0, 50.0, 28.0, 40.0, 35.0, 33.0, 35.0, 23.0, 29.0, 25.0, 19.0, 14.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.425628662109375, -3.30242919921875, -3.179229736328125, -3.0560302734375, -2.932830810546875, -2.80963134765625, -2.686431884765625, -2.563232421875, -2.440032958984375, -2.31683349609375, -2.193634033203125, -2.0704345703125, -1.947235107421875, -1.82403564453125, -1.700836181640625, -1.57763671875, -1.454437255859375, -1.33123779296875, -1.208038330078125, -1.0848388671875, -0.961639404296875, -0.83843994140625, -0.715240478515625, -0.592041015625, -0.468841552734375, -0.34564208984375, -0.222442626953125, -0.0992431640625, 0.023956298828125, 0.14715576171875, 0.270355224609375, 0.3935546875, 0.516754150390625, 0.63995361328125, 0.763153076171875, 0.8863525390625, 1.009552001953125, 1.13275146484375, 1.255950927734375, 1.379150390625, 1.502349853515625, 1.62554931640625, 1.748748779296875, 1.8719482421875, 1.995147705078125, 2.11834716796875, 2.241546630859375, 2.36474609375, 2.487945556640625, 2.61114501953125, 2.734344482421875, 2.8575439453125, 2.980743408203125, 3.10394287109375, 3.227142333984375, 3.350341796875, 3.473541259765625, 3.59674072265625, 3.719940185546875, 3.8431396484375, 3.966339111328125, 4.08953857421875, 4.212738037109375, 4.3359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 14.0, 28.0, 23.0, 33.0, 51.0, 80.0, 105.0, 137.0, 203.0, 306.0, 430.0, 727.0, 1139.0, 1860.0, 3549.0, 7405.0, 16719.0, 45549.0, 183530.0, 558476.0, 156305.0, 41319.0, 15442.0, 6774.0, 3371.0, 1843.0, 1037.0, 680.0, 435.0, 281.0, 205.0, 150.0, 93.0, 66.0, 51.0, 33.0, 24.0, 16.0, 16.0, 7.0, 10.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.31561279296875, -5.1351318359375, -4.95465087890625, -4.774169921875, -4.59368896484375, -4.4132080078125, -4.23272705078125, -4.05224609375, -3.87176513671875, -3.6912841796875, -3.51080322265625, -3.330322265625, -3.14984130859375, -2.9693603515625, -2.78887939453125, -2.6083984375, -2.42791748046875, -2.2474365234375, -2.06695556640625, -1.886474609375, -1.70599365234375, -1.5255126953125, -1.34503173828125, -1.16455078125, -0.98406982421875, -0.8035888671875, -0.62310791015625, -0.442626953125, -0.26214599609375, -0.0816650390625, 0.09881591796875, 0.279296875, 0.45977783203125, 0.6402587890625, 0.82073974609375, 1.001220703125, 1.18170166015625, 1.3621826171875, 1.54266357421875, 1.72314453125, 1.90362548828125, 2.0841064453125, 2.26458740234375, 2.445068359375, 2.62554931640625, 2.8060302734375, 2.98651123046875, 3.1669921875, 3.34747314453125, 3.5279541015625, 3.70843505859375, 3.888916015625, 4.06939697265625, 4.2498779296875, 4.43035888671875, 4.61083984375, 4.79132080078125, 4.9718017578125, 5.15228271484375, 5.332763671875, 5.51324462890625, 5.6937255859375, 5.87420654296875, 6.0546875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 12.0, 13.0, 8.0, 17.0, 17.0, 20.0, 29.0, 24.0, 36.0, 27.0, 31.0, 44.0, 49.0, 54.0, 66.0, 165.0, 1464.0, 367.0, 124.0, 52.0, 69.0, 51.0, 35.0, 29.0, 38.0, 28.0, 22.0, 16.0, 10.0, 18.0, 12.0, 12.0, 15.0, 6.0, 8.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.26220703125, -9.9072265625, -9.55224609375, -9.197265625, -8.84228515625, -8.4873046875, -8.13232421875, -7.77734375, -7.42236328125, -7.0673828125, -6.71240234375, -6.357421875, -6.00244140625, -5.6474609375, -5.29248046875, -4.9375, -4.58251953125, -4.2275390625, -3.87255859375, -3.517578125, -3.16259765625, -2.8076171875, -2.45263671875, -2.09765625, -1.74267578125, -1.3876953125, -1.03271484375, -0.677734375, -0.32275390625, 0.0322265625, 0.38720703125, 0.7421875, 1.09716796875, 1.4521484375, 1.80712890625, 2.162109375, 2.51708984375, 2.8720703125, 3.22705078125, 3.58203125, 3.93701171875, 4.2919921875, 4.64697265625, 5.001953125, 5.35693359375, 5.7119140625, 6.06689453125, 6.421875, 6.77685546875, 7.1318359375, 7.48681640625, 7.841796875, 8.19677734375, 8.5517578125, 8.90673828125, 9.26171875, 9.61669921875, 9.9716796875, 10.32666015625, 10.681640625, 11.03662109375, 11.3916015625, 11.74658203125, 12.1015625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 10.0, 9.0, 15.0, 22.0, 23.0, 15.0, 26.0, 28.0, 41.0, 66.0, 82.0, 120.0, 164.0, 298.0, 664.0, 2009.0, 10694.0, 137560.0, 2882449.0, 99004.0, 9033.0, 1810.0, 603.0, 280.0, 190.0, 94.0, 93.0, 60.0, 47.0, 45.0, 21.0, 29.0, 13.0, 18.0, 17.0, 11.0, 7.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.890625, -17.371337890625, -16.85205078125, -16.332763671875, -15.8134765625, -15.294189453125, -14.77490234375, -14.255615234375, -13.736328125, -13.217041015625, -12.69775390625, -12.178466796875, -11.6591796875, -11.139892578125, -10.62060546875, -10.101318359375, -9.58203125, -9.062744140625, -8.54345703125, -8.024169921875, -7.5048828125, -6.985595703125, -6.46630859375, -5.947021484375, -5.427734375, -4.908447265625, -4.38916015625, -3.869873046875, -3.3505859375, -2.831298828125, -2.31201171875, -1.792724609375, -1.2734375, -0.754150390625, -0.23486328125, 0.284423828125, 0.8037109375, 1.322998046875, 1.84228515625, 2.361572265625, 2.880859375, 3.400146484375, 3.91943359375, 4.438720703125, 4.9580078125, 5.477294921875, 5.99658203125, 6.515869140625, 7.03515625, 7.554443359375, 8.07373046875, 8.593017578125, 9.1123046875, 9.631591796875, 10.15087890625, 10.670166015625, 11.189453125, 11.708740234375, 12.22802734375, 12.747314453125, 13.2666015625, 13.785888671875, 14.30517578125, 14.824462890625, 15.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 11.0, 300.0, 674.0, 30.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.324481010437012, -9.159858703613281, -4.995236396789551, -0.8306140899658203, 3.33400821685791, 7.498631477355957, 11.663252830505371, 15.827874183654785, 19.992496490478516, 24.157119750976562, 28.321741104125977, 32.48636245727539, 36.65098571777344, 40.815608978271484, 44.98023223876953, 49.14485168457031, 53.30947494506836, 57.474098205566406, 61.63871765136719, 65.8033447265625, 69.96796417236328, 74.13258361816406, 78.29721069335938, 82.46183013916016, 86.62645721435547, 90.79107666015625, 94.95570373535156, 99.12032318115234, 103.28494262695312, 107.44956970214844, 111.61418914794922, 115.77880859375, 119.94343566894531, 124.1080551147461, 128.27267456054688, 132.4373016357422, 136.6019287109375, 140.76654052734375, 144.93116760253906, 149.09579467773438, 153.26040649414062, 157.42503356933594, 161.5896453857422, 165.7542724609375, 169.9188995361328, 174.08352661132812, 178.24813842773438, 182.4127655029297, 186.577392578125, 190.7420196533203, 194.90663146972656, 199.07125854492188, 203.2358856201172, 207.4005126953125, 211.56512451171875, 215.72975158691406, 219.89437866210938, 224.0590057373047, 228.22361755371094, 232.38824462890625, 236.55287170410156, 240.71749877929688, 244.88211059570312, 249.04673767089844, 253.2113494873047]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 3.0, 10.0, 6.0, 7.0, 7.0, 14.0, 8.0, 15.0, 22.0, 34.0, 25.0, 33.0, 37.0, 26.0, 35.0, 43.0, 52.0, 43.0, 45.0, 40.0, 44.0, 47.0, 22.0, 42.0, 24.0, 37.0, 31.0, 32.0, 30.0, 28.0, 30.0, 23.0, 23.0, 16.0, 17.0, 8.0, 7.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.405521392822266, -29.41016960144043, -28.414817810058594, -27.41946792602539, -26.424116134643555, -25.42876434326172, -24.433412551879883, -23.438060760498047, -22.442710876464844, -21.447359085083008, -20.452007293701172, -19.45665740966797, -18.461305618286133, -17.465953826904297, -16.47060203552246, -15.475250244140625, -14.479898452758789, -13.484546661376953, -12.489195823669434, -11.493844032287598, -10.498493194580078, -9.503141403198242, -8.507789611816406, -7.5124382972717285, -6.517086982727051, -5.521735668182373, -4.526384353637695, -3.5310325622558594, -2.5356812477111816, -1.540329933166504, -0.544978141784668, 0.45037317276000977, 1.4457244873046875, 2.4410758018493652, 3.436427354812622, 4.431778907775879, 5.427130222320557, 6.422481536865234, 7.41783332824707, 8.413185119628906, 9.408535957336426, 10.403887748718262, 11.399238586425781, 12.394590377807617, 13.389942169189453, 14.385293006896973, 15.380644798278809, 16.375995635986328, 17.371347427368164, 18.36669921875, 19.362051010131836, 20.357402801513672, 21.352752685546875, 22.34810447692871, 23.343456268310547, 24.338808059692383, 25.33415985107422, 26.329511642456055, 27.32486343383789, 28.320213317871094, 29.31556510925293, 30.310916900634766, 31.3062686920166, 32.30162048339844, 33.29697036743164]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 6.0, 14.0, 10.0, 8.0, 8.0, 19.0, 16.0, 18.0, 15.0, 22.0, 25.0, 30.0, 40.0, 28.0, 40.0, 41.0, 45.0, 37.0, 44.0, 49.0, 32.0, 49.0, 31.0, 47.0, 37.0, 24.0, 16.0, 29.0, 37.0, 23.0, 26.0, 23.0, 11.0, 25.0, 10.0, 6.0, 7.0, 11.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.298828125, -3.183013916015625, -3.06719970703125, -2.951385498046875, -2.8355712890625, -2.719757080078125, -2.60394287109375, -2.488128662109375, -2.372314453125, -2.256500244140625, -2.14068603515625, -2.024871826171875, -1.9090576171875, -1.793243408203125, -1.67742919921875, -1.561614990234375, -1.44580078125, -1.329986572265625, -1.21417236328125, -1.098358154296875, -0.9825439453125, -0.866729736328125, -0.75091552734375, -0.635101318359375, -0.519287109375, -0.403472900390625, -0.28765869140625, -0.171844482421875, -0.0560302734375, 0.059783935546875, 0.17559814453125, 0.291412353515625, 0.4072265625, 0.523040771484375, 0.63885498046875, 0.754669189453125, 0.8704833984375, 0.986297607421875, 1.10211181640625, 1.217926025390625, 1.333740234375, 1.449554443359375, 1.56536865234375, 1.681182861328125, 1.7969970703125, 1.912811279296875, 2.02862548828125, 2.144439697265625, 2.26025390625, 2.376068115234375, 2.49188232421875, 2.607696533203125, 2.7235107421875, 2.839324951171875, 2.95513916015625, 3.070953369140625, 3.186767578125, 3.302581787109375, 3.41839599609375, 3.534210205078125, 3.6500244140625, 3.765838623046875, 3.88165283203125, 3.997467041015625, 4.11328125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 22.0, 18.0, 43.0, 60.0, 74.0, 124.0, 181.0, 276.0, 509.0, 759.0, 1196.0, 2065.0, 3902.0, 7297.0, 14377.0, 35169.0, 123656.0, 695213.0, 2307131.0, 797066.0, 133994.0, 37574.0, 15421.0, 7815.0, 4077.0, 2378.0, 1401.0, 885.0, 548.0, 341.0, 211.0, 154.0, 117.0, 68.0, 42.0, 37.0, 13.0, 21.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.05181884765625, -4.8614501953125, -4.67108154296875, -4.480712890625, -4.29034423828125, -4.0999755859375, -3.90960693359375, -3.71923828125, -3.52886962890625, -3.3385009765625, -3.14813232421875, -2.957763671875, -2.76739501953125, -2.5770263671875, -2.38665771484375, -2.1962890625, -2.00592041015625, -1.8155517578125, -1.62518310546875, -1.434814453125, -1.24444580078125, -1.0540771484375, -0.86370849609375, -0.67333984375, -0.48297119140625, -0.2926025390625, -0.10223388671875, 0.088134765625, 0.27850341796875, 0.4688720703125, 0.65924072265625, 0.849609375, 1.03997802734375, 1.2303466796875, 1.42071533203125, 1.611083984375, 1.80145263671875, 1.9918212890625, 2.18218994140625, 2.37255859375, 2.56292724609375, 2.7532958984375, 2.94366455078125, 3.134033203125, 3.32440185546875, 3.5147705078125, 3.70513916015625, 3.8955078125, 4.08587646484375, 4.2762451171875, 4.46661376953125, 4.656982421875, 4.84735107421875, 5.0377197265625, 5.22808837890625, 5.41845703125, 5.60882568359375, 5.7991943359375, 5.98956298828125, 6.179931640625, 6.37030029296875, 6.5606689453125, 6.75103759765625, 6.94140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 8.0, 4.0, 7.0, 12.0, 15.0, 23.0, 28.0, 28.0, 51.0, 53.0, 99.0, 120.0, 161.0, 248.0, 434.0, 619.0, 669.0, 509.0, 314.0, 198.0, 117.0, 86.0, 71.0, 36.0, 49.0, 29.0, 11.0, 16.0, 18.0, 11.0, 6.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.50384521484375, -5.2850341796875, -5.06622314453125, -4.847412109375, -4.62860107421875, -4.4097900390625, -4.19097900390625, -3.97216796875, -3.75335693359375, -3.5345458984375, -3.31573486328125, -3.096923828125, -2.87811279296875, -2.6593017578125, -2.44049072265625, -2.2216796875, -2.00286865234375, -1.7840576171875, -1.56524658203125, -1.346435546875, -1.12762451171875, -0.9088134765625, -0.69000244140625, -0.47119140625, -0.25238037109375, -0.0335693359375, 0.18524169921875, 0.404052734375, 0.62286376953125, 0.8416748046875, 1.06048583984375, 1.279296875, 1.49810791015625, 1.7169189453125, 1.93572998046875, 2.154541015625, 2.37335205078125, 2.5921630859375, 2.81097412109375, 3.02978515625, 3.24859619140625, 3.4674072265625, 3.68621826171875, 3.905029296875, 4.12384033203125, 4.3426513671875, 4.56146240234375, 4.7802734375, 4.99908447265625, 5.2178955078125, 5.43670654296875, 5.655517578125, 5.87432861328125, 6.0931396484375, 6.31195068359375, 6.53076171875, 6.74957275390625, 6.9683837890625, 7.18719482421875, 7.406005859375, 7.62481689453125, 7.8436279296875, 8.06243896484375, 8.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 14.0, 19.0, 21.0, 29.0, 38.0, 83.0, 88.0, 133.0, 257.0, 625.0, 2119.0, 11889.0, 140730.0, 3681257.0, 331721.0, 20339.0, 3182.0, 866.0, 318.0, 182.0, 103.0, 67.0, 46.0, 41.0, 25.0, 20.0, 12.0, 10.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.859375, -23.24169921875, -22.6240234375, -22.00634765625, -21.388671875, -20.77099609375, -20.1533203125, -19.53564453125, -18.91796875, -18.30029296875, -17.6826171875, -17.06494140625, -16.447265625, -15.82958984375, -15.2119140625, -14.59423828125, -13.9765625, -13.35888671875, -12.7412109375, -12.12353515625, -11.505859375, -10.88818359375, -10.2705078125, -9.65283203125, -9.03515625, -8.41748046875, -7.7998046875, -7.18212890625, -6.564453125, -5.94677734375, -5.3291015625, -4.71142578125, -4.09375, -3.47607421875, -2.8583984375, -2.24072265625, -1.623046875, -1.00537109375, -0.3876953125, 0.22998046875, 0.84765625, 1.46533203125, 2.0830078125, 2.70068359375, 3.318359375, 3.93603515625, 4.5537109375, 5.17138671875, 5.7890625, 6.40673828125, 7.0244140625, 7.64208984375, 8.259765625, 8.87744140625, 9.4951171875, 10.11279296875, 10.73046875, 11.34814453125, 11.9658203125, 12.58349609375, 13.201171875, 13.81884765625, 14.4365234375, 15.05419921875, 15.671875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 37.0, 91.0, 166.0, 242.0, 235.0, 120.0, 71.0, 26.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.61666488647461, -52.90502166748047, -51.19337463378906, -49.48173141479492, -47.770084381103516, -46.058441162109375, -44.34679412841797, -42.63515090942383, -40.92350387573242, -39.21186065673828, -37.500213623046875, -35.788570404052734, -34.07692337036133, -32.36528015136719, -30.65363311767578, -28.94198989868164, -27.230344772338867, -25.518699645996094, -23.80705451965332, -22.095409393310547, -20.383764266967773, -18.672119140625, -16.96047592163086, -15.24882984161377, -13.537184715270996, -11.825539588928223, -10.11389446258545, -8.402250289916992, -6.6906046867370605, -4.978960037231445, -3.267314910888672, -1.5556697845458984, 0.155975341796875, 1.8676203489303589, 3.5792653560638428, 5.290910243988037, 7.0025553703308105, 8.714200019836426, 10.4258451461792, 12.137490272521973, 13.849135398864746, 15.56078052520752, 17.272424697875977, 18.98406982421875, 20.695714950561523, 22.407360076904297, 24.11900520324707, 25.830650329589844, 27.542295455932617, 29.25394058227539, 30.965585708618164, 32.67723083496094, 34.38887405395508, 36.100521087646484, 37.812164306640625, 39.52381134033203, 41.23545455932617, 42.94709777832031, 44.65874481201172, 46.37038803100586, 48.082035064697266, 49.793678283691406, 51.50532531738281, 53.21696853637695, 54.92861557006836]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 2.0, 5.0, 6.0, 12.0, 9.0, 11.0, 18.0, 19.0, 19.0, 22.0, 31.0, 30.0, 30.0, 32.0, 44.0, 41.0, 51.0, 38.0, 45.0, 55.0, 39.0, 41.0, 40.0, 44.0, 30.0, 44.0, 42.0, 29.0, 31.0, 31.0, 21.0, 14.0, 16.0, 11.0, 8.0, 7.0, 8.0, 2.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.89798927307129, -25.143157958984375, -24.388328552246094, -23.63349723815918, -22.878665924072266, -22.123836517333984, -21.36900520324707, -20.614173889160156, -19.859344482421875, -19.10451316833496, -18.34968376159668, -17.594852447509766, -16.840023040771484, -16.08519172668457, -15.330360412597656, -14.575530052185059, -13.820699691772461, -13.065869331359863, -12.311038970947266, -11.556207656860352, -10.801377296447754, -10.046546936035156, -9.291715621948242, -8.536885261535645, -7.782054901123047, -7.027224540710449, -6.272393703460693, -5.5175628662109375, -4.76273250579834, -4.007902145385742, -3.2530713081359863, -2.4982404708862305, -1.743408203125, -0.9885776042938232, -0.23374700546264648, 0.5210835933685303, 1.275914192199707, 2.030744791030884, 2.7855753898620605, 3.5404062271118164, 4.295236587524414, 5.050066947937012, 5.804897785186768, 6.559728622436523, 7.314558982849121, 8.069389343261719, 8.824220657348633, 9.57905101776123, 10.333881378173828, 11.088711738586426, 11.843542098999023, 12.598373413085938, 13.353203773498535, 14.108034133911133, 14.862865447998047, 15.617695808410645, 16.372526168823242, 17.127357482910156, 17.882186889648438, 18.63701820373535, 19.391849517822266, 20.146678924560547, 20.90151023864746, 21.656341552734375, 22.411170959472656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 4.0, 10.0, 10.0, 4.0, 8.0, 15.0, 10.0, 14.0, 26.0, 26.0, 28.0, 23.0, 23.0, 26.0, 50.0, 39.0, 35.0, 34.0, 32.0, 40.0, 31.0, 44.0, 44.0, 42.0, 39.0, 45.0, 34.0, 36.0, 28.0, 29.0, 25.0, 21.0, 14.0, 18.0, 9.0, 12.0, 10.0, 13.0, 7.0, 12.0, 2.0, 4.0, 4.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.318359375, -3.210540771484375, -3.10272216796875, -2.994903564453125, -2.8870849609375, -2.779266357421875, -2.67144775390625, -2.563629150390625, -2.455810546875, -2.347991943359375, -2.24017333984375, -2.132354736328125, -2.0245361328125, -1.916717529296875, -1.80889892578125, -1.701080322265625, -1.59326171875, -1.485443115234375, -1.37762451171875, -1.269805908203125, -1.1619873046875, -1.054168701171875, -0.94635009765625, -0.838531494140625, -0.730712890625, -0.622894287109375, -0.51507568359375, -0.407257080078125, -0.2994384765625, -0.191619873046875, -0.08380126953125, 0.024017333984375, 0.1318359375, 0.239654541015625, 0.34747314453125, 0.455291748046875, 0.5631103515625, 0.670928955078125, 0.77874755859375, 0.886566162109375, 0.994384765625, 1.102203369140625, 1.21002197265625, 1.317840576171875, 1.4256591796875, 1.533477783203125, 1.64129638671875, 1.749114990234375, 1.85693359375, 1.964752197265625, 2.07257080078125, 2.180389404296875, 2.2882080078125, 2.396026611328125, 2.50384521484375, 2.611663818359375, 2.719482421875, 2.827301025390625, 2.93511962890625, 3.042938232421875, 3.1507568359375, 3.258575439453125, 3.36639404296875, 3.474212646484375, 3.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 10.0, 12.0, 10.0, 21.0, 21.0, 26.0, 46.0, 56.0, 74.0, 101.0, 138.0, 187.0, 272.0, 395.0, 556.0, 863.0, 1339.0, 1961.0, 3167.0, 5679.0, 10921.0, 26002.0, 325245.0, 610730.0, 32172.0, 12172.0, 6365.0, 3625.0, 2056.0, 1323.0, 930.0, 568.0, 444.0, 314.0, 204.0, 149.0, 122.0, 92.0, 47.0, 29.0, 36.0, 18.0, 20.0, 7.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6015625, -4.466552734375, -4.33154296875, -4.196533203125, -4.0615234375, -3.926513671875, -3.79150390625, -3.656494140625, -3.521484375, -3.386474609375, -3.25146484375, -3.116455078125, -2.9814453125, -2.846435546875, -2.71142578125, -2.576416015625, -2.44140625, -2.306396484375, -2.17138671875, -2.036376953125, -1.9013671875, -1.766357421875, -1.63134765625, -1.496337890625, -1.361328125, -1.226318359375, -1.09130859375, -0.956298828125, -0.8212890625, -0.686279296875, -0.55126953125, -0.416259765625, -0.28125, -0.146240234375, -0.01123046875, 0.123779296875, 0.2587890625, 0.393798828125, 0.52880859375, 0.663818359375, 0.798828125, 0.933837890625, 1.06884765625, 1.203857421875, 1.3388671875, 1.473876953125, 1.60888671875, 1.743896484375, 1.87890625, 2.013916015625, 2.14892578125, 2.283935546875, 2.4189453125, 2.553955078125, 2.68896484375, 2.823974609375, 2.958984375, 3.093994140625, 3.22900390625, 3.364013671875, 3.4990234375, 3.634033203125, 3.76904296875, 3.904052734375, 4.0390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 11.0, 5.0, 11.0, 10.0, 17.0, 12.0, 17.0, 15.0, 21.0, 25.0, 23.0, 34.0, 40.0, 33.0, 37.0, 27.0, 41.0, 49.0, 41.0, 44.0, 1068.0, 41.0, 45.0, 41.0, 36.0, 36.0, 34.0, 23.0, 18.0, 15.0, 21.0, 24.0, 14.0, 17.0, 13.0, 14.0, 8.0, 4.0, 10.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.365234375, -2.287109375, -2.208984375, -2.130859375, -2.052734375, -1.974609375, -1.896484375, -1.818359375, -1.740234375, -1.662109375, -1.583984375, -1.505859375, -1.427734375, -1.349609375, -1.271484375, -1.193359375, -1.115234375, -1.037109375, -0.958984375, -0.880859375, -0.802734375, -0.724609375, -0.646484375, -0.568359375, -0.490234375, -0.412109375, -0.333984375, -0.255859375, -0.177734375, -0.099609375, -0.021484375, 0.056640625, 0.134765625, 0.212890625, 0.291015625, 0.369140625, 0.447265625, 0.525390625, 0.603515625, 0.681640625, 0.759765625, 0.837890625, 0.916015625, 0.994140625, 1.072265625, 1.150390625, 1.228515625, 1.306640625, 1.384765625, 1.462890625, 1.541015625, 1.619140625, 1.697265625, 1.775390625, 1.853515625, 1.931640625, 2.009765625, 2.087890625, 2.166015625, 2.244140625, 2.322265625, 2.400390625, 2.478515625, 2.556640625, 2.634765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 14.0, 7.0, 10.0, 24.0, 22.0, 23.0, 41.0, 53.0, 68.0, 84.0, 105.0, 147.0, 191.0, 282.0, 418.0, 560.0, 866.0, 1394.0, 2218.0, 3776.0, 6980.0, 16241.0, 58201.0, 1621715.0, 325566.0, 32290.0, 11571.0, 5611.0, 2983.0, 1883.0, 1165.0, 724.0, 514.0, 355.0, 250.0, 188.0, 131.0, 107.0, 76.0, 55.0, 45.0, 34.0, 28.0, 16.0, 13.0, 14.0, 14.0, 15.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.0078125, -1.9447021484375, -1.881591796875, -1.8184814453125, -1.75537109375, -1.6922607421875, -1.629150390625, -1.5660400390625, -1.5029296875, -1.4398193359375, -1.376708984375, -1.3135986328125, -1.25048828125, -1.1873779296875, -1.124267578125, -1.0611572265625, -0.998046875, -0.9349365234375, -0.871826171875, -0.8087158203125, -0.74560546875, -0.6824951171875, -0.619384765625, -0.5562744140625, -0.4931640625, -0.4300537109375, -0.366943359375, -0.3038330078125, -0.24072265625, -0.1776123046875, -0.114501953125, -0.0513916015625, 0.01171875, 0.0748291015625, 0.137939453125, 0.2010498046875, 0.26416015625, 0.3272705078125, 0.390380859375, 0.4534912109375, 0.5166015625, 0.5797119140625, 0.642822265625, 0.7059326171875, 0.76904296875, 0.8321533203125, 0.895263671875, 0.9583740234375, 1.021484375, 1.0845947265625, 1.147705078125, 1.2108154296875, 1.27392578125, 1.3370361328125, 1.400146484375, 1.4632568359375, 1.5263671875, 1.5894775390625, 1.652587890625, 1.7156982421875, 1.77880859375, 1.8419189453125, 1.905029296875, 1.9681396484375, 2.03125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 12.0, 20.0, 16.0, 54.0, 188.0, 469.0, 84.0, 41.0, 18.0, 16.0, 9.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.485107421875, -0.4709625244140625, -0.456817626953125, -0.4426727294921875, -0.42852783203125, -0.4143829345703125, -0.400238037109375, -0.3860931396484375, -0.3719482421875, -0.3578033447265625, -0.343658447265625, -0.3295135498046875, -0.31536865234375, -0.3012237548828125, -0.287078857421875, -0.2729339599609375, -0.2587890625, -0.2446441650390625, -0.230499267578125, -0.2163543701171875, -0.20220947265625, -0.1880645751953125, -0.173919677734375, -0.1597747802734375, -0.1456298828125, -0.1314849853515625, -0.117340087890625, -0.1031951904296875, -0.08905029296875, -0.0749053955078125, -0.060760498046875, -0.0466156005859375, -0.032470703125, -0.0183258056640625, -0.004180908203125, 0.0099639892578125, 0.02410888671875, 0.0382537841796875, 0.052398681640625, 0.0665435791015625, 0.0806884765625, 0.0948333740234375, 0.108978271484375, 0.1231231689453125, 0.13726806640625, 0.1514129638671875, 0.165557861328125, 0.1797027587890625, 0.19384765625, 0.2079925537109375, 0.222137451171875, 0.2362823486328125, 0.25042724609375, 0.2645721435546875, 0.278717041015625, 0.2928619384765625, 0.3070068359375, 0.3211517333984375, 0.335296630859375, 0.3494415283203125, 0.36358642578125, 0.3777313232421875, 0.391876220703125, 0.4060211181640625, 0.420166015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 20.0, 36.0, 52.0, 121.0, 746.0, 41394.0, 1004242.0, 1498.0, 172.0, 63.0, 56.0, 25.0, 24.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 1.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-9.9765625, -9.6453857421875, -9.314208984375, -8.9830322265625, -8.65185546875, -8.3206787109375, -7.989501953125, -7.6583251953125, -7.3271484375, -6.9959716796875, -6.664794921875, -6.3336181640625, -6.00244140625, -5.6712646484375, -5.340087890625, -5.0089111328125, -4.677734375, -4.3465576171875, -4.015380859375, -3.6842041015625, -3.35302734375, -3.0218505859375, -2.690673828125, -2.3594970703125, -2.0283203125, -1.6971435546875, -1.365966796875, -1.0347900390625, -0.70361328125, -0.3724365234375, -0.041259765625, 0.2899169921875, 0.62109375, 0.9522705078125, 1.283447265625, 1.6146240234375, 1.94580078125, 2.2769775390625, 2.608154296875, 2.9393310546875, 3.2705078125, 3.6016845703125, 3.932861328125, 4.2640380859375, 4.59521484375, 4.9263916015625, 5.257568359375, 5.5887451171875, 5.919921875, 6.2510986328125, 6.582275390625, 6.9134521484375, 7.24462890625, 7.5758056640625, 7.906982421875, 8.2381591796875, 8.5693359375, 8.9005126953125, 9.231689453125, 9.5628662109375, 9.89404296875, 10.2252197265625, 10.556396484375, 10.8875732421875, 11.21875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 25.0, 60.0, 208.0, 361.0, 210.0, 84.0, 28.0, 15.0, 14.0, 4.0], "bins": [-1.8845131397247314, -1.8517507314682007, -1.81898832321167, -1.7862260341644287, -1.753463625907898, -1.7207012176513672, -1.6879388093948364, -1.6551764011383057, -1.6224141120910645, -1.5896517038345337, -1.556889295578003, -1.5241270065307617, -1.491364598274231, -1.4586021900177002, -1.4258397817611694, -1.3930773735046387, -1.3603150844573975, -1.3275526762008667, -1.294790267944336, -1.2620279788970947, -1.229265570640564, -1.1965031623840332, -1.1637407541275024, -1.1309783458709717, -1.098215937614441, -1.0654535293579102, -1.0326911211013794, -0.9999287724494934, -0.9671664237976074, -0.9344040155410767, -0.9016416072845459, -0.8688792586326599, -0.8361169099807739, -0.8033545017242432, -0.7705921530723572, -0.7378297448158264, -0.7050673961639404, -0.6723049879074097, -0.6395425796508789, -0.6067802309989929, -0.5740178823471069, -0.5412554740905762, -0.5084931254386902, -0.4757307171821594, -0.44296836853027344, -0.4102059602737427, -0.3774435818195343, -0.3446812033653259, -0.31191879510879517, -0.2791564166545868, -0.24639403820037842, -0.21363164484500885, -0.18086926639080048, -0.1481068879365921, -0.11534449458122253, -0.08258211612701416, -0.04981975257396698, -0.017057370394468307, 0.015705011785030365, 0.048467397689819336, 0.08122977614402771, 0.11399215459823608, 0.14675454795360565, 0.17951692640781403, 0.2122793048620224]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 14.0, 1.0, 16.0, 11.0, 16.0, 24.0, 17.0, 23.0, 28.0, 23.0, 23.0, 31.0, 37.0, 32.0, 29.0, 39.0, 28.0, 36.0, 28.0, 30.0, 45.0, 43.0, 42.0, 36.0, 29.0, 30.0, 28.0, 25.0, 24.0, 21.0, 22.0, 21.0, 17.0, 13.0, 11.0, 13.0, 13.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.29606109857559204, -0.2868116796016693, -0.2775622308254242, -0.26831281185150146, -0.25906336307525635, -0.24981392920017242, -0.2405644953250885, -0.23131507635116577, -0.22206562757492065, -0.21281619369983673, -0.2035667598247528, -0.19431732594966888, -0.18506789207458496, -0.17581845819950104, -0.16656902432441711, -0.15731960535049438, -0.14807017147541046, -0.13882073760032654, -0.12957130372524261, -0.12032186985015869, -0.11107243597507477, -0.10182300209999084, -0.09257357567548752, -0.0833241418004036, -0.07407470792531967, -0.06482527405023575, -0.055575840175151825, -0.0463264100253582, -0.03707697615027428, -0.027827542275190353, -0.01857811212539673, -0.009328678250312805, -7.924437522888184e-05, 0.009170188568532467, 0.018419621512293816, 0.02766905352473259, 0.03691848739981651, 0.046167921274900436, 0.05541735142469406, 0.06466678529977798, 0.07391621917486191, 0.08316565304994583, 0.09241508692502975, 0.10166451334953308, 0.110913947224617, 0.12016338109970093, 0.12941281497478485, 0.13866224884986877, 0.1479116827249527, 0.15716111660003662, 0.16641055047512054, 0.17565998435020447, 0.1849094182252884, 0.19415885210037231, 0.20340827107429504, 0.21265771985054016, 0.2219071388244629, 0.23115657269954681, 0.24040600657463074, 0.24965544044971466, 0.2589048743247986, 0.2681542932987213, 0.27740374207496643, 0.28665316104888916, 0.2959026098251343]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 12.0, 9.0, 6.0, 14.0, 7.0, 23.0, 21.0, 21.0, 24.0, 36.0, 20.0, 24.0, 39.0, 31.0, 38.0, 39.0, 36.0, 36.0, 38.0, 48.0, 40.0, 41.0, 35.0, 39.0, 43.0, 23.0, 29.0, 22.0, 23.0, 29.0, 19.0, 13.0, 14.0, 12.0, 15.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.453125, -3.34478759765625, -3.2364501953125, -3.12811279296875, -3.019775390625, -2.91143798828125, -2.8031005859375, -2.69476318359375, -2.58642578125, -2.47808837890625, -2.3697509765625, -2.26141357421875, -2.153076171875, -2.04473876953125, -1.9364013671875, -1.82806396484375, -1.7197265625, -1.61138916015625, -1.5030517578125, -1.39471435546875, -1.286376953125, -1.17803955078125, -1.0697021484375, -0.96136474609375, -0.85302734375, -0.74468994140625, -0.6363525390625, -0.52801513671875, -0.419677734375, -0.31134033203125, -0.2030029296875, -0.09466552734375, 0.013671875, 0.12200927734375, 0.2303466796875, 0.33868408203125, 0.447021484375, 0.55535888671875, 0.6636962890625, 0.77203369140625, 0.88037109375, 0.98870849609375, 1.0970458984375, 1.20538330078125, 1.313720703125, 1.42205810546875, 1.5303955078125, 1.63873291015625, 1.7470703125, 1.85540771484375, 1.9637451171875, 2.07208251953125, 2.180419921875, 2.28875732421875, 2.3970947265625, 2.50543212890625, 2.61376953125, 2.72210693359375, 2.8304443359375, 2.93878173828125, 3.047119140625, 3.15545654296875, 3.2637939453125, 3.37213134765625, 3.48046875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 10.0, 14.0, 11.0, 25.0, 29.0, 32.0, 54.0, 84.0, 125.0, 196.0, 353.0, 525.0, 837.0, 1493.0, 2437.0, 4392.0, 8184.0, 15934.0, 35915.0, 147168.0, 659841.0, 108590.0, 31004.0, 14077.0, 7207.0, 4005.0, 2367.0, 1430.0, 810.0, 488.0, 317.0, 197.0, 124.0, 78.0, 59.0, 43.0, 24.0, 11.0, 7.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.60546875, -7.384521484375, -7.16357421875, -6.942626953125, -6.7216796875, -6.500732421875, -6.27978515625, -6.058837890625, -5.837890625, -5.616943359375, -5.39599609375, -5.175048828125, -4.9541015625, -4.733154296875, -4.51220703125, -4.291259765625, -4.0703125, -3.849365234375, -3.62841796875, -3.407470703125, -3.1865234375, -2.965576171875, -2.74462890625, -2.523681640625, -2.302734375, -2.081787109375, -1.86083984375, -1.639892578125, -1.4189453125, -1.197998046875, -0.97705078125, -0.756103515625, -0.53515625, -0.314208984375, -0.09326171875, 0.127685546875, 0.3486328125, 0.569580078125, 0.79052734375, 1.011474609375, 1.232421875, 1.453369140625, 1.67431640625, 1.895263671875, 2.1162109375, 2.337158203125, 2.55810546875, 2.779052734375, 3.0, 3.220947265625, 3.44189453125, 3.662841796875, 3.8837890625, 4.104736328125, 4.32568359375, 4.546630859375, 4.767578125, 4.988525390625, 5.20947265625, 5.430419921875, 5.6513671875, 5.872314453125, 6.09326171875, 6.314208984375, 6.53515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 7.0, 9.0, 10.0, 16.0, 15.0, 14.0, 29.0, 25.0, 27.0, 27.0, 36.0, 42.0, 51.0, 52.0, 88.0, 111.0, 257.0, 1569.0, 170.0, 67.0, 59.0, 59.0, 41.0, 29.0, 37.0, 19.0, 23.0, 34.0, 25.0, 14.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0390625, -10.6748046875, -10.310546875, -9.9462890625, -9.58203125, -9.2177734375, -8.853515625, -8.4892578125, -8.125, -7.7607421875, -7.396484375, -7.0322265625, -6.66796875, -6.3037109375, -5.939453125, -5.5751953125, -5.2109375, -4.8466796875, -4.482421875, -4.1181640625, -3.75390625, -3.3896484375, -3.025390625, -2.6611328125, -2.296875, -1.9326171875, -1.568359375, -1.2041015625, -0.83984375, -0.4755859375, -0.111328125, 0.2529296875, 0.6171875, 0.9814453125, 1.345703125, 1.7099609375, 2.07421875, 2.4384765625, 2.802734375, 3.1669921875, 3.53125, 3.8955078125, 4.259765625, 4.6240234375, 4.98828125, 5.3525390625, 5.716796875, 6.0810546875, 6.4453125, 6.8095703125, 7.173828125, 7.5380859375, 7.90234375, 8.2666015625, 8.630859375, 8.9951171875, 9.359375, 9.7236328125, 10.087890625, 10.4521484375, 10.81640625, 11.1806640625, 11.544921875, 11.9091796875, 12.2734375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 7.0, 9.0, 17.0, 17.0, 32.0, 37.0, 51.0, 86.0, 92.0, 186.0, 372.0, 929.0, 3016.0, 15479.0, 233159.0, 2831181.0, 51387.0, 6663.0, 1592.0, 619.0, 268.0, 140.0, 76.0, 84.0, 43.0, 45.0, 27.0, 17.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.468017578125, -17.85791015625, -17.247802734375, -16.6376953125, -16.027587890625, -15.41748046875, -14.807373046875, -14.197265625, -13.587158203125, -12.97705078125, -12.366943359375, -11.7568359375, -11.146728515625, -10.53662109375, -9.926513671875, -9.31640625, -8.706298828125, -8.09619140625, -7.486083984375, -6.8759765625, -6.265869140625, -5.65576171875, -5.045654296875, -4.435546875, -3.825439453125, -3.21533203125, -2.605224609375, -1.9951171875, -1.385009765625, -0.77490234375, -0.164794921875, 0.4453125, 1.055419921875, 1.66552734375, 2.275634765625, 2.8857421875, 3.495849609375, 4.10595703125, 4.716064453125, 5.326171875, 5.936279296875, 6.54638671875, 7.156494140625, 7.7666015625, 8.376708984375, 8.98681640625, 9.596923828125, 10.20703125, 10.817138671875, 11.42724609375, 12.037353515625, 12.6474609375, 13.257568359375, 13.86767578125, 14.477783203125, 15.087890625, 15.697998046875, 16.30810546875, 16.918212890625, 17.5283203125, 18.138427734375, 18.74853515625, 19.358642578125, 19.96875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 21.0, 30.0, 116.0, 254.0, 277.0, 195.0, 74.0, 32.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.020174026489258, -14.71348762512207, -13.406801223754883, -12.100114822387695, -10.793428421020508, -9.48674201965332, -8.180055618286133, -6.873369216918945, -5.566682815551758, -4.25999641418457, -2.953310012817383, -1.6466236114501953, -0.3399372100830078, 0.9667491912841797, 2.273435592651367, 3.5801219940185547, 4.886808395385742, 6.19349479675293, 7.500181198120117, 8.806867599487305, 10.113554000854492, 11.42024040222168, 12.726926803588867, 14.033613204956055, 15.340299606323242, 16.64698600769043, 17.953672409057617, 19.260358810424805, 20.567045211791992, 21.87373161315918, 23.180418014526367, 24.487104415893555, 25.793792724609375, 27.100479125976562, 28.40716552734375, 29.713851928710938, 31.020538330078125, 32.32722473144531, 33.6339111328125, 34.94059753417969, 36.247283935546875, 37.55397033691406, 38.86065673828125, 40.16734313964844, 41.474029541015625, 42.78071594238281, 44.08740234375, 45.39408874511719, 46.700775146484375, 48.00746154785156, 49.31414794921875, 50.62083435058594, 51.927520751953125, 53.23420715332031, 54.5408935546875, 55.84757995605469, 57.154266357421875, 58.46095275878906, 59.76763916015625, 61.07432556152344, 62.381011962890625, 63.68769836425781, 64.994384765625, 66.30107116699219, 67.60775756835938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 4.0, 9.0, 4.0, 8.0, 12.0, 15.0, 26.0, 27.0, 18.0, 29.0, 35.0, 32.0, 29.0, 37.0, 46.0, 48.0, 48.0, 38.0, 43.0, 44.0, 46.0, 41.0, 38.0, 43.0, 28.0, 39.0, 25.0, 23.0, 26.0, 17.0, 18.0, 19.0, 13.0, 15.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.587955474853516, -35.603729248046875, -34.619503021240234, -33.635276794433594, -32.65105056762695, -31.666824340820312, -30.682598114013672, -29.6983699798584, -28.714143753051758, -27.729917526245117, -26.745691299438477, -25.761465072631836, -24.777238845825195, -23.793010711669922, -22.80878448486328, -21.82455825805664, -20.84033203125, -19.85610580444336, -18.87187957763672, -17.887653350830078, -16.903427124023438, -15.91919994354248, -14.93497371673584, -13.950746536254883, -12.966522216796875, -11.982295989990234, -10.998069763183594, -10.013843536376953, -9.029616355895996, -8.045390129089355, -7.061163902282715, -6.076937198638916, -5.092710494995117, -4.108484268188477, -3.1242575645446777, -2.140031337738037, -1.1558048725128174, -0.17157840728759766, 0.812647819519043, 1.7968745231628418, 2.7811007499694824, 3.765327215194702, 4.749553680419922, 5.7337799072265625, 6.718006134033203, 7.702232837677002, 8.686458587646484, 9.670685768127441, 10.654911994934082, 11.639138221740723, 12.623364448547363, 13.60759162902832, 14.591817855834961, 15.576044082641602, 16.560270309448242, 17.544496536254883, 18.528722763061523, 19.512948989868164, 20.497175216674805, 21.481401443481445, 22.465627670288086, 23.44985580444336, 24.43408203125, 25.41830825805664, 26.40253448486328]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 7.0, 11.0, 12.0, 12.0, 17.0, 18.0, 13.0, 14.0, 20.0, 29.0, 25.0, 29.0, 29.0, 26.0, 34.0, 43.0, 42.0, 31.0, 42.0, 41.0, 50.0, 30.0, 45.0, 39.0, 41.0, 32.0, 28.0, 30.0, 33.0, 21.0, 26.0, 12.0, 15.0, 17.0, 10.0, 17.0, 8.0, 5.0, 8.0, 6.0, 8.0, 4.0, 3.0, 10.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.478515625, -3.365692138671875, -3.25286865234375, -3.140045166015625, -3.0272216796875, -2.914398193359375, -2.80157470703125, -2.688751220703125, -2.575927734375, -2.463104248046875, -2.35028076171875, -2.237457275390625, -2.1246337890625, -2.011810302734375, -1.89898681640625, -1.786163330078125, -1.67333984375, -1.560516357421875, -1.44769287109375, -1.334869384765625, -1.2220458984375, -1.109222412109375, -0.99639892578125, -0.883575439453125, -0.770751953125, -0.657928466796875, -0.54510498046875, -0.432281494140625, -0.3194580078125, -0.206634521484375, -0.09381103515625, 0.019012451171875, 0.1318359375, 0.244659423828125, 0.35748291015625, 0.470306396484375, 0.5831298828125, 0.695953369140625, 0.80877685546875, 0.921600341796875, 1.034423828125, 1.147247314453125, 1.26007080078125, 1.372894287109375, 1.4857177734375, 1.598541259765625, 1.71136474609375, 1.824188232421875, 1.93701171875, 2.049835205078125, 2.16265869140625, 2.275482177734375, 2.3883056640625, 2.501129150390625, 2.61395263671875, 2.726776123046875, 2.839599609375, 2.952423095703125, 3.06524658203125, 3.178070068359375, 3.2908935546875, 3.403717041015625, 3.51654052734375, 3.629364013671875, 3.7421875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 6.0, 18.0, 18.0, 27.0, 40.0, 48.0, 85.0, 136.0, 221.0, 366.0, 600.0, 1083.0, 1885.0, 3800.0, 7936.0, 17823.0, 48403.0, 232222.0, 1652444.0, 1876167.0, 261764.0, 52319.0, 18795.0, 8609.0, 4223.0, 2252.0, 1187.0, 670.0, 409.0, 263.0, 174.0, 88.0, 67.0, 43.0, 23.0, 17.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.4761962890625, -6.253173828125, -6.0301513671875, -5.80712890625, -5.5841064453125, -5.361083984375, -5.1380615234375, -4.9150390625, -4.6920166015625, -4.468994140625, -4.2459716796875, -4.02294921875, -3.7999267578125, -3.576904296875, -3.3538818359375, -3.130859375, -2.9078369140625, -2.684814453125, -2.4617919921875, -2.23876953125, -2.0157470703125, -1.792724609375, -1.5697021484375, -1.3466796875, -1.1236572265625, -0.900634765625, -0.6776123046875, -0.45458984375, -0.2315673828125, -0.008544921875, 0.2144775390625, 0.4375, 0.6605224609375, 0.883544921875, 1.1065673828125, 1.32958984375, 1.5526123046875, 1.775634765625, 1.9986572265625, 2.2216796875, 2.4447021484375, 2.667724609375, 2.8907470703125, 3.11376953125, 3.3367919921875, 3.559814453125, 3.7828369140625, 4.005859375, 4.2288818359375, 4.451904296875, 4.6749267578125, 4.89794921875, 5.1209716796875, 5.343994140625, 5.5670166015625, 5.7900390625, 6.0130615234375, 6.236083984375, 6.4591064453125, 6.68212890625, 6.9051513671875, 7.128173828125, 7.3511962890625, 7.57421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 8.0, 5.0, 12.0, 20.0, 17.0, 29.0, 36.0, 52.0, 94.0, 118.0, 157.0, 324.0, 531.0, 765.0, 686.0, 430.0, 257.0, 159.0, 110.0, 67.0, 46.0, 42.0, 27.0, 19.0, 18.0, 10.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.65234375, -7.39569091796875, -7.1390380859375, -6.88238525390625, -6.625732421875, -6.36907958984375, -6.1124267578125, -5.85577392578125, -5.59912109375, -5.34246826171875, -5.0858154296875, -4.82916259765625, -4.572509765625, -4.31585693359375, -4.0592041015625, -3.80255126953125, -3.5458984375, -3.28924560546875, -3.0325927734375, -2.77593994140625, -2.519287109375, -2.26263427734375, -2.0059814453125, -1.74932861328125, -1.49267578125, -1.23602294921875, -0.9793701171875, -0.72271728515625, -0.466064453125, -0.20941162109375, 0.0472412109375, 0.30389404296875, 0.560546875, 0.81719970703125, 1.0738525390625, 1.33050537109375, 1.587158203125, 1.84381103515625, 2.1004638671875, 2.35711669921875, 2.61376953125, 2.87042236328125, 3.1270751953125, 3.38372802734375, 3.640380859375, 3.89703369140625, 4.1536865234375, 4.41033935546875, 4.6669921875, 4.92364501953125, 5.1802978515625, 5.43695068359375, 5.693603515625, 5.95025634765625, 6.2069091796875, 6.46356201171875, 6.72021484375, 6.97686767578125, 7.2335205078125, 7.49017333984375, 7.746826171875, 8.00347900390625, 8.2601318359375, 8.51678466796875, 8.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 60.0, 82.0, 141.0, 278.0, 622.0, 2339.0, 17320.0, 564935.0, 3549130.0, 52812.0, 4631.0, 979.0, 366.0, 193.0, 94.0, 58.0, 34.0, 18.0, 27.0, 13.0, 6.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.390625, -25.618896484375, -24.84716796875, -24.075439453125, -23.3037109375, -22.531982421875, -21.76025390625, -20.988525390625, -20.216796875, -19.445068359375, -18.67333984375, -17.901611328125, -17.1298828125, -16.358154296875, -15.58642578125, -14.814697265625, -14.04296875, -13.271240234375, -12.49951171875, -11.727783203125, -10.9560546875, -10.184326171875, -9.41259765625, -8.640869140625, -7.869140625, -7.097412109375, -6.32568359375, -5.553955078125, -4.7822265625, -4.010498046875, -3.23876953125, -2.467041015625, -1.6953125, -0.923583984375, -0.15185546875, 0.619873046875, 1.3916015625, 2.163330078125, 2.93505859375, 3.706787109375, 4.478515625, 5.250244140625, 6.02197265625, 6.793701171875, 7.5654296875, 8.337158203125, 9.10888671875, 9.880615234375, 10.65234375, 11.424072265625, 12.19580078125, 12.967529296875, 13.7392578125, 14.510986328125, 15.28271484375, 16.054443359375, 16.826171875, 17.597900390625, 18.36962890625, 19.141357421875, 19.9130859375, 20.684814453125, 21.45654296875, 22.228271484375, 23.0]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 59.0, 278.0, 515.0, 128.0, 23.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-216.75743103027344, -212.90518188476562, -209.0529327392578, -205.20069885253906, -201.34844970703125, -197.49620056152344, -193.64395141601562, -189.79171752929688, -185.93946838378906, -182.08721923828125, -178.23497009277344, -174.3827362060547, -170.53048706054688, -166.67823791503906, -162.82598876953125, -158.9737548828125, -155.1215057373047, -151.26925659179688, -147.41700744628906, -143.5647735595703, -139.7125244140625, -135.8602752685547, -132.00802612304688, -128.15579223632812, -124.30353546142578, -120.45128631591797, -116.59904479980469, -112.74679565429688, -108.8945541381836, -105.04230499267578, -101.1900634765625, -97.33781433105469, -93.48558044433594, -89.63333129882812, -85.78108978271484, -81.92884063720703, -78.07659912109375, -74.22434997558594, -70.37210845947266, -66.51985931396484, -62.66761016845703, -58.815364837646484, -54.96311950683594, -51.11087417602539, -47.258628845214844, -43.40637969970703, -39.55413818359375, -35.70188903808594, -31.849647521972656, -27.99740219116211, -24.145156860351562, -20.292911529541016, -16.44066619873047, -12.588418960571289, -8.736173629760742, -4.883928298950195, -1.0316829681396484, 2.8205626010894775, 6.6728081703186035, 10.525053977966309, 14.377299308776855, 18.22954559326172, 22.081790924072266, 25.934036254882812, 29.78628158569336]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 10.0, 14.0, 6.0, 22.0, 18.0, 20.0, 35.0, 28.0, 38.0, 37.0, 40.0, 38.0, 42.0, 42.0, 45.0, 48.0, 53.0, 44.0, 36.0, 44.0, 42.0, 29.0, 40.0, 23.0, 26.0, 26.0, 21.0, 22.0, 21.0, 19.0, 9.0, 6.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.454151153564453, -22.71558380126953, -21.977014541625977, -21.238447189331055, -20.4998779296875, -19.761310577392578, -19.022743225097656, -18.284175872802734, -17.54560661315918, -16.807039260864258, -16.068470001220703, -15.329902648925781, -14.591334342956543, -13.852766036987305, -13.114198684692383, -12.375630378723145, -11.637062072753906, -10.898493766784668, -10.15992546081543, -9.421358108520508, -8.68278980255127, -7.944221496582031, -7.205653667449951, -6.467085838317871, -5.728517532348633, -4.9899492263793945, -4.2513813972473145, -3.5128133296966553, -2.774245262145996, -2.035677194595337, -1.2971091270446777, -0.5585412979125977, 0.18002891540527344, 0.9185969829559326, 1.6571650505065918, 2.395733118057251, 3.13430118560791, 3.8728692531585693, 4.6114373207092285, 5.350005149841309, 6.088573455810547, 6.827141761779785, 7.565709590911865, 8.304277420043945, 9.042845726013184, 9.781414031982422, 10.519981384277344, 11.258549690246582, 11.99711799621582, 12.735686302185059, 13.474254608154297, 14.212821960449219, 14.951390266418457, 15.689958572387695, 16.428525924682617, 17.167095184326172, 17.905662536621094, 18.644229888916016, 19.38279914855957, 20.121366500854492, 20.859935760498047, 21.59850311279297, 22.33707046508789, 23.075637817382812, 23.814207077026367]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 9.0, 10.0, 16.0, 22.0, 14.0, 28.0, 28.0, 27.0, 31.0, 42.0, 36.0, 42.0, 47.0, 45.0, 44.0, 49.0, 41.0, 42.0, 47.0, 40.0, 43.0, 29.0, 31.0, 31.0, 38.0, 28.0, 16.0, 15.0, 16.0, 16.0, 12.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.15234375, -4.02862548828125, -3.9049072265625, -3.78118896484375, -3.657470703125, -3.53375244140625, -3.4100341796875, -3.28631591796875, -3.16259765625, -3.03887939453125, -2.9151611328125, -2.79144287109375, -2.667724609375, -2.54400634765625, -2.4202880859375, -2.29656982421875, -2.1728515625, -2.04913330078125, -1.9254150390625, -1.80169677734375, -1.677978515625, -1.55426025390625, -1.4305419921875, -1.30682373046875, -1.18310546875, -1.05938720703125, -0.9356689453125, -0.81195068359375, -0.688232421875, -0.56451416015625, -0.4407958984375, -0.31707763671875, -0.193359375, -0.06964111328125, 0.0540771484375, 0.17779541015625, 0.301513671875, 0.42523193359375, 0.5489501953125, 0.67266845703125, 0.79638671875, 0.92010498046875, 1.0438232421875, 1.16754150390625, 1.291259765625, 1.41497802734375, 1.5386962890625, 1.66241455078125, 1.7861328125, 1.90985107421875, 2.0335693359375, 2.15728759765625, 2.281005859375, 2.40472412109375, 2.5284423828125, 2.65216064453125, 2.77587890625, 2.89959716796875, 3.0233154296875, 3.14703369140625, 3.270751953125, 3.39447021484375, 3.5181884765625, 3.64190673828125, 3.765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 12.0, 28.0, 37.0, 47.0, 58.0, 101.0, 150.0, 175.0, 236.0, 333.0, 456.0, 658.0, 962.0, 1445.0, 2505.0, 5621.0, 45421.0, 927898.0, 49286.0, 5743.0, 2502.0, 1529.0, 997.0, 656.0, 488.0, 371.0, 224.0, 181.0, 130.0, 99.0, 66.0, 40.0, 33.0, 19.0, 15.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.5400390625, -4.400390625, -4.2607421875, -4.12109375, -3.9814453125, -3.841796875, -3.7021484375, -3.5625, -3.4228515625, -3.283203125, -3.1435546875, -3.00390625, -2.8642578125, -2.724609375, -2.5849609375, -2.4453125, -2.3056640625, -2.166015625, -2.0263671875, -1.88671875, -1.7470703125, -1.607421875, -1.4677734375, -1.328125, -1.1884765625, -1.048828125, -0.9091796875, -0.76953125, -0.6298828125, -0.490234375, -0.3505859375, -0.2109375, -0.0712890625, 0.068359375, 0.2080078125, 0.34765625, 0.4873046875, 0.626953125, 0.7666015625, 0.90625, 1.0458984375, 1.185546875, 1.3251953125, 1.46484375, 1.6044921875, 1.744140625, 1.8837890625, 2.0234375, 2.1630859375, 2.302734375, 2.4423828125, 2.58203125, 2.7216796875, 2.861328125, 3.0009765625, 3.140625, 3.2802734375, 3.419921875, 3.5595703125, 3.69921875, 3.8388671875, 3.978515625, 4.1181640625, 4.2578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 1.0, 12.0, 14.0, 17.0, 10.0, 10.0, 11.0, 18.0, 26.0, 27.0, 17.0, 32.0, 32.0, 43.0, 41.0, 37.0, 31.0, 52.0, 1058.0, 49.0, 42.0, 41.0, 30.0, 35.0, 39.0, 26.0, 36.0, 33.0, 36.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 9.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.66796875, -2.588836669921875, -2.50970458984375, -2.430572509765625, -2.3514404296875, -2.272308349609375, -2.19317626953125, -2.114044189453125, -2.034912109375, -1.955780029296875, -1.87664794921875, -1.797515869140625, -1.7183837890625, -1.639251708984375, -1.56011962890625, -1.480987548828125, -1.40185546875, -1.322723388671875, -1.24359130859375, -1.164459228515625, -1.0853271484375, -1.006195068359375, -0.92706298828125, -0.847930908203125, -0.768798828125, -0.689666748046875, -0.61053466796875, -0.531402587890625, -0.4522705078125, -0.373138427734375, -0.29400634765625, -0.214874267578125, -0.1357421875, -0.056610107421875, 0.02252197265625, 0.101654052734375, 0.1807861328125, 0.259918212890625, 0.33905029296875, 0.418182373046875, 0.497314453125, 0.576446533203125, 0.65557861328125, 0.734710693359375, 0.8138427734375, 0.892974853515625, 0.97210693359375, 1.051239013671875, 1.13037109375, 1.209503173828125, 1.28863525390625, 1.367767333984375, 1.4468994140625, 1.526031494140625, 1.60516357421875, 1.684295654296875, 1.763427734375, 1.842559814453125, 1.92169189453125, 2.000823974609375, 2.0799560546875, 2.159088134765625, 2.23822021484375, 2.317352294921875, 2.396484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 5.0, 9.0, 6.0, 13.0, 19.0, 39.0, 48.0, 63.0, 81.0, 137.0, 185.0, 257.0, 390.0, 578.0, 797.0, 1393.0, 2353.0, 5039.0, 18022.0, 406766.0, 1620585.0, 27345.0, 5955.0, 2713.0, 1430.0, 944.0, 568.0, 416.0, 287.0, 198.0, 163.0, 104.0, 64.0, 42.0, 35.0, 23.0, 20.0, 12.0, 11.0, 6.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.13671875, -2.0758514404296875, -2.014984130859375, -1.9541168212890625, -1.89324951171875, -1.8323822021484375, -1.771514892578125, -1.7106475830078125, -1.6497802734375, -1.5889129638671875, -1.528045654296875, -1.4671783447265625, -1.40631103515625, -1.3454437255859375, -1.284576416015625, -1.2237091064453125, -1.162841796875, -1.1019744873046875, -1.041107177734375, -0.9802398681640625, -0.91937255859375, -0.8585052490234375, -0.797637939453125, -0.7367706298828125, -0.6759033203125, -0.6150360107421875, -0.554168701171875, -0.4933013916015625, -0.43243408203125, -0.3715667724609375, -0.310699462890625, -0.2498321533203125, -0.18896484375, -0.1280975341796875, -0.067230224609375, -0.0063629150390625, 0.05450439453125, 0.1153717041015625, 0.176239013671875, 0.2371063232421875, 0.2979736328125, 0.3588409423828125, 0.419708251953125, 0.4805755615234375, 0.54144287109375, 0.6023101806640625, 0.663177490234375, 0.7240447998046875, 0.784912109375, 0.8457794189453125, 0.906646728515625, 0.9675140380859375, 1.02838134765625, 1.0892486572265625, 1.150115966796875, 1.2109832763671875, 1.2718505859375, 1.3327178955078125, 1.393585205078125, 1.4544525146484375, 1.51531982421875, 1.5761871337890625, 1.637054443359375, 1.6979217529296875, 1.7587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 6.0, 9.0, 18.0, 18.0, 8.0, 20.0, 26.0, 31.0, 48.0, 100.0, 206.0, 168.0, 95.0, 63.0, 43.0, 28.0, 21.0, 14.0, 14.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09587287902832031, -0.09305191040039062, -0.09023094177246094, -0.08740997314453125, -0.08458900451660156, -0.08176803588867188, -0.07894706726074219, -0.0761260986328125, -0.07330513000488281, -0.07048416137695312, -0.06766319274902344, -0.06484222412109375, -0.06202125549316406, -0.059200286865234375, -0.05637931823730469, -0.053558349609375, -0.05073738098144531, -0.047916412353515625, -0.04509544372558594, -0.04227447509765625, -0.03945350646972656, -0.036632537841796875, -0.03381156921386719, -0.0309906005859375, -0.028169631958007812, -0.025348663330078125, -0.022527694702148438, -0.01970672607421875, -0.016885757446289062, -0.014064788818359375, -0.011243820190429688, -0.0084228515625, -0.0056018829345703125, -0.002780914306640625, 4.00543212890625e-05, 0.00286102294921875, 0.0056819915771484375, 0.008502960205078125, 0.011323928833007812, 0.0141448974609375, 0.016965866088867188, 0.019786834716796875, 0.022607803344726562, 0.02542877197265625, 0.028249740600585938, 0.031070709228515625, 0.03389167785644531, 0.036712646484375, 0.03953361511230469, 0.042354583740234375, 0.04517555236816406, 0.04799652099609375, 0.05081748962402344, 0.053638458251953125, 0.05645942687988281, 0.0592803955078125, 0.06210136413574219, 0.06492233276367188, 0.06774330139160156, 0.07056427001953125, 0.07338523864746094, 0.07620620727539062, 0.07902717590332031, 0.08184814453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 14.0, 18.0, 38.0, 49.0, 104.0, 221.0, 1116.0, 1040445.0, 5819.0, 336.0, 124.0, 62.0, 41.0, 26.0, 13.0, 19.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.962249755859375, -1.89129638671875, -1.820343017578125, -1.7493896484375, -1.678436279296875, -1.60748291015625, -1.536529541015625, -1.465576171875, -1.394622802734375, -1.32366943359375, -1.252716064453125, -1.1817626953125, -1.110809326171875, -1.03985595703125, -0.968902587890625, -0.89794921875, -0.826995849609375, -0.75604248046875, -0.685089111328125, -0.6141357421875, -0.543182373046875, -0.47222900390625, -0.401275634765625, -0.330322265625, -0.259368896484375, -0.18841552734375, -0.117462158203125, -0.0465087890625, 0.024444580078125, 0.09539794921875, 0.166351318359375, 0.2373046875, 0.308258056640625, 0.37921142578125, 0.450164794921875, 0.5211181640625, 0.592071533203125, 0.66302490234375, 0.733978271484375, 0.804931640625, 0.875885009765625, 0.94683837890625, 1.017791748046875, 1.0887451171875, 1.159698486328125, 1.23065185546875, 1.301605224609375, 1.37255859375, 1.443511962890625, 1.51446533203125, 1.585418701171875, 1.6563720703125, 1.727325439453125, 1.79827880859375, 1.869232177734375, 1.940185546875, 2.011138916015625, 2.08209228515625, 2.153045654296875, 2.2239990234375, 2.294952392578125, 2.36590576171875, 2.436859130859375, 2.5078125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 6.0, 34.0, 92.0, 325.0, 385.0, 135.0, 28.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06273401528596878, -0.05401284620165825, -0.04529167711734772, -0.036570508033037186, -0.027849338948726654, -0.019128169864416122, -0.01040700078010559, -0.0016858316957950592, 0.007035337388515472, 0.015756506472826004, 0.024477675557136536, 0.03319884464144707, 0.0419200137257576, 0.05064118281006813, 0.05936235189437866, 0.06808352470397949, 0.07680469006299973, 0.08552585542201996, 0.09424702823162079, 0.10296820104122162, 0.11168936640024185, 0.12041053175926208, 0.12913170456886292, 0.13785287737846375, 0.14657405018806458, 0.1552952229976654, 0.16401639580726624, 0.17273755371570587, 0.1814587265253067, 0.19017989933490753, 0.19890105724334717, 0.207622230052948, 0.21634337306022644, 0.22506454586982727, 0.2337857186794281, 0.24250687658786774, 0.2512280344963074, 0.2599492073059082, 0.26867038011550903, 0.27739155292510986, 0.2861127257347107, 0.2948338985443115, 0.30355507135391235, 0.3122762441635132, 0.320997416973114, 0.32971855998039246, 0.3384397327899933, 0.3471609055995941, 0.35588207840919495, 0.3646032512187958, 0.3733244240283966, 0.38204559683799744, 0.3907667398452759, 0.3994879126548767, 0.40820908546447754, 0.41693025827407837, 0.4256514310836792, 0.43437260389328003, 0.44309377670288086, 0.4518149495124817, 0.4605361223220825, 0.46925726532936096, 0.4779784381389618, 0.4866996109485626, 0.49542078375816345]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 11.0, 13.0, 3.0, 13.0, 15.0, 25.0, 11.0, 25.0, 21.0, 33.0, 38.0, 36.0, 39.0, 43.0, 54.0, 33.0, 53.0, 49.0, 47.0, 47.0, 34.0, 37.0, 31.0, 42.0, 34.0, 30.0, 27.0, 23.0, 18.0, 27.0, 16.0, 11.0, 10.0, 8.0, 9.0, 9.0, 9.0, 10.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07050657272338867, -0.06814620643854141, -0.06578584015369415, -0.06342548131942749, -0.06106511503458023, -0.05870474874973297, -0.05634438619017601, -0.05398402363061905, -0.05162365734577179, -0.04926329106092453, -0.04690292850136757, -0.04454256594181061, -0.04218219965696335, -0.03982183337211609, -0.03746147081255913, -0.03510110825300217, -0.03274074196815491, -0.030380377545952797, -0.028020013123750687, -0.025659648701548576, -0.023299284279346466, -0.020938919857144356, -0.018578555434942245, -0.016218191012740135, -0.013857826590538025, -0.011497462168335915, -0.009137097746133804, -0.006776733323931694, -0.004416368901729584, -0.0020560044795274734, 0.00030435994267463684, 0.002664724364876747, 0.005025088787078857, 0.007385453209280968, 0.009745817631483078, 0.012106182053685188, 0.014466546475887299, 0.01682691089808941, 0.01918727532029152, 0.02154763974249363, 0.02390800416469574, 0.02626836858689785, 0.02862873300909996, 0.03098909743130207, 0.03334946185350418, 0.03570982813835144, 0.0380701906979084, 0.04043055325746536, 0.04279091954231262, 0.04515128582715988, 0.04751164838671684, 0.049872010946273804, 0.05223237723112106, 0.05459274351596832, 0.056953106075525284, 0.059313468635082245, 0.061673834919929504, 0.06403420120477676, 0.06639456748962402, 0.06875492632389069, 0.07111529260873795, 0.0734756588935852, 0.07583601772785187, 0.07819638401269913, 0.08055675029754639]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 14.0, 13.0, 12.0, 23.0, 33.0, 22.0, 25.0, 36.0, 30.0, 43.0, 42.0, 39.0, 40.0, 45.0, 34.0, 39.0, 33.0, 44.0, 52.0, 46.0, 38.0, 40.0, 26.0, 27.0, 26.0, 37.0, 20.0, 20.0, 20.0, 10.0, 6.0, 13.0, 10.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.830535888671875, -3.70989990234375, -3.589263916015625, -3.4686279296875, -3.347991943359375, -3.22735595703125, -3.106719970703125, -2.986083984375, -2.865447998046875, -2.74481201171875, -2.624176025390625, -2.5035400390625, -2.382904052734375, -2.26226806640625, -2.141632080078125, -2.02099609375, -1.900360107421875, -1.77972412109375, -1.659088134765625, -1.5384521484375, -1.417816162109375, -1.29718017578125, -1.176544189453125, -1.055908203125, -0.935272216796875, -0.81463623046875, -0.694000244140625, -0.5733642578125, -0.452728271484375, -0.33209228515625, -0.211456298828125, -0.0908203125, 0.029815673828125, 0.15045166015625, 0.271087646484375, 0.3917236328125, 0.512359619140625, 0.63299560546875, 0.753631591796875, 0.874267578125, 0.994903564453125, 1.11553955078125, 1.236175537109375, 1.3568115234375, 1.477447509765625, 1.59808349609375, 1.718719482421875, 1.83935546875, 1.959991455078125, 2.08062744140625, 2.201263427734375, 2.3218994140625, 2.442535400390625, 2.56317138671875, 2.683807373046875, 2.804443359375, 2.925079345703125, 3.04571533203125, 3.166351318359375, 3.2869873046875, 3.407623291015625, 3.52825927734375, 3.648895263671875, 3.76953125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 8.0, 10.0, 14.0, 22.0, 15.0, 36.0, 51.0, 98.0, 182.0, 263.0, 467.0, 814.0, 1392.0, 2553.0, 4555.0, 8625.0, 16743.0, 33556.0, 70581.0, 170923.0, 386490.0, 196624.0, 78662.0, 36677.0, 18382.0, 9366.0, 5042.0, 2701.0, 1507.0, 922.0, 495.0, 293.0, 161.0, 114.0, 70.0, 36.0, 29.0, 19.0, 13.0, 14.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.65234375, -6.45416259765625, -6.2559814453125, -6.05780029296875, -5.859619140625, -5.66143798828125, -5.4632568359375, -5.26507568359375, -5.06689453125, -4.86871337890625, -4.6705322265625, -4.47235107421875, -4.274169921875, -4.07598876953125, -3.8778076171875, -3.67962646484375, -3.4814453125, -3.28326416015625, -3.0850830078125, -2.88690185546875, -2.688720703125, -2.49053955078125, -2.2923583984375, -2.09417724609375, -1.89599609375, -1.69781494140625, -1.4996337890625, -1.30145263671875, -1.103271484375, -0.90509033203125, -0.7069091796875, -0.50872802734375, -0.310546875, -0.11236572265625, 0.0858154296875, 0.28399658203125, 0.482177734375, 0.68035888671875, 0.8785400390625, 1.07672119140625, 1.27490234375, 1.47308349609375, 1.6712646484375, 1.86944580078125, 2.067626953125, 2.26580810546875, 2.4639892578125, 2.66217041015625, 2.8603515625, 3.05853271484375, 3.2567138671875, 3.45489501953125, 3.653076171875, 3.85125732421875, 4.0494384765625, 4.24761962890625, 4.44580078125, 4.64398193359375, 4.8421630859375, 5.04034423828125, 5.238525390625, 5.43670654296875, 5.6348876953125, 5.83306884765625, 6.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 8.0, 11.0, 17.0, 13.0, 19.0, 17.0, 23.0, 31.0, 24.0, 33.0, 45.0, 46.0, 48.0, 56.0, 90.0, 104.0, 169.0, 1367.0, 245.0, 144.0, 91.0, 44.0, 43.0, 36.0, 35.0, 40.0, 25.0, 24.0, 25.0, 23.0, 27.0, 15.0, 19.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 7.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.43505859375, -9.1279296875, -8.82080078125, -8.513671875, -8.20654296875, -7.8994140625, -7.59228515625, -7.28515625, -6.97802734375, -6.6708984375, -6.36376953125, -6.056640625, -5.74951171875, -5.4423828125, -5.13525390625, -4.828125, -4.52099609375, -4.2138671875, -3.90673828125, -3.599609375, -3.29248046875, -2.9853515625, -2.67822265625, -2.37109375, -2.06396484375, -1.7568359375, -1.44970703125, -1.142578125, -0.83544921875, -0.5283203125, -0.22119140625, 0.0859375, 0.39306640625, 0.7001953125, 1.00732421875, 1.314453125, 1.62158203125, 1.9287109375, 2.23583984375, 2.54296875, 2.85009765625, 3.1572265625, 3.46435546875, 3.771484375, 4.07861328125, 4.3857421875, 4.69287109375, 5.0, 5.30712890625, 5.6142578125, 5.92138671875, 6.228515625, 6.53564453125, 6.8427734375, 7.14990234375, 7.45703125, 7.76416015625, 8.0712890625, 8.37841796875, 8.685546875, 8.99267578125, 9.2998046875, 9.60693359375, 9.9140625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 15.0, 9.0, 19.0, 15.0, 36.0, 32.0, 69.0, 112.0, 187.0, 376.0, 701.0, 1793.0, 4835.0, 18409.0, 118770.0, 2476881.0, 465775.0, 43428.0, 9224.0, 2744.0, 1123.0, 513.0, 267.0, 143.0, 71.0, 44.0, 29.0, 22.0, 20.0, 8.0, 7.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.234375, -13.721435546875, -13.20849609375, -12.695556640625, -12.1826171875, -11.669677734375, -11.15673828125, -10.643798828125, -10.130859375, -9.617919921875, -9.10498046875, -8.592041015625, -8.0791015625, -7.566162109375, -7.05322265625, -6.540283203125, -6.02734375, -5.514404296875, -5.00146484375, -4.488525390625, -3.9755859375, -3.462646484375, -2.94970703125, -2.436767578125, -1.923828125, -1.410888671875, -0.89794921875, -0.385009765625, 0.1279296875, 0.640869140625, 1.15380859375, 1.666748046875, 2.1796875, 2.692626953125, 3.20556640625, 3.718505859375, 4.2314453125, 4.744384765625, 5.25732421875, 5.770263671875, 6.283203125, 6.796142578125, 7.30908203125, 7.822021484375, 8.3349609375, 8.847900390625, 9.36083984375, 9.873779296875, 10.38671875, 10.899658203125, 11.41259765625, 11.925537109375, 12.4384765625, 12.951416015625, 13.46435546875, 13.977294921875, 14.490234375, 15.003173828125, 15.51611328125, 16.029052734375, 16.5419921875, 17.054931640625, 17.56787109375, 18.080810546875, 18.59375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 17.0, 205.0, 531.0, 226.0, 30.0, 5.0, 1.0], "bins": [-228.764404296875, -224.92250061035156, -221.08059692382812, -217.23870849609375, -213.3968048095703, -209.55490112304688, -205.71299743652344, -201.87110900878906, -198.02920532226562, -194.1873016357422, -190.34539794921875, -186.50350952148438, -182.66160583496094, -178.8197021484375, -174.97779846191406, -171.1359100341797, -167.29400634765625, -163.4521026611328, -159.61019897460938, -155.768310546875, -151.92640686035156, -148.08450317382812, -144.2425994873047, -140.4007110595703, -136.55880737304688, -132.71690368652344, -128.875, -125.0331039428711, -121.19120788574219, -117.34930419921875, -113.50740814208984, -109.6655044555664, -105.82360076904297, -101.98169708251953, -98.13980102539062, -94.29789733886719, -90.45600128173828, -86.61409759521484, -82.77220153808594, -78.9302978515625, -75.08839416503906, -71.24649047851562, -67.40459442138672, -63.56269454956055, -59.720794677734375, -55.87889099121094, -52.03699493408203, -48.195091247558594, -44.35319519042969, -40.511295318603516, -36.669395446777344, -32.82749557495117, -28.985595703125, -25.143693923950195, -21.301794052124023, -17.45989418029785, -13.617996215820312, -9.77609634399414, -5.9341959953308105, -2.0922956466674805, 1.7496042251586914, 5.59150505065918, 9.433404922485352, 13.275304794311523, 17.117204666137695]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 14.0, 22.0, 15.0, 20.0, 13.0, 28.0, 26.0, 24.0, 35.0, 43.0, 39.0, 40.0, 43.0, 44.0, 37.0, 43.0, 43.0, 42.0, 40.0, 33.0, 31.0, 31.0, 28.0, 37.0, 17.0, 23.0, 30.0, 22.0, 14.0, 21.0, 12.0, 9.0, 11.0, 8.0, 7.0, 5.0, 10.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.797935485839844, -23.97972297668457, -23.161510467529297, -22.343297958374023, -21.52508544921875, -20.706871032714844, -19.888660430908203, -19.070446014404297, -18.252233505249023, -17.43402099609375, -16.615808486938477, -15.797595977783203, -14.979382514953613, -14.16117000579834, -13.342957496643066, -12.524744033813477, -11.70653247833252, -10.888319969177246, -10.070107460021973, -9.251893997192383, -8.43368148803711, -7.615468978881836, -6.7972564697265625, -5.979043483734131, -5.160830974578857, -4.342618465423584, -3.5244054794311523, -2.706192970275879, -1.8879802227020264, -1.0697674751281738, -0.2515549659729004, 0.5666580200195312, 1.3848705291748047, 2.2030832767486572, 3.0212960243225098, 3.839508533477783, 4.657721519470215, 5.475934028625488, 6.294146537780762, 7.112359523773193, 7.930572032928467, 8.748785018920898, 9.566997528076172, 10.385210037231445, 11.203422546386719, 12.021635055541992, 12.839847564697266, 13.658061027526855, 14.476273536682129, 15.294486045837402, 16.112699508666992, 16.930912017822266, 17.74912452697754, 18.567337036132812, 19.385549545288086, 20.20376205444336, 21.021974563598633, 21.840187072753906, 22.65839958190918, 23.476612091064453, 24.294824600219727, 25.113037109375, 25.931251525878906, 26.74946403503418, 27.567676544189453]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 5.0, 9.0, 12.0, 18.0, 12.0, 22.0, 14.0, 29.0, 19.0, 18.0, 33.0, 27.0, 25.0, 28.0, 28.0, 34.0, 33.0, 52.0, 42.0, 43.0, 38.0, 40.0, 44.0, 43.0, 32.0, 32.0, 27.0, 24.0, 32.0, 19.0, 21.0, 17.0, 8.0, 13.0, 18.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-3.341796875, -3.23211669921875, -3.1224365234375, -3.01275634765625, -2.903076171875, -2.79339599609375, -2.6837158203125, -2.57403564453125, -2.46435546875, -2.35467529296875, -2.2449951171875, -2.13531494140625, -2.025634765625, -1.91595458984375, -1.8062744140625, -1.69659423828125, -1.5869140625, -1.47723388671875, -1.3675537109375, -1.25787353515625, -1.148193359375, -1.03851318359375, -0.9288330078125, -0.81915283203125, -0.70947265625, -0.59979248046875, -0.4901123046875, -0.38043212890625, -0.270751953125, -0.16107177734375, -0.0513916015625, 0.05828857421875, 0.16796875, 0.27764892578125, 0.3873291015625, 0.49700927734375, 0.606689453125, 0.71636962890625, 0.8260498046875, 0.93572998046875, 1.04541015625, 1.15509033203125, 1.2647705078125, 1.37445068359375, 1.484130859375, 1.59381103515625, 1.7034912109375, 1.81317138671875, 1.9228515625, 2.03253173828125, 2.1422119140625, 2.25189208984375, 2.361572265625, 2.47125244140625, 2.5809326171875, 2.69061279296875, 2.80029296875, 2.90997314453125, 3.0196533203125, 3.12933349609375, 3.239013671875, 3.34869384765625, 3.4583740234375, 3.56805419921875, 3.677734375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 7.0, 13.0, 15.0, 16.0, 17.0, 25.0, 22.0, 32.0, 41.0, 35.0, 54.0, 55.0, 90.0, 167.0, 326.0, 948.0, 4247.0, 34799.0, 3086677.0, 1042467.0, 19597.0, 3026.0, 742.0, 278.0, 141.0, 85.0, 54.0, 34.0, 50.0, 30.0, 24.0, 20.0, 25.0, 18.0, 10.0, 12.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 2.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.635498046875, -20.91162109375, -20.187744140625, -19.4638671875, -18.739990234375, -18.01611328125, -17.292236328125, -16.568359375, -15.844482421875, -15.12060546875, -14.396728515625, -13.6728515625, -12.948974609375, -12.22509765625, -11.501220703125, -10.77734375, -10.053466796875, -9.32958984375, -8.605712890625, -7.8818359375, -7.157958984375, -6.43408203125, -5.710205078125, -4.986328125, -4.262451171875, -3.53857421875, -2.814697265625, -2.0908203125, -1.366943359375, -0.64306640625, 0.080810546875, 0.8046875, 1.528564453125, 2.25244140625, 2.976318359375, 3.7001953125, 4.424072265625, 5.14794921875, 5.871826171875, 6.595703125, 7.319580078125, 8.04345703125, 8.767333984375, 9.4912109375, 10.215087890625, 10.93896484375, 11.662841796875, 12.38671875, 13.110595703125, 13.83447265625, 14.558349609375, 15.2822265625, 16.006103515625, 16.72998046875, 17.453857421875, 18.177734375, 18.901611328125, 19.62548828125, 20.349365234375, 21.0732421875, 21.797119140625, 22.52099609375, 23.244873046875, 23.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 12.0, 8.0, 19.0, 18.0, 26.0, 31.0, 29.0, 58.0, 66.0, 88.0, 124.0, 202.0, 262.0, 442.0, 581.0, 607.0, 467.0, 271.0, 209.0, 130.0, 100.0, 74.0, 42.0, 48.0, 24.0, 27.0, 18.0, 9.0, 22.0, 10.0, 9.0, 8.0, 4.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.2452392578125, -4.052978515625, -3.8607177734375, -3.66845703125, -3.4761962890625, -3.283935546875, -3.0916748046875, -2.8994140625, -2.7071533203125, -2.514892578125, -2.3226318359375, -2.13037109375, -1.9381103515625, -1.745849609375, -1.5535888671875, -1.361328125, -1.1690673828125, -0.976806640625, -0.7845458984375, -0.59228515625, -0.4000244140625, -0.207763671875, -0.0155029296875, 0.1767578125, 0.3690185546875, 0.561279296875, 0.7535400390625, 0.94580078125, 1.1380615234375, 1.330322265625, 1.5225830078125, 1.71484375, 1.9071044921875, 2.099365234375, 2.2916259765625, 2.48388671875, 2.6761474609375, 2.868408203125, 3.0606689453125, 3.2529296875, 3.4451904296875, 3.637451171875, 3.8297119140625, 4.02197265625, 4.2142333984375, 4.406494140625, 4.5987548828125, 4.791015625, 4.9832763671875, 5.175537109375, 5.3677978515625, 5.56005859375, 5.7523193359375, 5.944580078125, 6.1368408203125, 6.3291015625, 6.5213623046875, 6.713623046875, 6.9058837890625, 7.09814453125, 7.2904052734375, 7.482666015625, 7.6749267578125, 7.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 4.0, 12.0, 13.0, 10.0, 16.0, 26.0, 24.0, 31.0, 37.0, 86.0, 120.0, 223.0, 715.0, 4107.0, 48352.0, 2920003.0, 1185259.0, 30887.0, 3116.0, 617.0, 238.0, 119.0, 58.0, 42.0, 34.0, 20.0, 16.0, 12.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.517333984375, -19.83154296875, -19.145751953125, -18.4599609375, -17.774169921875, -17.08837890625, -16.402587890625, -15.716796875, -15.031005859375, -14.34521484375, -13.659423828125, -12.9736328125, -12.287841796875, -11.60205078125, -10.916259765625, -10.23046875, -9.544677734375, -8.85888671875, -8.173095703125, -7.4873046875, -6.801513671875, -6.11572265625, -5.429931640625, -4.744140625, -4.058349609375, -3.37255859375, -2.686767578125, -2.0009765625, -1.315185546875, -0.62939453125, 0.056396484375, 0.7421875, 1.427978515625, 2.11376953125, 2.799560546875, 3.4853515625, 4.171142578125, 4.85693359375, 5.542724609375, 6.228515625, 6.914306640625, 7.60009765625, 8.285888671875, 8.9716796875, 9.657470703125, 10.34326171875, 11.029052734375, 11.71484375, 12.400634765625, 13.08642578125, 13.772216796875, 14.4580078125, 15.143798828125, 15.82958984375, 16.515380859375, 17.201171875, 17.886962890625, 18.57275390625, 19.258544921875, 19.9443359375, 20.630126953125, 21.31591796875, 22.001708984375, 22.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 17.0, 39.0, 81.0, 181.0, 249.0, 234.0, 123.0, 50.0, 24.0, 12.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.815486907958984, -53.194007873535156, -51.572532653808594, -49.951053619384766, -48.32957458496094, -46.708099365234375, -45.08662033081055, -43.46514129638672, -41.843666076660156, -40.22218704223633, -38.600711822509766, -36.97923278808594, -35.35775375366211, -33.73627471923828, -32.11479949951172, -30.49332046508789, -28.871841430664062, -27.250364303588867, -25.62888526916504, -24.007408142089844, -22.385929107666016, -20.76445198059082, -19.142974853515625, -17.521495819091797, -15.900018692016602, -14.27854061126709, -12.657062530517578, -11.035585403442383, -9.414107322692871, -7.792629241943359, -6.171152114868164, -4.549674034118652, -2.928192138671875, -1.3067142963409424, 0.31476354598999023, 1.9362411499023438, 3.5577192306518555, 5.179197311401367, 6.8006744384765625, 8.422152519226074, 10.043630599975586, 11.665108680725098, 13.28658676147461, 14.908063888549805, 16.529541015625, 18.151020050048828, 19.772497177124023, 21.39397430419922, 23.015453338623047, 24.636930465698242, 26.25840950012207, 27.879886627197266, 29.501365661621094, 31.12284278869629, 32.744319915771484, 34.36579895019531, 35.987274169921875, 37.6087532043457, 39.230228424072266, 40.851707458496094, 42.47318649291992, 44.09466552734375, 45.71614074707031, 47.33761978149414, 48.95909881591797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 8.0, 5.0, 5.0, 7.0, 10.0, 8.0, 15.0, 19.0, 12.0, 15.0, 18.0, 15.0, 18.0, 22.0, 31.0, 28.0, 24.0, 31.0, 27.0, 33.0, 43.0, 25.0, 23.0, 30.0, 47.0, 39.0, 26.0, 47.0, 33.0, 17.0, 44.0, 28.0, 34.0, 31.0, 17.0, 15.0, 20.0, 13.0, 15.0, 19.0, 7.0, 9.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.015356063842773, -16.481029510498047, -15.94670295715332, -15.412375450134277, -14.87804889678955, -14.343722343444824, -13.809394836425781, -13.275068283081055, -12.740741729736328, -12.206415176391602, -11.672088623046875, -11.137761116027832, -10.603434562683105, -10.069108009338379, -9.534780502319336, -9.00045394897461, -8.466127395629883, -7.931800842285156, -7.3974738121032715, -6.863146781921387, -6.32882022857666, -5.794493675231934, -5.260166645050049, -4.725839614868164, -4.1915130615234375, -3.657186269760132, -3.122859477996826, -2.5885326862335205, -2.054205894470215, -1.5198791027069092, -0.9855523109436035, -0.45122551918029785, 0.08310317993164062, 0.6174299716949463, 1.151756763458252, 1.6860835552215576, 2.2204103469848633, 2.754737138748169, 3.2890639305114746, 3.8233907222747803, 4.357717514038086, 4.8920440673828125, 5.426371097564697, 5.960698127746582, 6.495024681091309, 7.029351234436035, 7.56367826461792, 8.098005294799805, 8.632331848144531, 9.166658401489258, 9.700984954833984, 10.235312461853027, 10.769639015197754, 11.30396556854248, 11.838293075561523, 12.37261962890625, 12.906946182250977, 13.441272735595703, 13.97559928894043, 14.509926795959473, 15.0442533493042, 15.578579902648926, 16.11290740966797, 16.647233963012695, 17.181560516357422]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 10.0, 17.0, 13.0, 22.0, 15.0, 17.0, 19.0, 25.0, 27.0, 23.0, 30.0, 40.0, 34.0, 38.0, 40.0, 39.0, 52.0, 42.0, 51.0, 36.0, 35.0, 39.0, 30.0, 31.0, 37.0, 26.0, 27.0, 23.0, 22.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.326690673828125, -3.21002197265625, -3.093353271484375, -2.9766845703125, -2.860015869140625, -2.74334716796875, -2.626678466796875, -2.510009765625, -2.393341064453125, -2.27667236328125, -2.160003662109375, -2.0433349609375, -1.926666259765625, -1.80999755859375, -1.693328857421875, -1.57666015625, -1.459991455078125, -1.34332275390625, -1.226654052734375, -1.1099853515625, -0.993316650390625, -0.87664794921875, -0.759979248046875, -0.643310546875, -0.526641845703125, -0.40997314453125, -0.293304443359375, -0.1766357421875, -0.059967041015625, 0.05670166015625, 0.173370361328125, 0.2900390625, 0.406707763671875, 0.52337646484375, 0.640045166015625, 0.7567138671875, 0.873382568359375, 0.99005126953125, 1.106719970703125, 1.223388671875, 1.340057373046875, 1.45672607421875, 1.573394775390625, 1.6900634765625, 1.806732177734375, 1.92340087890625, 2.040069580078125, 2.15673828125, 2.273406982421875, 2.39007568359375, 2.506744384765625, 2.6234130859375, 2.740081787109375, 2.85675048828125, 2.973419189453125, 3.090087890625, 3.206756591796875, 3.32342529296875, 3.440093994140625, 3.5567626953125, 3.673431396484375, 3.79010009765625, 3.906768798828125, 4.0234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 12.0, 22.0, 24.0, 46.0, 66.0, 92.0, 125.0, 225.0, 312.0, 451.0, 798.0, 1211.0, 2059.0, 3612.0, 6373.0, 12117.0, 23867.0, 48701.0, 105548.0, 228162.0, 297256.0, 167144.0, 75469.0, 35508.0, 17512.0, 9451.0, 4994.0, 2934.0, 1648.0, 990.0, 647.0, 401.0, 233.0, 199.0, 102.0, 75.0, 47.0, 41.0, 29.0, 10.0, 12.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62841796875, -0.6089553833007812, -0.5894927978515625, -0.5700302124023438, -0.550567626953125, -0.5311050415039062, -0.5116424560546875, -0.49217987060546875, -0.47271728515625, -0.45325469970703125, -0.4337921142578125, -0.41432952880859375, -0.394866943359375, -0.37540435791015625, -0.3559417724609375, -0.33647918701171875, -0.3170166015625, -0.29755401611328125, -0.2780914306640625, -0.25862884521484375, -0.239166259765625, -0.21970367431640625, -0.2002410888671875, -0.18077850341796875, -0.16131591796875, -0.14185333251953125, -0.1223907470703125, -0.10292816162109375, -0.083465576171875, -0.06400299072265625, -0.0445404052734375, -0.02507781982421875, -0.005615234375, 0.01384735107421875, 0.0333099365234375, 0.05277252197265625, 0.072235107421875, 0.09169769287109375, 0.1111602783203125, 0.13062286376953125, 0.15008544921875, 0.16954803466796875, 0.1890106201171875, 0.20847320556640625, 0.227935791015625, 0.24739837646484375, 0.2668609619140625, 0.28632354736328125, 0.3057861328125, 0.32524871826171875, 0.3447113037109375, 0.36417388916015625, 0.383636474609375, 0.40309906005859375, 0.4225616455078125, 0.44202423095703125, 0.46148681640625, 0.48094940185546875, 0.5004119873046875, 0.5198745727539062, 0.539337158203125, 0.5587997436523438, 0.5782623291015625, 0.5977249145507812, 0.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 9.0, 5.0, 9.0, 8.0, 14.0, 12.0, 18.0, 17.0, 18.0, 26.0, 30.0, 26.0, 28.0, 35.0, 26.0, 30.0, 45.0, 40.0, 35.0, 43.0, 1068.0, 37.0, 40.0, 44.0, 22.0, 33.0, 34.0, 26.0, 30.0, 31.0, 25.0, 20.0, 21.0, 20.0, 16.0, 14.0, 13.0, 7.0, 9.0, 7.0, 5.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.349609375, -2.27178955078125, -2.1939697265625, -2.11614990234375, -2.038330078125, -1.96051025390625, -1.8826904296875, -1.80487060546875, -1.72705078125, -1.64923095703125, -1.5714111328125, -1.49359130859375, -1.415771484375, -1.33795166015625, -1.2601318359375, -1.18231201171875, -1.1044921875, -1.02667236328125, -0.9488525390625, -0.87103271484375, -0.793212890625, -0.71539306640625, -0.6375732421875, -0.55975341796875, -0.48193359375, -0.40411376953125, -0.3262939453125, -0.24847412109375, -0.170654296875, -0.09283447265625, -0.0150146484375, 0.06280517578125, 0.140625, 0.21844482421875, 0.2962646484375, 0.37408447265625, 0.451904296875, 0.52972412109375, 0.6075439453125, 0.68536376953125, 0.76318359375, 0.84100341796875, 0.9188232421875, 0.99664306640625, 1.074462890625, 1.15228271484375, 1.2301025390625, 1.30792236328125, 1.3857421875, 1.46356201171875, 1.5413818359375, 1.61920166015625, 1.697021484375, 1.77484130859375, 1.8526611328125, 1.93048095703125, 2.00830078125, 2.08612060546875, 2.1639404296875, 2.24176025390625, 2.319580078125, 2.39739990234375, 2.4752197265625, 2.55303955078125, 2.630859375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 14.0, 10.0, 22.0, 52.0, 68.0, 94.0, 150.0, 263.0, 460.0, 875.0, 1841.0, 4058.0, 10031.0, 27741.0, 88276.0, 369074.0, 1330679.0, 182731.0, 51305.0, 17344.0, 6428.0, 2728.0, 1279.0, 659.0, 347.0, 220.0, 115.0, 78.0, 42.0, 28.0, 21.0, 25.0, 15.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.646484375, -0.62762451171875, -0.6087646484375, -0.58990478515625, -0.571044921875, -0.55218505859375, -0.5333251953125, -0.51446533203125, -0.49560546875, -0.47674560546875, -0.4578857421875, -0.43902587890625, -0.420166015625, -0.40130615234375, -0.3824462890625, -0.36358642578125, -0.3447265625, -0.32586669921875, -0.3070068359375, -0.28814697265625, -0.269287109375, -0.25042724609375, -0.2315673828125, -0.21270751953125, -0.19384765625, -0.17498779296875, -0.1561279296875, -0.13726806640625, -0.118408203125, -0.09954833984375, -0.0806884765625, -0.06182861328125, -0.04296875, -0.02410888671875, -0.0052490234375, 0.01361083984375, 0.032470703125, 0.05133056640625, 0.0701904296875, 0.08905029296875, 0.10791015625, 0.12677001953125, 0.1456298828125, 0.16448974609375, 0.183349609375, 0.20220947265625, 0.2210693359375, 0.23992919921875, 0.2587890625, 0.27764892578125, 0.2965087890625, 0.31536865234375, 0.334228515625, 0.35308837890625, 0.3719482421875, 0.39080810546875, 0.40966796875, 0.42852783203125, 0.4473876953125, 0.46624755859375, 0.485107421875, 0.50396728515625, 0.5228271484375, 0.54168701171875, 0.560546875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 13.0, 18.0, 21.0, 27.0, 29.0, 48.0, 72.0, 131.0, 155.0, 140.0, 87.0, 67.0, 33.0, 22.0, 25.0, 14.0, 14.0, 8.0, 15.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10052490234375, -0.09778881072998047, -0.09505271911621094, -0.0923166275024414, -0.08958053588867188, -0.08684444427490234, -0.08410835266113281, -0.08137226104736328, -0.07863616943359375, -0.07590007781982422, -0.07316398620605469, -0.07042789459228516, -0.06769180297851562, -0.0649557113647461, -0.06221961975097656, -0.05948352813720703, -0.0567474365234375, -0.05401134490966797, -0.05127525329589844, -0.048539161682128906, -0.045803070068359375, -0.043066978454589844, -0.04033088684082031, -0.03759479522705078, -0.03485870361328125, -0.03212261199951172, -0.029386520385742188, -0.026650428771972656, -0.023914337158203125, -0.021178245544433594, -0.018442153930664062, -0.01570606231689453, -0.012969970703125, -0.010233879089355469, -0.0074977874755859375, -0.004761695861816406, -0.002025604248046875, 0.0007104873657226562, 0.0034465789794921875, 0.006182670593261719, 0.00891876220703125, 0.011654853820800781, 0.014390945434570312, 0.017127037048339844, 0.019863128662109375, 0.022599220275878906, 0.025335311889648438, 0.02807140350341797, 0.0308074951171875, 0.03354358673095703, 0.03627967834472656, 0.039015769958496094, 0.041751861572265625, 0.044487953186035156, 0.04722404479980469, 0.04996013641357422, 0.05269622802734375, 0.05543231964111328, 0.05816841125488281, 0.060904502868652344, 0.06364059448242188, 0.0663766860961914, 0.06911277770996094, 0.07184886932373047, 0.0745849609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 4.0, 5.0, 8.0, 6.0, 15.0, 16.0, 31.0, 38.0, 68.0, 108.0, 196.0, 487.0, 10561.0, 1032639.0, 3488.0, 399.0, 183.0, 87.0, 65.0, 39.0, 29.0, 21.0, 14.0, 3.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6268157958984375, -1.565155029296875, -1.5034942626953125, -1.44183349609375, -1.3801727294921875, -1.318511962890625, -1.2568511962890625, -1.1951904296875, -1.1335296630859375, -1.071868896484375, -1.0102081298828125, -0.94854736328125, -0.8868865966796875, -0.825225830078125, -0.7635650634765625, -0.701904296875, -0.6402435302734375, -0.578582763671875, -0.5169219970703125, -0.45526123046875, -0.3936004638671875, -0.331939697265625, -0.2702789306640625, -0.2086181640625, -0.1469573974609375, -0.085296630859375, -0.0236358642578125, 0.03802490234375, 0.0996856689453125, 0.161346435546875, 0.2230072021484375, 0.28466796875, 0.3463287353515625, 0.407989501953125, 0.4696502685546875, 0.53131103515625, 0.5929718017578125, 0.654632568359375, 0.7162933349609375, 0.7779541015625, 0.8396148681640625, 0.901275634765625, 0.9629364013671875, 1.02459716796875, 1.0862579345703125, 1.147918701171875, 1.2095794677734375, 1.271240234375, 1.3329010009765625, 1.394561767578125, 1.4562225341796875, 1.51788330078125, 1.5795440673828125, 1.641204833984375, 1.7028656005859375, 1.7645263671875, 1.8261871337890625, 1.887847900390625, 1.9495086669921875, 2.01116943359375, 2.0728302001953125, 2.134490966796875, 2.1961517333984375, 2.2578125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 18.0, 50.0, 127.0, 292.0, 307.0, 139.0, 39.0, 20.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19680680334568024, -0.18978610634803772, -0.1827654093503952, -0.17574471235275269, -0.16872401535511017, -0.16170331835746765, -0.15468262135982513, -0.14766192436218262, -0.1406412273645401, -0.13362053036689758, -0.12659983336925507, -0.11957913637161255, -0.11255843937397003, -0.10553774237632751, -0.098517045378685, -0.09149634838104248, -0.08447565138339996, -0.07745495438575745, -0.07043425738811493, -0.06341356039047241, -0.056392863392829895, -0.04937216639518738, -0.04235146939754486, -0.035330772399902344, -0.028310075402259827, -0.02128937840461731, -0.014268681406974792, -0.007247984409332275, -0.0002272874116897583, 0.006793409585952759, 0.013814106583595276, 0.020834803581237793, 0.027855515480041504, 0.03487621247768402, 0.04189690947532654, 0.048917606472969055, 0.05593830347061157, 0.06295900046825409, 0.0699796974658966, 0.07700039446353912, 0.08402109146118164, 0.09104178845882416, 0.09806248545646667, 0.10508318245410919, 0.11210387945175171, 0.11912457644939423, 0.12614527344703674, 0.13316597044467926, 0.14018666744232178, 0.1472073644399643, 0.1542280614376068, 0.16124875843524933, 0.16826945543289185, 0.17529015243053436, 0.18231084942817688, 0.1893315464258194, 0.19635224342346191, 0.20337294042110443, 0.21039363741874695, 0.21741433441638947, 0.22443503141403198, 0.2314557284116745, 0.23847642540931702, 0.24549712240695953, 0.25251781940460205]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 8.0, 4.0, 14.0, 13.0, 15.0, 19.0, 17.0, 22.0, 27.0, 35.0, 19.0, 16.0, 34.0, 28.0, 39.0, 36.0, 49.0, 29.0, 40.0, 42.0, 43.0, 32.0, 36.0, 32.0, 35.0, 25.0, 30.0, 34.0, 36.0, 38.0, 21.0, 20.0, 9.0, 16.0, 6.0, 17.0, 8.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.05887115001678467, -0.05697086825966835, -0.05507058650255203, -0.053170304745435715, -0.0512700229883194, -0.04936974123120308, -0.04746945947408676, -0.045569177716970444, -0.043668895959854126, -0.04176861420273781, -0.03986833244562149, -0.03796805068850517, -0.036067768931388855, -0.03416748717427254, -0.03226720541715622, -0.0303669236600399, -0.028466641902923584, -0.026566360145807266, -0.02466607838869095, -0.02276579663157463, -0.020865514874458313, -0.018965233117341995, -0.017064951360225677, -0.01516466960310936, -0.013264387845993042, -0.011364106088876724, -0.009463824331760406, -0.007563542574644089, -0.005663260817527771, -0.0037629790604114532, -0.0018626973032951355, 3.758445382118225e-05, 0.0019378662109375, 0.0038381479680538177, 0.0057384297251701355, 0.007638711482286453, 0.009538993239402771, 0.011439274996519089, 0.013339556753635406, 0.015239838510751724, 0.017140120267868042, 0.01904040202498436, 0.020940683782100677, 0.022840965539216995, 0.024741247296333313, 0.02664152905344963, 0.02854181081056595, 0.030442092567682266, 0.032342374324798584, 0.0342426560819149, 0.03614293783903122, 0.03804321959614754, 0.039943501353263855, 0.04184378311038017, 0.04374406486749649, 0.04564434662461281, 0.047544628381729126, 0.049444910138845444, 0.05134519189596176, 0.05324547365307808, 0.0551457554101944, 0.057046037167310715, 0.05894631892442703, 0.06084660068154335, 0.06274688243865967]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 10.0, 10.0, 13.0, 13.0, 15.0, 12.0, 19.0, 28.0, 27.0, 29.0, 25.0, 28.0, 36.0, 40.0, 31.0, 38.0, 53.0, 33.0, 41.0, 36.0, 46.0, 35.0, 40.0, 50.0, 26.0, 28.0, 32.0, 24.0, 21.0, 16.0, 10.0, 17.0, 10.0, 15.0, 9.0, 13.0, 10.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.46484375, -3.351806640625, -3.23876953125, -3.125732421875, -3.0126953125, -2.899658203125, -2.78662109375, -2.673583984375, -2.560546875, -2.447509765625, -2.33447265625, -2.221435546875, -2.1083984375, -1.995361328125, -1.88232421875, -1.769287109375, -1.65625, -1.543212890625, -1.43017578125, -1.317138671875, -1.2041015625, -1.091064453125, -0.97802734375, -0.864990234375, -0.751953125, -0.638916015625, -0.52587890625, -0.412841796875, -0.2998046875, -0.186767578125, -0.07373046875, 0.039306640625, 0.15234375, 0.265380859375, 0.37841796875, 0.491455078125, 0.6044921875, 0.717529296875, 0.83056640625, 0.943603515625, 1.056640625, 1.169677734375, 1.28271484375, 1.395751953125, 1.5087890625, 1.621826171875, 1.73486328125, 1.847900390625, 1.9609375, 2.073974609375, 2.18701171875, 2.300048828125, 2.4130859375, 2.526123046875, 2.63916015625, 2.752197265625, 2.865234375, 2.978271484375, 3.09130859375, 3.204345703125, 3.3173828125, 3.430419921875, 3.54345703125, 3.656494140625, 3.76953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 13.0, 7.0, 22.0, 33.0, 34.0, 46.0, 75.0, 95.0, 143.0, 218.0, 318.0, 459.0, 633.0, 1098.0, 1560.0, 2568.0, 4209.0, 7114.0, 12260.0, 21829.0, 41952.0, 86594.0, 197439.0, 337472.0, 170293.0, 76044.0, 37525.0, 19880.0, 11169.0, 6599.0, 3872.0, 2507.0, 1562.0, 941.0, 663.0, 437.0, 277.0, 200.0, 123.0, 67.0, 71.0, 45.0, 33.0, 15.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.70550537109375, -4.5399169921875, -4.37432861328125, -4.208740234375, -4.04315185546875, -3.8775634765625, -3.71197509765625, -3.54638671875, -3.38079833984375, -3.2152099609375, -3.04962158203125, -2.884033203125, -2.71844482421875, -2.5528564453125, -2.38726806640625, -2.2216796875, -2.05609130859375, -1.8905029296875, -1.72491455078125, -1.559326171875, -1.39373779296875, -1.2281494140625, -1.06256103515625, -0.89697265625, -0.73138427734375, -0.5657958984375, -0.40020751953125, -0.234619140625, -0.06903076171875, 0.0965576171875, 0.26214599609375, 0.427734375, 0.59332275390625, 0.7589111328125, 0.92449951171875, 1.090087890625, 1.25567626953125, 1.4212646484375, 1.58685302734375, 1.75244140625, 1.91802978515625, 2.0836181640625, 2.24920654296875, 2.414794921875, 2.58038330078125, 2.7459716796875, 2.91156005859375, 3.0771484375, 3.24273681640625, 3.4083251953125, 3.57391357421875, 3.739501953125, 3.90509033203125, 4.0706787109375, 4.23626708984375, 4.40185546875, 4.56744384765625, 4.7330322265625, 4.89862060546875, 5.064208984375, 5.22979736328125, 5.3953857421875, 5.56097412109375, 5.7265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 1.0, 6.0, 6.0, 7.0, 16.0, 16.0, 17.0, 21.0, 16.0, 27.0, 31.0, 31.0, 45.0, 31.0, 70.0, 82.0, 113.0, 182.0, 1390.0, 291.0, 133.0, 87.0, 66.0, 41.0, 40.0, 39.0, 29.0, 28.0, 31.0, 22.0, 21.0, 17.0, 15.0, 13.0, 19.0, 11.0, 5.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.03125, -9.70556640625, -9.3798828125, -9.05419921875, -8.728515625, -8.40283203125, -8.0771484375, -7.75146484375, -7.42578125, -7.10009765625, -6.7744140625, -6.44873046875, -6.123046875, -5.79736328125, -5.4716796875, -5.14599609375, -4.8203125, -4.49462890625, -4.1689453125, -3.84326171875, -3.517578125, -3.19189453125, -2.8662109375, -2.54052734375, -2.21484375, -1.88916015625, -1.5634765625, -1.23779296875, -0.912109375, -0.58642578125, -0.2607421875, 0.06494140625, 0.390625, 0.71630859375, 1.0419921875, 1.36767578125, 1.693359375, 2.01904296875, 2.3447265625, 2.67041015625, 2.99609375, 3.32177734375, 3.6474609375, 3.97314453125, 4.298828125, 4.62451171875, 4.9501953125, 5.27587890625, 5.6015625, 5.92724609375, 6.2529296875, 6.57861328125, 6.904296875, 7.22998046875, 7.5556640625, 7.88134765625, 8.20703125, 8.53271484375, 8.8583984375, 9.18408203125, 9.509765625, 9.83544921875, 10.1611328125, 10.48681640625, 10.8125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 12.0, 9.0, 13.0, 13.0, 20.0, 22.0, 38.0, 49.0, 81.0, 91.0, 161.0, 260.0, 500.0, 1167.0, 3992.0, 20739.0, 246759.0, 2732080.0, 120657.0, 13908.0, 3068.0, 959.0, 449.0, 224.0, 144.0, 80.0, 67.0, 36.0, 26.0, 23.0, 16.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.50537109375, -15.9794921875, -15.45361328125, -14.927734375, -14.40185546875, -13.8759765625, -13.35009765625, -12.82421875, -12.29833984375, -11.7724609375, -11.24658203125, -10.720703125, -10.19482421875, -9.6689453125, -9.14306640625, -8.6171875, -8.09130859375, -7.5654296875, -7.03955078125, -6.513671875, -5.98779296875, -5.4619140625, -4.93603515625, -4.41015625, -3.88427734375, -3.3583984375, -2.83251953125, -2.306640625, -1.78076171875, -1.2548828125, -0.72900390625, -0.203125, 0.32275390625, 0.8486328125, 1.37451171875, 1.900390625, 2.42626953125, 2.9521484375, 3.47802734375, 4.00390625, 4.52978515625, 5.0556640625, 5.58154296875, 6.107421875, 6.63330078125, 7.1591796875, 7.68505859375, 8.2109375, 8.73681640625, 9.2626953125, 9.78857421875, 10.314453125, 10.84033203125, 11.3662109375, 11.89208984375, 12.41796875, 12.94384765625, 13.4697265625, 13.99560546875, 14.521484375, 15.04736328125, 15.5732421875, 16.09912109375, 16.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 24.0, 99.0, 332.0, 364.0, 153.0, 32.0, 12.0], "bins": [-138.59930419921875, -136.29335021972656, -133.98741149902344, -131.68145751953125, -129.37551879882812, -127.06956481933594, -124.76361846923828, -122.45767211914062, -120.15171813964844, -117.84577178955078, -115.53982543945312, -113.23387145996094, -110.92792510986328, -108.62197875976562, -106.31603240966797, -104.01008605957031, -101.70413970947266, -99.398193359375, -97.09224700927734, -94.78629302978516, -92.4803466796875, -90.17440032958984, -87.86845397949219, -85.56250762939453, -83.25656127929688, -80.95061492919922, -78.64466857910156, -76.33871459960938, -74.03276824951172, -71.72682189941406, -69.4208755493164, -67.11492919921875, -64.8089828491211, -62.50303649902344, -60.197086334228516, -57.89113998413086, -55.58518981933594, -53.27924346923828, -50.973297119140625, -48.66735076904297, -46.36140060424805, -44.05545425415039, -41.74950408935547, -39.44355773925781, -37.137611389160156, -34.831661224365234, -32.52571487426758, -30.21976661682129, -27.913818359375, -25.60787010192871, -23.301921844482422, -20.995975494384766, -18.690027236938477, -16.384078979492188, -14.078131675720215, -11.772184371948242, -9.466236114501953, -7.160288333892822, -4.854340553283691, -2.5483927726745605, -0.2424449920654297, 2.0635032653808594, 4.369450569152832, 6.675397872924805, 8.981346130371094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 9.0, 10.0, 10.0, 14.0, 13.0, 15.0, 23.0, 27.0, 34.0, 34.0, 28.0, 29.0, 21.0, 26.0, 31.0, 49.0, 59.0, 51.0, 41.0, 41.0, 50.0, 44.0, 23.0, 23.0, 41.0, 30.0, 30.0, 32.0, 16.0, 22.0, 11.0, 17.0, 9.0, 9.0, 14.0, 17.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.878116607666016, -23.134761810302734, -22.39140510559082, -21.64805030822754, -20.904693603515625, -20.161338806152344, -19.417984008789062, -18.67462921142578, -17.931272506713867, -17.187917709350586, -16.444561004638672, -15.70120620727539, -14.957850456237793, -14.214494705200195, -13.471139907836914, -12.727784156799316, -11.984428405761719, -11.241072654724121, -10.497716903686523, -9.754362106323242, -9.011006355285645, -8.267650604248047, -7.524295330047607, -6.780940055847168, -6.03758430480957, -5.294228553771973, -4.550873279571533, -3.8075177669525146, -3.064162254333496, -2.3208067417144775, -1.577451229095459, -0.8340959548950195, -0.09074020385742188, 0.6526153087615967, 1.3959708213806152, 2.139326333999634, 2.8826818466186523, 3.626037359237671, 4.3693928718566895, 5.112748146057129, 5.856103897094727, 6.599459648132324, 7.342814922332764, 8.086170196533203, 8.8295259475708, 9.572881698608398, 10.31623649597168, 11.059592247009277, 11.802947998046875, 12.546303749084473, 13.28965950012207, 14.033014297485352, 14.77637004852295, 15.519725799560547, 16.263080596923828, 17.00643539428711, 17.749792098999023, 18.493146896362305, 19.23650360107422, 19.9798583984375, 20.72321319580078, 21.466569900512695, 22.209924697875977, 22.95328140258789, 23.696636199951172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 3.0, 2.0, 8.0, 9.0, 12.0, 10.0, 11.0, 16.0, 18.0, 12.0, 19.0, 26.0, 34.0, 23.0, 27.0, 49.0, 38.0, 40.0, 37.0, 43.0, 45.0, 36.0, 40.0, 40.0, 38.0, 37.0, 32.0, 24.0, 34.0, 31.0, 25.0, 23.0, 24.0, 11.0, 14.0, 16.0, 19.0, 9.0, 9.0, 4.0, 8.0, 8.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.46484375, -3.351715087890625, -3.23858642578125, -3.125457763671875, -3.0123291015625, -2.899200439453125, -2.78607177734375, -2.672943115234375, -2.559814453125, -2.446685791015625, -2.33355712890625, -2.220428466796875, -2.1072998046875, -1.994171142578125, -1.88104248046875, -1.767913818359375, -1.65478515625, -1.541656494140625, -1.42852783203125, -1.315399169921875, -1.2022705078125, -1.089141845703125, -0.97601318359375, -0.862884521484375, -0.749755859375, -0.636627197265625, -0.52349853515625, -0.410369873046875, -0.2972412109375, -0.184112548828125, -0.07098388671875, 0.042144775390625, 0.1552734375, 0.268402099609375, 0.38153076171875, 0.494659423828125, 0.6077880859375, 0.720916748046875, 0.83404541015625, 0.947174072265625, 1.060302734375, 1.173431396484375, 1.28656005859375, 1.399688720703125, 1.5128173828125, 1.625946044921875, 1.73907470703125, 1.852203369140625, 1.96533203125, 2.078460693359375, 2.19158935546875, 2.304718017578125, 2.4178466796875, 2.530975341796875, 2.64410400390625, 2.757232666015625, 2.870361328125, 2.983489990234375, 3.09661865234375, 3.209747314453125, 3.3228759765625, 3.436004638671875, 3.54913330078125, 3.662261962890625, 3.775390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 7.0, 4.0, 5.0, 11.0, 7.0, 27.0, 32.0, 32.0, 32.0, 44.0, 71.0, 91.0, 130.0, 150.0, 233.0, 374.0, 769.0, 6690.0, 3621492.0, 558804.0, 3548.0, 612.0, 307.0, 206.0, 142.0, 106.0, 87.0, 63.0, 32.0, 30.0, 30.0, 31.0, 23.0, 7.0, 3.0, 5.0, 6.0, 8.0, 4.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.9375, -37.634765625, -36.33203125, -35.029296875, -33.7265625, -32.423828125, -31.12109375, -29.818359375, -28.515625, -27.212890625, -25.91015625, -24.607421875, -23.3046875, -22.001953125, -20.69921875, -19.396484375, -18.09375, -16.791015625, -15.48828125, -14.185546875, -12.8828125, -11.580078125, -10.27734375, -8.974609375, -7.671875, -6.369140625, -5.06640625, -3.763671875, -2.4609375, -1.158203125, 0.14453125, 1.447265625, 2.75, 4.052734375, 5.35546875, 6.658203125, 7.9609375, 9.263671875, 10.56640625, 11.869140625, 13.171875, 14.474609375, 15.77734375, 17.080078125, 18.3828125, 19.685546875, 20.98828125, 22.291015625, 23.59375, 24.896484375, 26.19921875, 27.501953125, 28.8046875, 30.107421875, 31.41015625, 32.712890625, 34.015625, 35.318359375, 36.62109375, 37.923828125, 39.2265625, 40.529296875, 41.83203125, 43.134765625, 44.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 14.0, 14.0, 26.0, 35.0, 38.0, 62.0, 81.0, 104.0, 171.0, 287.0, 493.0, 719.0, 724.0, 453.0, 263.0, 162.0, 91.0, 68.0, 56.0, 32.0, 45.0, 27.0, 23.0, 13.0, 10.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.125, -6.91534423828125, -6.7056884765625, -6.49603271484375, -6.286376953125, -6.07672119140625, -5.8670654296875, -5.65740966796875, -5.44775390625, -5.23809814453125, -5.0284423828125, -4.81878662109375, -4.609130859375, -4.39947509765625, -4.1898193359375, -3.98016357421875, -3.7705078125, -3.56085205078125, -3.3511962890625, -3.14154052734375, -2.931884765625, -2.72222900390625, -2.5125732421875, -2.30291748046875, -2.09326171875, -1.88360595703125, -1.6739501953125, -1.46429443359375, -1.254638671875, -1.04498291015625, -0.8353271484375, -0.62567138671875, -0.416015625, -0.20635986328125, 0.0032958984375, 0.21295166015625, 0.422607421875, 0.63226318359375, 0.8419189453125, 1.05157470703125, 1.26123046875, 1.47088623046875, 1.6805419921875, 1.89019775390625, 2.099853515625, 2.30950927734375, 2.5191650390625, 2.72882080078125, 2.9384765625, 3.14813232421875, 3.3577880859375, 3.56744384765625, 3.777099609375, 3.98675537109375, 4.1964111328125, 4.40606689453125, 4.61572265625, 4.82537841796875, 5.0350341796875, 5.24468994140625, 5.454345703125, 5.66400146484375, 5.8736572265625, 6.08331298828125, 6.29296875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 4.0, 6.0, 17.0, 14.0, 23.0, 20.0, 38.0, 55.0, 91.0, 131.0, 339.0, 1219.0, 13591.0, 704841.0, 3438725.0, 32247.0, 2040.0, 428.0, 169.0, 99.0, 63.0, 40.0, 19.0, 12.0, 9.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53125, -23.767822265625, -23.00439453125, -22.240966796875, -21.4775390625, -20.714111328125, -19.95068359375, -19.187255859375, -18.423828125, -17.660400390625, -16.89697265625, -16.133544921875, -15.3701171875, -14.606689453125, -13.84326171875, -13.079833984375, -12.31640625, -11.552978515625, -10.78955078125, -10.026123046875, -9.2626953125, -8.499267578125, -7.73583984375, -6.972412109375, -6.208984375, -5.445556640625, -4.68212890625, -3.918701171875, -3.1552734375, -2.391845703125, -1.62841796875, -0.864990234375, -0.1015625, 0.661865234375, 1.42529296875, 2.188720703125, 2.9521484375, 3.715576171875, 4.47900390625, 5.242431640625, 6.005859375, 6.769287109375, 7.53271484375, 8.296142578125, 9.0595703125, 9.822998046875, 10.58642578125, 11.349853515625, 12.11328125, 12.876708984375, 13.64013671875, 14.403564453125, 15.1669921875, 15.930419921875, 16.69384765625, 17.457275390625, 18.220703125, 18.984130859375, 19.74755859375, 20.510986328125, 21.2744140625, 22.037841796875, 22.80126953125, 23.564697265625, 24.328125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 19.0, 9.0, 28.0, 28.0, 44.0, 63.0, 86.0, 110.0, 109.0, 105.0, 109.0, 82.0, 76.0, 51.0, 30.0, 14.0, 11.0, 16.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.738236427307129, -9.052277565002441, -8.36631965637207, -7.680360794067383, -6.994401931762695, -6.308443546295166, -5.622485160827637, -4.936526298522949, -4.25056791305542, -3.5646092891693115, -2.878650665283203, -2.192692279815674, -1.5067336559295654, -0.820775032043457, -0.13481664657592773, 0.5511422157287598, 1.237100601196289, 1.9230592250823975, 2.609017848968506, 3.294976234436035, 3.9809348583221436, 4.666893482208252, 5.352851867675781, 6.038810729980469, 6.724769115447998, 7.410727500915527, 8.096686363220215, 8.782644271850586, 9.468603134155273, 10.154561996459961, 10.840520858764648, 11.526479721069336, 12.212438583374023, 12.898397445678711, 13.584355354309082, 14.27031421661377, 14.956273078918457, 15.642230987548828, 16.328189849853516, 17.014148712158203, 17.70010757446289, 18.386066436767578, 19.072025299072266, 19.757984161376953, 20.443941116333008, 21.129899978637695, 21.815858840942383, 22.50181770324707, 23.187774658203125, 23.873733520507812, 24.5596923828125, 25.245651245117188, 25.931608200073242, 26.61756706237793, 27.303525924682617, 27.989484786987305, 28.675443649291992, 29.36140251159668, 30.047361373901367, 30.733318328857422, 31.41927719116211, 32.1052360534668, 32.791194915771484, 33.47715377807617, 34.16311264038086]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 1.0, 4.0, 7.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 19.0, 27.0, 12.0, 22.0, 21.0, 34.0, 33.0, 36.0, 26.0, 41.0, 39.0, 32.0, 42.0, 52.0, 40.0, 42.0, 35.0, 52.0, 40.0, 38.0, 29.0, 31.0, 28.0, 20.0, 28.0, 14.0, 13.0, 20.0, 12.0, 11.0, 10.0, 9.0, 0.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.44189453125, -17.84846305847168, -17.255033493041992, -16.661602020263672, -16.06817054748535, -15.474740028381348, -14.881309509277344, -14.287878036499023, -13.694446563720703, -13.1010160446167, -12.507584571838379, -11.914154052734375, -11.320722579956055, -10.72729206085205, -10.133861541748047, -9.540430068969727, -8.946999549865723, -8.353569030761719, -7.760137557983398, -7.1667070388793945, -6.573275566101074, -5.97984504699707, -5.386414051055908, -4.792983055114746, -4.199552059173584, -3.606121063232422, -3.0126900672912598, -2.4192593097686768, -1.8258283138275146, -1.2323973178863525, -0.6389665603637695, -0.04553556442260742, 0.5478954315185547, 1.1413264274597168, 1.7347573041915894, 2.328188180923462, 2.921619176864624, 3.515050172805786, 4.108480930328369, 4.701911926269531, 5.295342922210693, 5.8887739181518555, 6.482204914093018, 7.07563591003418, 7.669066429138184, 8.262497901916504, 8.855928421020508, 9.449359893798828, 10.042790412902832, 10.636220932006836, 11.229652404785156, 11.82308292388916, 12.41651439666748, 13.009944915771484, 13.603376388549805, 14.196806907653809, 14.790237426757812, 15.383667945861816, 15.977099418640137, 16.57052993774414, 17.16396141052246, 17.75739288330078, 18.35082244873047, 18.94425392150879, 19.53768539428711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 8.0, 8.0, 14.0, 11.0, 19.0, 12.0, 12.0, 26.0, 39.0, 26.0, 35.0, 32.0, 36.0, 46.0, 37.0, 37.0, 39.0, 49.0, 46.0, 52.0, 31.0, 39.0, 49.0, 34.0, 17.0, 29.0, 22.0, 13.0, 24.0, 26.0, 24.0, 12.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.677734375, -3.562835693359375, -3.44793701171875, -3.333038330078125, -3.2181396484375, -3.103240966796875, -2.98834228515625, -2.873443603515625, -2.758544921875, -2.643646240234375, -2.52874755859375, -2.413848876953125, -2.2989501953125, -2.184051513671875, -2.06915283203125, -1.954254150390625, -1.83935546875, -1.724456787109375, -1.60955810546875, -1.494659423828125, -1.3797607421875, -1.264862060546875, -1.14996337890625, -1.035064697265625, -0.920166015625, -0.805267333984375, -0.69036865234375, -0.575469970703125, -0.4605712890625, -0.345672607421875, -0.23077392578125, -0.115875244140625, -0.0009765625, 0.113922119140625, 0.22882080078125, 0.343719482421875, 0.4586181640625, 0.573516845703125, 0.68841552734375, 0.803314208984375, 0.918212890625, 1.033111572265625, 1.14801025390625, 1.262908935546875, 1.3778076171875, 1.492706298828125, 1.60760498046875, 1.722503662109375, 1.83740234375, 1.952301025390625, 2.06719970703125, 2.182098388671875, 2.2969970703125, 2.411895751953125, 2.52679443359375, 2.641693115234375, 2.756591796875, 2.871490478515625, 2.98638916015625, 3.101287841796875, 3.2161865234375, 3.331085205078125, 3.44598388671875, 3.560882568359375, 3.67578125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 12.0, 18.0, 24.0, 41.0, 66.0, 101.0, 137.0, 196.0, 282.0, 381.0, 573.0, 779.0, 1272.0, 1838.0, 2791.0, 4243.0, 6749.0, 11006.0, 18316.0, 32160.0, 60418.0, 124574.0, 250718.0, 256991.0, 128787.0, 62636.0, 33417.0, 18827.0, 11238.0, 6883.0, 4372.0, 2860.0, 1832.0, 1287.0, 868.0, 547.0, 437.0, 257.0, 195.0, 136.0, 99.0, 67.0, 46.0, 26.0, 21.0, 13.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.966796875, -0.9375228881835938, -0.9082489013671875, -0.8789749145507812, -0.849700927734375, -0.8204269409179688, -0.7911529541015625, -0.7618789672851562, -0.73260498046875, -0.7033309936523438, -0.6740570068359375, -0.6447830200195312, -0.615509033203125, -0.5862350463867188, -0.5569610595703125, -0.5276870727539062, -0.4984130859375, -0.46913909912109375, -0.4398651123046875, -0.41059112548828125, -0.381317138671875, -0.35204315185546875, -0.3227691650390625, -0.29349517822265625, -0.26422119140625, -0.23494720458984375, -0.2056732177734375, -0.17639923095703125, -0.147125244140625, -0.11785125732421875, -0.0885772705078125, -0.05930328369140625, -0.030029296875, -0.00075531005859375, 0.0285186767578125, 0.05779266357421875, 0.087066650390625, 0.11634063720703125, 0.1456146240234375, 0.17488861083984375, 0.20416259765625, 0.23343658447265625, 0.2627105712890625, 0.29198455810546875, 0.321258544921875, 0.35053253173828125, 0.3798065185546875, 0.40908050537109375, 0.4383544921875, 0.46762847900390625, 0.4969024658203125, 0.5261764526367188, 0.555450439453125, 0.5847244262695312, 0.6139984130859375, 0.6432723999023438, 0.67254638671875, 0.7018203735351562, 0.7310943603515625, 0.7603683471679688, 0.789642333984375, 0.8189163208007812, 0.8481903076171875, 0.8774642944335938, 0.90673828125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 6.0, 8.0, 7.0, 13.0, 14.0, 13.0, 13.0, 23.0, 17.0, 28.0, 29.0, 29.0, 29.0, 38.0, 29.0, 45.0, 45.0, 33.0, 47.0, 1061.0, 34.0, 46.0, 48.0, 47.0, 39.0, 32.0, 36.0, 29.0, 30.0, 25.0, 19.0, 19.0, 14.0, 9.0, 12.0, 9.0, 11.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.88543701171875, -2.7982177734375, -2.71099853515625, -2.623779296875, -2.53656005859375, -2.4493408203125, -2.36212158203125, -2.27490234375, -2.18768310546875, -2.1004638671875, -2.01324462890625, -1.926025390625, -1.83880615234375, -1.7515869140625, -1.66436767578125, -1.5771484375, -1.48992919921875, -1.4027099609375, -1.31549072265625, -1.228271484375, -1.14105224609375, -1.0538330078125, -0.96661376953125, -0.87939453125, -0.79217529296875, -0.7049560546875, -0.61773681640625, -0.530517578125, -0.44329833984375, -0.3560791015625, -0.26885986328125, -0.181640625, -0.09442138671875, -0.0072021484375, 0.08001708984375, 0.167236328125, 0.25445556640625, 0.3416748046875, 0.42889404296875, 0.51611328125, 0.60333251953125, 0.6905517578125, 0.77777099609375, 0.864990234375, 0.95220947265625, 1.0394287109375, 1.12664794921875, 1.2138671875, 1.30108642578125, 1.3883056640625, 1.47552490234375, 1.562744140625, 1.64996337890625, 1.7371826171875, 1.82440185546875, 1.91162109375, 1.99884033203125, 2.0860595703125, 2.17327880859375, 2.260498046875, 2.34771728515625, 2.4349365234375, 2.52215576171875, 2.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 11.0, 17.0, 21.0, 39.0, 61.0, 85.0, 150.0, 269.0, 471.0, 893.0, 1734.0, 3808.0, 9192.0, 27240.0, 119766.0, 1428486.0, 417500.0, 58950.0, 16754.0, 6204.0, 2605.0, 1274.0, 654.0, 348.0, 211.0, 131.0, 89.0, 44.0, 36.0, 34.0, 12.0, 13.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4755859375, -1.4276580810546875, -1.379730224609375, -1.3318023681640625, -1.28387451171875, -1.2359466552734375, -1.188018798828125, -1.1400909423828125, -1.0921630859375, -1.0442352294921875, -0.996307373046875, -0.9483795166015625, -0.90045166015625, -0.8525238037109375, -0.804595947265625, -0.7566680908203125, -0.708740234375, -0.6608123779296875, -0.612884521484375, -0.5649566650390625, -0.51702880859375, -0.4691009521484375, -0.421173095703125, -0.3732452392578125, -0.3253173828125, -0.2773895263671875, -0.229461669921875, -0.1815338134765625, -0.13360595703125, -0.0856781005859375, -0.037750244140625, 0.0101776123046875, 0.05810546875, 0.1060333251953125, 0.153961181640625, 0.2018890380859375, 0.24981689453125, 0.2977447509765625, 0.345672607421875, 0.3936004638671875, 0.4415283203125, 0.4894561767578125, 0.537384033203125, 0.5853118896484375, 0.63323974609375, 0.6811676025390625, 0.729095458984375, 0.7770233154296875, 0.824951171875, 0.8728790283203125, 0.920806884765625, 0.9687347412109375, 1.01666259765625, 1.0645904541015625, 1.112518310546875, 1.1604461669921875, 1.2083740234375, 1.2563018798828125, 1.304229736328125, 1.3521575927734375, 1.40008544921875, 1.4480133056640625, 1.495941162109375, 1.5438690185546875, 1.591796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 8.0, 7.0, 12.0, 14.0, 21.0, 28.0, 41.0, 69.0, 131.0, 148.0, 182.0, 115.0, 76.0, 46.0, 25.0, 17.0, 14.0, 14.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3879966735839844, -0.37584686279296875, -0.3636970520019531, -0.3515472412109375, -0.3393974304199219, -0.32724761962890625, -0.3150978088378906, -0.302947998046875, -0.2907981872558594, -0.27864837646484375, -0.2664985656738281, -0.2543487548828125, -0.24219894409179688, -0.23004913330078125, -0.21789932250976562, -0.20574951171875, -0.19359970092773438, -0.18144989013671875, -0.16930007934570312, -0.1571502685546875, -0.14500045776367188, -0.13285064697265625, -0.12070083618164062, -0.108551025390625, -0.09640121459960938, -0.08425140380859375, -0.07210159301757812, -0.0599517822265625, -0.047801971435546875, -0.03565216064453125, -0.023502349853515625, -0.0113525390625, 0.000797271728515625, 0.01294708251953125, 0.025096893310546875, 0.0372467041015625, 0.049396514892578125, 0.06154632568359375, 0.07369613647460938, 0.085845947265625, 0.09799575805664062, 0.11014556884765625, 0.12229537963867188, 0.1344451904296875, 0.14659500122070312, 0.15874481201171875, 0.17089462280273438, 0.18304443359375, 0.19519424438476562, 0.20734405517578125, 0.21949386596679688, 0.2316436767578125, 0.24379348754882812, 0.25594329833984375, 0.2680931091308594, 0.280242919921875, 0.2923927307128906, 0.30454254150390625, 0.3166923522949219, 0.3288421630859375, 0.3409919738769531, 0.35314178466796875, 0.3652915954589844, 0.37744140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 21.0, 29.0, 54.0, 93.0, 200.0, 492.0, 11757.0, 1033877.0, 1393.0, 274.0, 120.0, 70.0, 40.0, 30.0, 16.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.857666015625, -7.59814453125, -7.338623046875, -7.0791015625, -6.819580078125, -6.56005859375, -6.300537109375, -6.041015625, -5.781494140625, -5.52197265625, -5.262451171875, -5.0029296875, -4.743408203125, -4.48388671875, -4.224365234375, -3.96484375, -3.705322265625, -3.44580078125, -3.186279296875, -2.9267578125, -2.667236328125, -2.40771484375, -2.148193359375, -1.888671875, -1.629150390625, -1.36962890625, -1.110107421875, -0.8505859375, -0.591064453125, -0.33154296875, -0.072021484375, 0.1875, 0.447021484375, 0.70654296875, 0.966064453125, 1.2255859375, 1.485107421875, 1.74462890625, 2.004150390625, 2.263671875, 2.523193359375, 2.78271484375, 3.042236328125, 3.3017578125, 3.561279296875, 3.82080078125, 4.080322265625, 4.33984375, 4.599365234375, 4.85888671875, 5.118408203125, 5.3779296875, 5.637451171875, 5.89697265625, 6.156494140625, 6.416015625, 6.675537109375, 6.93505859375, 7.194580078125, 7.4541015625, 7.713623046875, 7.97314453125, 8.232666015625, 8.4921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 40.0, 258.0, 540.0, 130.0, 19.0, 13.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423232913017273, -1.3887617588043213, -1.35429048538208, -1.3198192119598389, -1.2853480577468872, -1.2508769035339355, -1.2164056301116943, -1.1819343566894531, -1.1474632024765015, -1.1129920482635498, -1.0785207748413086, -1.0440495014190674, -1.0095783472061157, -0.9751071333885193, -0.9406359195709229, -0.9061647057533264, -0.87169349193573, -0.8372222781181335, -0.8027510643005371, -0.7682798504829407, -0.7338086366653442, -0.6993374228477478, -0.6648662090301514, -0.6303949952125549, -0.5959237813949585, -0.5614525675773621, -0.5269813537597656, -0.4925101399421692, -0.45803892612457275, -0.4235677123069763, -0.3890964984893799, -0.35462528467178345, -0.3201541304588318, -0.28568291664123535, -0.2512117028236389, -0.21674048900604248, -0.18226927518844604, -0.1477980613708496, -0.11332684755325317, -0.07885563373565674, -0.0443844199180603, -0.009913206100463867, 0.02455800771713257, 0.059029221534729004, 0.09350043535232544, 0.12797164916992188, 0.1624428629875183, 0.19691407680511475, 0.23138529062271118, 0.2658565044403076, 0.30032771825790405, 0.3347989320755005, 0.3692701458930969, 0.40374135971069336, 0.4382125735282898, 0.47268378734588623, 0.5071550011634827, 0.5416262149810791, 0.5760974287986755, 0.610568642616272, 0.6450398564338684, 0.6795110702514648, 0.7139822840690613, 0.7484534978866577, 0.7829247117042542]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 10.0, 9.0, 15.0, 13.0, 16.0, 13.0, 21.0, 26.0, 36.0, 24.0, 37.0, 45.0, 36.0, 42.0, 39.0, 34.0, 45.0, 31.0, 36.0, 41.0, 40.0, 48.0, 23.0, 35.0, 30.0, 24.0, 43.0, 25.0, 29.0, 17.0, 12.0, 12.0, 13.0, 9.0, 13.0, 8.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2747429609298706, -0.26545190811157227, -0.2561608552932739, -0.24686981737613678, -0.23757877945899963, -0.2282877266407013, -0.21899667382240295, -0.2097056359052658, -0.20041459798812866, -0.19112354516983032, -0.18183250725269318, -0.17254145443439484, -0.1632504165172577, -0.15395936369895935, -0.144668310880661, -0.13537727296352386, -0.12608622014522552, -0.11679517477750778, -0.10750412940979004, -0.0982130765914917, -0.08892203867435455, -0.07963098585605621, -0.07033994048833847, -0.06104889512062073, -0.051757849752902985, -0.04246680438518524, -0.0331757590174675, -0.023884709924459457, -0.014593664556741714, -0.0053026191890239716, 0.00398842990398407, 0.013279475271701813, 0.022570520639419556, 0.0318615660071373, 0.04115261137485504, 0.05044366046786308, 0.059734705835580826, 0.06902575492858887, 0.07831680029630661, 0.08760784566402435, 0.0968988910317421, 0.10618993639945984, 0.11548098176717758, 0.12477202713489532, 0.13406307995319366, 0.1433541178703308, 0.15264517068862915, 0.1619362235069275, 0.17122726142406464, 0.18051831424236298, 0.18980935215950012, 0.19910040497779846, 0.2083914428949356, 0.21768249571323395, 0.2269735336303711, 0.23626458644866943, 0.24555563926696777, 0.2548466920852661, 0.26413774490356445, 0.2734287679195404, 0.28271982073783875, 0.2920108735561371, 0.3013019263744354, 0.3105929493904114, 0.3198840022087097]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 11.0, 14.0, 12.0, 25.0, 26.0, 23.0, 30.0, 30.0, 25.0, 38.0, 33.0, 54.0, 58.0, 44.0, 46.0, 57.0, 34.0, 53.0, 47.0, 31.0, 35.0, 25.0, 25.0, 27.0, 25.0, 19.0, 21.0, 18.0, 27.0, 10.0, 14.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.609466552734375, -3.48651123046875, -3.363555908203125, -3.2406005859375, -3.117645263671875, -2.99468994140625, -2.871734619140625, -2.748779296875, -2.625823974609375, -2.50286865234375, -2.379913330078125, -2.2569580078125, -2.134002685546875, -2.01104736328125, -1.888092041015625, -1.76513671875, -1.642181396484375, -1.51922607421875, -1.396270751953125, -1.2733154296875, -1.150360107421875, -1.02740478515625, -0.904449462890625, -0.781494140625, -0.658538818359375, -0.53558349609375, -0.412628173828125, -0.2896728515625, -0.166717529296875, -0.04376220703125, 0.079193115234375, 0.2021484375, 0.325103759765625, 0.44805908203125, 0.571014404296875, 0.6939697265625, 0.816925048828125, 0.93988037109375, 1.062835693359375, 1.185791015625, 1.308746337890625, 1.43170166015625, 1.554656982421875, 1.6776123046875, 1.800567626953125, 1.92352294921875, 2.046478271484375, 2.16943359375, 2.292388916015625, 2.41534423828125, 2.538299560546875, 2.6612548828125, 2.784210205078125, 2.90716552734375, 3.030120849609375, 3.153076171875, 3.276031494140625, 3.39898681640625, 3.521942138671875, 3.6448974609375, 3.767852783203125, 3.89080810546875, 4.013763427734375, 4.13671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 13.0, 28.0, 24.0, 35.0, 79.0, 75.0, 106.0, 198.0, 315.0, 430.0, 624.0, 1073.0, 1685.0, 2820.0, 4806.0, 8945.0, 16816.0, 33790.0, 73748.0, 181310.0, 365130.0, 199208.0, 80284.0, 36727.0, 17801.0, 9546.0, 5093.0, 2958.0, 1736.0, 1059.0, 704.0, 418.0, 297.0, 194.0, 137.0, 86.0, 67.0, 50.0, 36.0, 27.0, 13.0, 13.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7890625, -4.63726806640625, -4.4854736328125, -4.33367919921875, -4.181884765625, -4.03009033203125, -3.8782958984375, -3.72650146484375, -3.57470703125, -3.42291259765625, -3.2711181640625, -3.11932373046875, -2.967529296875, -2.81573486328125, -2.6639404296875, -2.51214599609375, -2.3603515625, -2.20855712890625, -2.0567626953125, -1.90496826171875, -1.753173828125, -1.60137939453125, -1.4495849609375, -1.29779052734375, -1.14599609375, -0.99420166015625, -0.8424072265625, -0.69061279296875, -0.538818359375, -0.38702392578125, -0.2352294921875, -0.08343505859375, 0.068359375, 0.22015380859375, 0.3719482421875, 0.52374267578125, 0.675537109375, 0.82733154296875, 0.9791259765625, 1.13092041015625, 1.28271484375, 1.43450927734375, 1.5863037109375, 1.73809814453125, 1.889892578125, 2.04168701171875, 2.1934814453125, 2.34527587890625, 2.4970703125, 2.64886474609375, 2.8006591796875, 2.95245361328125, 3.104248046875, 3.25604248046875, 3.4078369140625, 3.55963134765625, 3.71142578125, 3.86322021484375, 4.0150146484375, 4.16680908203125, 4.318603515625, 4.47039794921875, 4.6221923828125, 4.77398681640625, 4.92578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 8.0, 7.0, 10.0, 11.0, 14.0, 22.0, 28.0, 26.0, 33.0, 20.0, 28.0, 40.0, 53.0, 65.0, 91.0, 194.0, 1412.0, 341.0, 168.0, 84.0, 56.0, 50.0, 47.0, 25.0, 38.0, 31.0, 23.0, 20.0, 14.0, 23.0, 19.0, 8.0, 9.0, 8.0, 7.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-11.8515625, -11.5390625, -11.2265625, -10.9140625, -10.6015625, -10.2890625, -9.9765625, -9.6640625, -9.3515625, -9.0390625, -8.7265625, -8.4140625, -8.1015625, -7.7890625, -7.4765625, -7.1640625, -6.8515625, -6.5390625, -6.2265625, -5.9140625, -5.6015625, -5.2890625, -4.9765625, -4.6640625, -4.3515625, -4.0390625, -3.7265625, -3.4140625, -3.1015625, -2.7890625, -2.4765625, -2.1640625, -1.8515625, -1.5390625, -1.2265625, -0.9140625, -0.6015625, -0.2890625, 0.0234375, 0.3359375, 0.6484375, 0.9609375, 1.2734375, 1.5859375, 1.8984375, 2.2109375, 2.5234375, 2.8359375, 3.1484375, 3.4609375, 3.7734375, 4.0859375, 4.3984375, 4.7109375, 5.0234375, 5.3359375, 5.6484375, 5.9609375, 6.2734375, 6.5859375, 6.8984375, 7.2109375, 7.5234375, 7.8359375, 8.1484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 6.0, 7.0, 17.0, 14.0, 20.0, 24.0, 35.0, 39.0, 41.0, 61.0, 96.0, 145.0, 236.0, 360.0, 626.0, 1828.0, 18223.0, 2969360.0, 147951.0, 4268.0, 983.0, 470.0, 257.0, 181.0, 126.0, 71.0, 47.0, 38.0, 31.0, 17.0, 20.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0], "bins": [-25.890625, -25.145263671875, -24.39990234375, -23.654541015625, -22.9091796875, -22.163818359375, -21.41845703125, -20.673095703125, -19.927734375, -19.182373046875, -18.43701171875, -17.691650390625, -16.9462890625, -16.200927734375, -15.45556640625, -14.710205078125, -13.96484375, -13.219482421875, -12.47412109375, -11.728759765625, -10.9833984375, -10.238037109375, -9.49267578125, -8.747314453125, -8.001953125, -7.256591796875, -6.51123046875, -5.765869140625, -5.0205078125, -4.275146484375, -3.52978515625, -2.784423828125, -2.0390625, -1.293701171875, -0.54833984375, 0.197021484375, 0.9423828125, 1.687744140625, 2.43310546875, 3.178466796875, 3.923828125, 4.669189453125, 5.41455078125, 6.159912109375, 6.9052734375, 7.650634765625, 8.39599609375, 9.141357421875, 9.88671875, 10.632080078125, 11.37744140625, 12.122802734375, 12.8681640625, 13.613525390625, 14.35888671875, 15.104248046875, 15.849609375, 16.594970703125, 17.34033203125, 18.085693359375, 18.8310546875, 19.576416015625, 20.32177734375, 21.067138671875, 21.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 17.0, 125.0, 341.0, 372.0, 129.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.57786560058594, -113.2703628540039, -110.96285247802734, -108.65534973144531, -106.34784698486328, -104.04034423828125, -101.73283386230469, -99.42533111572266, -97.11782836914062, -94.8103256225586, -92.50281524658203, -90.1953125, -87.88780975341797, -85.58030700683594, -83.27279663085938, -80.96529388427734, -78.65778350830078, -76.35028076171875, -74.04277038574219, -71.73526763916016, -69.42776489257812, -67.12025451660156, -64.81275177001953, -62.5052490234375, -60.1977424621582, -57.890235900878906, -55.582733154296875, -53.27522659301758, -50.96772003173828, -48.66021728515625, -46.35271072387695, -44.045204162597656, -41.737701416015625, -39.43019485473633, -37.1226921081543, -34.815185546875, -32.50768280029297, -30.200176239013672, -27.892669677734375, -25.58516502380371, -23.277660369873047, -20.970155715942383, -18.66265106201172, -16.355144500732422, -14.047639846801758, -11.740135192871094, -9.432629585266113, -7.125123977661133, -4.817619323730469, -2.5101141929626465, -0.20260906219482422, 2.104896068572998, 4.41240119934082, 6.719905853271484, 9.027411460876465, 11.334917068481445, 13.64242172241211, 15.949926376342773, 18.257431030273438, 20.564937591552734, 22.8724422454834, 25.179946899414062, 27.48745346069336, 29.794958114624023, 32.10246276855469]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 3.0, 7.0, 7.0, 10.0, 8.0, 18.0, 9.0, 20.0, 15.0, 29.0, 24.0, 30.0, 37.0, 34.0, 38.0, 36.0, 50.0, 46.0, 47.0, 45.0, 36.0, 49.0, 46.0, 39.0, 38.0, 32.0, 21.0, 26.0, 28.0, 23.0, 26.0, 20.0, 26.0, 10.0, 21.0, 10.0, 11.0, 4.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.476526260375977, -25.670103073120117, -24.863679885864258, -24.057254791259766, -23.250831604003906, -22.444408416748047, -21.637985229492188, -20.831562042236328, -20.02513885498047, -19.21871566772461, -18.41229248046875, -17.60586929321289, -16.7994441986084, -15.993021011352539, -15.18659782409668, -14.38017463684082, -13.573750495910645, -12.767327308654785, -11.96090316772461, -11.15447998046875, -10.34805679321289, -9.541633605957031, -8.735209465026855, -7.928786277770996, -7.1223626136779785, -6.315938949584961, -5.509515762329102, -4.703092098236084, -3.8966686725616455, -3.090245246887207, -2.2838215827941895, -1.47739839553833, -0.6709747314453125, 0.13544875383377075, 0.941872239112854, 1.748295783996582, 2.5547192096710205, 3.361142635345459, 4.167566299438477, 4.973989486694336, 5.7804131507873535, 6.586836814880371, 7.3932600021362305, 8.199684143066406, 9.006107330322266, 9.812530517578125, 10.618953704833984, 11.425376892089844, 12.23180103302002, 13.038224220275879, 13.844648361206055, 14.651071548461914, 15.457494735717773, 16.263917922973633, 17.070343017578125, 17.876766204833984, 18.683189392089844, 19.489612579345703, 20.296035766601562, 21.102458953857422, 21.908884048461914, 22.715307235717773, 23.521730422973633, 24.328153610229492, 25.13457679748535]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 12.0, 13.0, 15.0, 17.0, 21.0, 31.0, 24.0, 35.0, 38.0, 47.0, 34.0, 45.0, 57.0, 43.0, 56.0, 54.0, 39.0, 46.0, 44.0, 36.0, 41.0, 35.0, 30.0, 29.0, 22.0, 24.0, 21.0, 12.0, 20.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13739013671875, -4.0013427734375, -3.86529541015625, -3.729248046875, -3.59320068359375, -3.4571533203125, -3.32110595703125, -3.18505859375, -3.04901123046875, -2.9129638671875, -2.77691650390625, -2.640869140625, -2.50482177734375, -2.3687744140625, -2.23272705078125, -2.0966796875, -1.96063232421875, -1.8245849609375, -1.68853759765625, -1.552490234375, -1.41644287109375, -1.2803955078125, -1.14434814453125, -1.00830078125, -0.87225341796875, -0.7362060546875, -0.60015869140625, -0.464111328125, -0.32806396484375, -0.1920166015625, -0.05596923828125, 0.080078125, 0.21612548828125, 0.3521728515625, 0.48822021484375, 0.624267578125, 0.76031494140625, 0.8963623046875, 1.03240966796875, 1.16845703125, 1.30450439453125, 1.4405517578125, 1.57659912109375, 1.712646484375, 1.84869384765625, 1.9847412109375, 2.12078857421875, 2.2568359375, 2.39288330078125, 2.5289306640625, 2.66497802734375, 2.801025390625, 2.93707275390625, 3.0731201171875, 3.20916748046875, 3.34521484375, 3.48126220703125, 3.6173095703125, 3.75335693359375, 3.889404296875, 4.02545166015625, 4.1614990234375, 4.29754638671875, 4.43359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 5.0, 3.0, 2.0, 10.0, 15.0, 24.0, 22.0, 29.0, 52.0, 63.0, 89.0, 117.0, 162.0, 235.0, 302.0, 466.0, 638.0, 898.0, 1370.0, 2175.0, 3787.0, 6985.0, 14283.0, 35694.0, 115746.0, 430163.0, 1408792.0, 1530492.0, 458715.0, 115234.0, 34971.0, 14786.0, 7065.0, 3946.0, 2294.0, 1475.0, 935.0, 635.0, 485.0, 296.0, 191.0, 169.0, 128.0, 100.0, 70.0, 51.0, 37.0, 19.0, 22.0, 11.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0], "bins": [-4.83203125, -4.69000244140625, -4.5479736328125, -4.40594482421875, -4.263916015625, -4.12188720703125, -3.9798583984375, -3.83782958984375, -3.69580078125, -3.55377197265625, -3.4117431640625, -3.26971435546875, -3.127685546875, -2.98565673828125, -2.8436279296875, -2.70159912109375, -2.5595703125, -2.41754150390625, -2.2755126953125, -2.13348388671875, -1.991455078125, -1.84942626953125, -1.7073974609375, -1.56536865234375, -1.42333984375, -1.28131103515625, -1.1392822265625, -0.99725341796875, -0.855224609375, -0.71319580078125, -0.5711669921875, -0.42913818359375, -0.287109375, -0.14508056640625, -0.0030517578125, 0.13897705078125, 0.281005859375, 0.42303466796875, 0.5650634765625, 0.70709228515625, 0.84912109375, 0.99114990234375, 1.1331787109375, 1.27520751953125, 1.417236328125, 1.55926513671875, 1.7012939453125, 1.84332275390625, 1.9853515625, 2.12738037109375, 2.2694091796875, 2.41143798828125, 2.553466796875, 2.69549560546875, 2.8375244140625, 2.97955322265625, 3.12158203125, 3.26361083984375, 3.4056396484375, 3.54766845703125, 3.689697265625, 3.83172607421875, 3.9737548828125, 4.11578369140625, 4.2578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 15.0, 8.0, 9.0, 26.0, 22.0, 37.0, 30.0, 52.0, 87.0, 110.0, 103.0, 140.0, 195.0, 301.0, 467.0, 562.0, 523.0, 381.0, 244.0, 180.0, 122.0, 88.0, 79.0, 65.0, 53.0, 41.0, 35.0, 27.0, 11.0, 22.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.8863525390625, -6.682861328125, -6.4793701171875, -6.27587890625, -6.0723876953125, -5.868896484375, -5.6654052734375, -5.4619140625, -5.2584228515625, -5.054931640625, -4.8514404296875, -4.64794921875, -4.4444580078125, -4.240966796875, -4.0374755859375, -3.833984375, -3.6304931640625, -3.427001953125, -3.2235107421875, -3.02001953125, -2.8165283203125, -2.613037109375, -2.4095458984375, -2.2060546875, -2.0025634765625, -1.799072265625, -1.5955810546875, -1.39208984375, -1.1885986328125, -0.985107421875, -0.7816162109375, -0.578125, -0.3746337890625, -0.171142578125, 0.0323486328125, 0.23583984375, 0.4393310546875, 0.642822265625, 0.8463134765625, 1.0498046875, 1.2532958984375, 1.456787109375, 1.6602783203125, 1.86376953125, 2.0672607421875, 2.270751953125, 2.4742431640625, 2.677734375, 2.8812255859375, 3.084716796875, 3.2882080078125, 3.49169921875, 3.6951904296875, 3.898681640625, 4.1021728515625, 4.3056640625, 4.5091552734375, 4.712646484375, 4.9161376953125, 5.11962890625, 5.3231201171875, 5.526611328125, 5.7301025390625, 5.93359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 10.0, 8.0, 18.0, 21.0, 17.0, 28.0, 31.0, 62.0, 83.0, 127.0, 208.0, 288.0, 480.0, 782.0, 1301.0, 2523.0, 5991.0, 18329.0, 78661.0, 446471.0, 2885271.0, 615516.0, 101235.0, 23016.0, 7131.0, 2901.0, 1496.0, 833.0, 515.0, 322.0, 197.0, 130.0, 102.0, 56.0, 32.0, 27.0, 19.0, 13.0, 10.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1875, -6.9268798828125, -6.666259765625, -6.4056396484375, -6.14501953125, -5.8843994140625, -5.623779296875, -5.3631591796875, -5.1025390625, -4.8419189453125, -4.581298828125, -4.3206787109375, -4.06005859375, -3.7994384765625, -3.538818359375, -3.2781982421875, -3.017578125, -2.7569580078125, -2.496337890625, -2.2357177734375, -1.97509765625, -1.7144775390625, -1.453857421875, -1.1932373046875, -0.9326171875, -0.6719970703125, -0.411376953125, -0.1507568359375, 0.10986328125, 0.3704833984375, 0.631103515625, 0.8917236328125, 1.15234375, 1.4129638671875, 1.673583984375, 1.9342041015625, 2.19482421875, 2.4554443359375, 2.716064453125, 2.9766845703125, 3.2373046875, 3.4979248046875, 3.758544921875, 4.0191650390625, 4.27978515625, 4.5404052734375, 4.801025390625, 5.0616455078125, 5.322265625, 5.5828857421875, 5.843505859375, 6.1041259765625, 6.36474609375, 6.6253662109375, 6.885986328125, 7.1466064453125, 7.4072265625, 7.6678466796875, 7.928466796875, 8.1890869140625, 8.44970703125, 8.7103271484375, 8.970947265625, 9.2315673828125, 9.4921875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 19.0, 222.0, 553.0, 196.0, 17.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.85098266601562, -154.71749877929688, -150.58399963378906, -146.4505157470703, -142.31703186035156, -138.1835479736328, -134.050048828125, -129.91656494140625, -125.7830810546875, -121.64958953857422, -117.51610565185547, -113.38261413574219, -109.24913024902344, -105.11563873291016, -100.98214721679688, -96.84866333007812, -92.71517181396484, -88.58168029785156, -84.44819641113281, -80.31470489501953, -76.18122100830078, -72.0477294921875, -67.91424560546875, -63.78075408935547, -59.64726638793945, -55.51377868652344, -51.38029098510742, -47.246803283691406, -43.113311767578125, -38.979827880859375, -34.846336364746094, -30.712848663330078, -26.579360961914062, -22.445873260498047, -18.31238555908203, -14.178895950317383, -10.045408248901367, -5.911920547485352, -1.7784309387207031, 2.3550567626953125, 6.488544464111328, 10.622032165527344, 14.755520820617676, 18.889009475708008, 23.022497177124023, 27.15598487854004, 31.289474487304688, 35.4229621887207, 39.55644989013672, 43.689937591552734, 47.82342529296875, 51.95691680908203, 56.09040069580078, 60.22389221191406, 64.35737609863281, 68.4908676147461, 72.62435913085938, 76.75785064697266, 80.8913345336914, 85.02482604980469, 89.15830993652344, 93.29180145263672, 97.42529296875, 101.55877685546875, 105.6922607421875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 3.0, 3.0, 7.0, 11.0, 14.0, 7.0, 11.0, 21.0, 20.0, 21.0, 20.0, 25.0, 30.0, 32.0, 33.0, 35.0, 38.0, 28.0, 40.0, 40.0, 30.0, 44.0, 41.0, 46.0, 42.0, 56.0, 38.0, 39.0, 31.0, 25.0, 33.0, 14.0, 18.0, 18.0, 18.0, 14.0, 11.0, 12.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.935544967651367, -23.193965911865234, -22.45238494873047, -21.710805892944336, -20.96922492980957, -20.227645874023438, -19.486064910888672, -18.74448585510254, -18.002906799316406, -17.261327743530273, -16.519746780395508, -15.778167724609375, -15.036587715148926, -14.295007705688477, -13.553427696228027, -12.811847686767578, -12.070267677307129, -11.32868766784668, -10.58710765838623, -9.845527648925781, -9.103948593139648, -8.3623685836792, -7.62078857421875, -6.879209041595459, -6.13762903213501, -5.3960490226745605, -4.6544694900512695, -3.9128894805908203, -3.17130970954895, -2.42972993850708, -1.6881499290466309, -0.9465703964233398, -0.20499038696289062, 0.5365894436836243, 1.2781692743301392, 2.019749164581299, 2.761328935623169, 3.502908706665039, 4.244488716125488, 4.986068248748779, 5.7276482582092285, 6.469228267669678, 7.210807800292969, 7.952387809753418, 8.693967819213867, 9.435546875, 10.177127838134766, 10.918706893920898, 11.660286903381348, 12.401866912841797, 13.143446922302246, 13.885026931762695, 14.626605987548828, 15.368185997009277, 16.109766006469727, 16.85134506225586, 17.592926025390625, 18.334505081176758, 19.076086044311523, 19.817665100097656, 20.559246063232422, 21.300825119018555, 22.042404174804688, 22.783985137939453, 23.525564193725586]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 16.0, 19.0, 19.0, 15.0, 22.0, 30.0, 34.0, 23.0, 36.0, 37.0, 29.0, 36.0, 38.0, 40.0, 37.0, 37.0, 32.0, 33.0, 39.0, 40.0, 37.0, 29.0, 36.0, 28.0, 18.0, 28.0, 21.0, 19.0, 20.0, 19.0, 12.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0], "bins": [-2.810546875, -2.7255859375, -2.640625, -2.5556640625, -2.470703125, -2.3857421875, -2.30078125, -2.2158203125, -2.130859375, -2.0458984375, -1.9609375, -1.8759765625, -1.791015625, -1.7060546875, -1.62109375, -1.5361328125, -1.451171875, -1.3662109375, -1.28125, -1.1962890625, -1.111328125, -1.0263671875, -0.94140625, -0.8564453125, -0.771484375, -0.6865234375, -0.6015625, -0.5166015625, -0.431640625, -0.3466796875, -0.26171875, -0.1767578125, -0.091796875, -0.0068359375, 0.078125, 0.1630859375, 0.248046875, 0.3330078125, 0.41796875, 0.5029296875, 0.587890625, 0.6728515625, 0.7578125, 0.8427734375, 0.927734375, 1.0126953125, 1.09765625, 1.1826171875, 1.267578125, 1.3525390625, 1.4375, 1.5224609375, 1.607421875, 1.6923828125, 1.77734375, 1.8623046875, 1.947265625, 2.0322265625, 2.1171875, 2.2021484375, 2.287109375, 2.3720703125, 2.45703125, 2.5419921875, 2.626953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 31.0, 41.0, 50.0, 77.0, 115.0, 171.0, 252.0, 372.0, 554.0, 818.0, 1189.0, 1943.0, 3036.0, 4958.0, 7892.0, 12653.0, 21952.0, 37743.0, 65510.0, 113168.0, 185345.0, 220414.0, 152409.0, 90633.0, 52283.0, 29595.0, 17629.0, 10443.0, 6301.0, 3779.0, 2466.0, 1550.0, 1000.0, 686.0, 469.0, 310.0, 224.0, 134.0, 113.0, 75.0, 41.0, 31.0, 27.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.378662109375, -0.36728668212890625, -0.3559112548828125, -0.34453582763671875, -0.333160400390625, -0.32178497314453125, -0.3104095458984375, -0.29903411865234375, -0.28765869140625, -0.27628326416015625, -0.2649078369140625, -0.25353240966796875, -0.242156982421875, -0.23078155517578125, -0.2194061279296875, -0.20803070068359375, -0.1966552734375, -0.18527984619140625, -0.1739044189453125, -0.16252899169921875, -0.151153564453125, -0.13977813720703125, -0.1284027099609375, -0.11702728271484375, -0.10565185546875, -0.09427642822265625, -0.0829010009765625, -0.07152557373046875, -0.060150146484375, -0.04877471923828125, -0.0373992919921875, -0.02602386474609375, -0.0146484375, -0.00327301025390625, 0.0081024169921875, 0.01947784423828125, 0.030853271484375, 0.04222869873046875, 0.0536041259765625, 0.06497955322265625, 0.07635498046875, 0.08773040771484375, 0.0991058349609375, 0.11048126220703125, 0.121856689453125, 0.13323211669921875, 0.1446075439453125, 0.15598297119140625, 0.1673583984375, 0.17873382568359375, 0.1901092529296875, 0.20148468017578125, 0.212860107421875, 0.22423553466796875, 0.2356109619140625, 0.24698638916015625, 0.25836181640625, 0.26973724365234375, 0.2811126708984375, 0.29248809814453125, 0.303863525390625, 0.31523895263671875, 0.3266143798828125, 0.33798980712890625, 0.349365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 4.0, 9.0, 7.0, 15.0, 8.0, 15.0, 23.0, 14.0, 16.0, 24.0, 31.0, 31.0, 37.0, 37.0, 38.0, 38.0, 28.0, 33.0, 39.0, 45.0, 1069.0, 35.0, 43.0, 37.0, 40.0, 26.0, 37.0, 24.0, 40.0, 23.0, 22.0, 22.0, 23.0, 19.0, 10.0, 13.0, 10.0, 6.0, 2.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.14959716796875, -2.0784912109375, -2.00738525390625, -1.936279296875, -1.86517333984375, -1.7940673828125, -1.72296142578125, -1.65185546875, -1.58074951171875, -1.5096435546875, -1.43853759765625, -1.367431640625, -1.29632568359375, -1.2252197265625, -1.15411376953125, -1.0830078125, -1.01190185546875, -0.9407958984375, -0.86968994140625, -0.798583984375, -0.72747802734375, -0.6563720703125, -0.58526611328125, -0.51416015625, -0.44305419921875, -0.3719482421875, -0.30084228515625, -0.229736328125, -0.15863037109375, -0.0875244140625, -0.01641845703125, 0.0546875, 0.12579345703125, 0.1968994140625, 0.26800537109375, 0.339111328125, 0.41021728515625, 0.4813232421875, 0.55242919921875, 0.62353515625, 0.69464111328125, 0.7657470703125, 0.83685302734375, 0.907958984375, 0.97906494140625, 1.0501708984375, 1.12127685546875, 1.1923828125, 1.26348876953125, 1.3345947265625, 1.40570068359375, 1.476806640625, 1.54791259765625, 1.6190185546875, 1.69012451171875, 1.76123046875, 1.83233642578125, 1.9034423828125, 1.97454833984375, 2.045654296875, 2.11676025390625, 2.1878662109375, 2.25897216796875, 2.330078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 16.0, 25.0, 49.0, 67.0, 121.0, 176.0, 342.0, 706.0, 1634.0, 4252.0, 12901.0, 50466.0, 248536.0, 1489727.0, 222880.0, 46285.0, 12175.0, 3798.0, 1490.0, 653.0, 345.0, 197.0, 105.0, 55.0, 34.0, 17.0, 14.0, 16.0, 13.0, 2.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6912612915039062, -0.6706085205078125, -0.6499557495117188, -0.629302978515625, -0.6086502075195312, -0.5879974365234375, -0.5673446655273438, -0.54669189453125, -0.5260391235351562, -0.5053863525390625, -0.48473358154296875, -0.464080810546875, -0.44342803955078125, -0.4227752685546875, -0.40212249755859375, -0.3814697265625, -0.36081695556640625, -0.3401641845703125, -0.31951141357421875, -0.298858642578125, -0.27820587158203125, -0.2575531005859375, -0.23690032958984375, -0.21624755859375, -0.19559478759765625, -0.1749420166015625, -0.15428924560546875, -0.133636474609375, -0.11298370361328125, -0.0923309326171875, -0.07167816162109375, -0.051025390625, -0.03037261962890625, -0.0097198486328125, 0.01093292236328125, 0.031585693359375, 0.05223846435546875, 0.0728912353515625, 0.09354400634765625, 0.11419677734375, 0.13484954833984375, 0.1555023193359375, 0.17615509033203125, 0.196807861328125, 0.21746063232421875, 0.2381134033203125, 0.25876617431640625, 0.2794189453125, 0.30007171630859375, 0.3207244873046875, 0.34137725830078125, 0.362030029296875, 0.38268280029296875, 0.4033355712890625, 0.42398834228515625, 0.44464111328125, 0.46529388427734375, 0.4859466552734375, 0.5065994262695312, 0.527252197265625, 0.5479049682617188, 0.5685577392578125, 0.5892105102539062, 0.60986328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 10.0, 17.0, 18.0, 24.0, 27.0, 62.0, 61.0, 88.0, 133.0, 139.0, 132.0, 68.0, 41.0, 26.0, 29.0, 14.0, 13.0, 10.0, 9.0, 6.0, 14.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.090576171875, -0.0881357192993164, -0.08569526672363281, -0.08325481414794922, -0.08081436157226562, -0.07837390899658203, -0.07593345642089844, -0.07349300384521484, -0.07105255126953125, -0.06861209869384766, -0.06617164611816406, -0.06373119354248047, -0.061290740966796875, -0.05885028839111328, -0.05640983581542969, -0.053969383239746094, -0.0515289306640625, -0.049088478088378906, -0.04664802551269531, -0.04420757293701172, -0.041767120361328125, -0.03932666778564453, -0.03688621520996094, -0.034445762634277344, -0.03200531005859375, -0.029564857482910156, -0.027124404907226562, -0.02468395233154297, -0.022243499755859375, -0.01980304718017578, -0.017362594604492188, -0.014922142028808594, -0.012481689453125, -0.010041236877441406, -0.0076007843017578125, -0.005160331726074219, -0.002719879150390625, -0.00027942657470703125, 0.0021610260009765625, 0.004601478576660156, 0.00704193115234375, 0.009482383728027344, 0.011922836303710938, 0.014363288879394531, 0.016803741455078125, 0.01924419403076172, 0.021684646606445312, 0.024125099182128906, 0.0265655517578125, 0.029006004333496094, 0.03144645690917969, 0.03388690948486328, 0.036327362060546875, 0.03876781463623047, 0.04120826721191406, 0.043648719787597656, 0.04608917236328125, 0.048529624938964844, 0.05097007751464844, 0.05341053009033203, 0.055850982666015625, 0.05829143524169922, 0.06073188781738281, 0.0631723403930664, 0.06561279296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 4.0, 7.0, 13.0, 10.0, 18.0, 35.0, 27.0, 32.0, 61.0, 83.0, 171.0, 317.0, 1021.0, 1026617.0, 18845.0, 568.0, 267.0, 123.0, 92.0, 54.0, 42.0, 30.0, 20.0, 17.0, 13.0, 6.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.646484375, -1.593017578125, -1.53955078125, -1.486083984375, -1.4326171875, -1.379150390625, -1.32568359375, -1.272216796875, -1.21875, -1.165283203125, -1.11181640625, -1.058349609375, -1.0048828125, -0.951416015625, -0.89794921875, -0.844482421875, -0.791015625, -0.737548828125, -0.68408203125, -0.630615234375, -0.5771484375, -0.523681640625, -0.47021484375, -0.416748046875, -0.36328125, -0.309814453125, -0.25634765625, -0.202880859375, -0.1494140625, -0.095947265625, -0.04248046875, 0.010986328125, 0.064453125, 0.117919921875, 0.17138671875, 0.224853515625, 0.2783203125, 0.331787109375, 0.38525390625, 0.438720703125, 0.4921875, 0.545654296875, 0.59912109375, 0.652587890625, 0.7060546875, 0.759521484375, 0.81298828125, 0.866455078125, 0.919921875, 0.973388671875, 1.02685546875, 1.080322265625, 1.1337890625, 1.187255859375, 1.24072265625, 1.294189453125, 1.34765625, 1.401123046875, 1.45458984375, 1.508056640625, 1.5615234375, 1.614990234375, 1.66845703125, 1.721923828125, 1.775390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 67.0, 617.0, 297.0, 27.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23715998232364655, -0.22576290369033813, -0.21436583995819092, -0.2029687613248825, -0.1915716826915741, -0.18017460405826569, -0.16877752542495728, -0.15738046169281006, -0.14598338305950165, -0.13458630442619324, -0.12318923324346542, -0.11179216206073761, -0.1003950834274292, -0.08899800479412079, -0.07760093361139297, -0.06620386242866516, -0.05480678379535675, -0.04340970888733864, -0.032012633979320526, -0.020615559071302414, -0.009218484163284302, 0.0021785907447338104, 0.013575665652751923, 0.024972736835479736, 0.03636981546878815, 0.04776689037680626, 0.05916396528482437, 0.07056103646755219, 0.0819581151008606, 0.093355193734169, 0.10475226491689682, 0.11614933609962463, 0.12754639983177185, 0.13894347846508026, 0.15034055709838867, 0.1617376208305359, 0.1731346994638443, 0.1845317780971527, 0.19592884182929993, 0.20732592046260834, 0.21872299909591675, 0.23012007772922516, 0.24151715636253357, 0.2529142200946808, 0.2643113136291504, 0.2757083773612976, 0.2871054410934448, 0.29850250482559204, 0.30989959836006165, 0.32129666209220886, 0.33269375562667847, 0.3440908193588257, 0.3554878830909729, 0.3668849766254425, 0.3782820403575897, 0.3896791338920593, 0.40107619762420654, 0.41247326135635376, 0.42387035489082336, 0.4352674186229706, 0.4466645121574402, 0.4580615758895874, 0.4694586396217346, 0.48085570335388184, 0.49225279688835144]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 13.0, 8.0, 9.0, 20.0, 13.0, 18.0, 23.0, 20.0, 38.0, 33.0, 44.0, 31.0, 42.0, 37.0, 44.0, 47.0, 50.0, 46.0, 36.0, 55.0, 48.0, 44.0, 38.0, 27.0, 35.0, 31.0, 22.0, 23.0, 28.0, 19.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05618172883987427, -0.05404782295227051, -0.051913920789957047, -0.049780018627643585, -0.047646112740039825, -0.045512206852436066, -0.043378304690122604, -0.04124440252780914, -0.03911049664020538, -0.036976590752601624, -0.03484268859028816, -0.0327087864279747, -0.03057488054037094, -0.02844097651541233, -0.02630707249045372, -0.02417316846549511, -0.0220392644405365, -0.01990536041557789, -0.017771456390619278, -0.015637552365660667, -0.013503648340702057, -0.011369744315743446, -0.009235840290784836, -0.007101936265826225, -0.004968032240867615, -0.002834128215909004, -0.0007002241909503937, 0.0014336798340082169, 0.0035675838589668274, 0.005701487883925438, 0.007835391908884048, 0.009969295933842659, 0.01210319995880127, 0.01423710398375988, 0.01637100800871849, 0.0185049120336771, 0.02063881605863571, 0.022772720083594322, 0.024906624108552933, 0.027040528133511543, 0.029174432158470154, 0.031308338046073914, 0.033442240208387375, 0.035576142370700836, 0.037710048258304596, 0.039843954145908356, 0.04197785630822182, 0.04411175847053528, 0.04624566435813904, 0.0483795702457428, 0.05051347240805626, 0.05264737457036972, 0.05478128045797348, 0.05691518634557724, 0.0590490885078907, 0.06118299067020416, 0.06331689655780792, 0.06545080244541168, 0.06758470833301544, 0.0697186067700386, 0.07185251265764236, 0.07398641854524612, 0.07612031698226929, 0.07825422286987305, 0.0803881287574768]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 0.0, 4.0, 1.0, 8.0, 9.0, 6.0, 11.0, 12.0, 18.0, 13.0, 21.0, 26.0, 33.0, 24.0, 31.0, 34.0, 41.0, 33.0, 43.0, 36.0, 46.0, 36.0, 49.0, 42.0, 30.0, 41.0, 40.0, 34.0, 37.0, 21.0, 29.0, 35.0, 23.0, 13.0, 27.0, 23.0, 18.0, 12.0, 9.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0], "bins": [-3.279296875, -3.18701171875, -3.0947265625, -3.00244140625, -2.91015625, -2.81787109375, -2.7255859375, -2.63330078125, -2.541015625, -2.44873046875, -2.3564453125, -2.26416015625, -2.171875, -2.07958984375, -1.9873046875, -1.89501953125, -1.802734375, -1.71044921875, -1.6181640625, -1.52587890625, -1.43359375, -1.34130859375, -1.2490234375, -1.15673828125, -1.064453125, -0.97216796875, -0.8798828125, -0.78759765625, -0.6953125, -0.60302734375, -0.5107421875, -0.41845703125, -0.326171875, -0.23388671875, -0.1416015625, -0.04931640625, 0.04296875, 0.13525390625, 0.2275390625, 0.31982421875, 0.412109375, 0.50439453125, 0.5966796875, 0.68896484375, 0.78125, 0.87353515625, 0.9658203125, 1.05810546875, 1.150390625, 1.24267578125, 1.3349609375, 1.42724609375, 1.51953125, 1.61181640625, 1.7041015625, 1.79638671875, 1.888671875, 1.98095703125, 2.0732421875, 2.16552734375, 2.2578125, 2.35009765625, 2.4423828125, 2.53466796875, 2.626953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 13.0, 15.0, 18.0, 32.0, 48.0, 65.0, 83.0, 122.0, 173.0, 267.0, 435.0, 698.0, 1106.0, 1843.0, 3475.0, 6632.0, 13107.0, 28071.0, 70064.0, 247232.0, 464830.0, 125851.0, 44263.0, 19315.0, 9263.0, 4871.0, 2616.0, 1538.0, 909.0, 524.0, 316.0, 238.0, 148.0, 107.0, 60.0, 58.0, 45.0, 24.0, 19.0, 13.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.6671142578125, -4.517822265625, -4.3685302734375, -4.21923828125, -4.0699462890625, -3.920654296875, -3.7713623046875, -3.6220703125, -3.4727783203125, -3.323486328125, -3.1741943359375, -3.02490234375, -2.8756103515625, -2.726318359375, -2.5770263671875, -2.427734375, -2.2784423828125, -2.129150390625, -1.9798583984375, -1.83056640625, -1.6812744140625, -1.531982421875, -1.3826904296875, -1.2333984375, -1.0841064453125, -0.934814453125, -0.7855224609375, -0.63623046875, -0.4869384765625, -0.337646484375, -0.1883544921875, -0.0390625, 0.1102294921875, 0.259521484375, 0.4088134765625, 0.55810546875, 0.7073974609375, 0.856689453125, 1.0059814453125, 1.1552734375, 1.3045654296875, 1.453857421875, 1.6031494140625, 1.75244140625, 1.9017333984375, 2.051025390625, 2.2003173828125, 2.349609375, 2.4989013671875, 2.648193359375, 2.7974853515625, 2.94677734375, 3.0960693359375, 3.245361328125, 3.3946533203125, 3.5439453125, 3.6932373046875, 3.842529296875, 3.9918212890625, 4.14111328125, 4.2904052734375, 4.439697265625, 4.5889892578125, 4.73828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 7.0, 3.0, 7.0, 12.0, 11.0, 13.0, 22.0, 25.0, 33.0, 34.0, 32.0, 46.0, 57.0, 44.0, 87.0, 158.0, 370.0, 1473.0, 151.0, 108.0, 60.0, 39.0, 28.0, 37.0, 32.0, 23.0, 21.0, 18.0, 12.0, 14.0, 14.0, 13.0, 10.0, 7.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.18896484375, -6.9326171875, -6.67626953125, -6.419921875, -6.16357421875, -5.9072265625, -5.65087890625, -5.39453125, -5.13818359375, -4.8818359375, -4.62548828125, -4.369140625, -4.11279296875, -3.8564453125, -3.60009765625, -3.34375, -3.08740234375, -2.8310546875, -2.57470703125, -2.318359375, -2.06201171875, -1.8056640625, -1.54931640625, -1.29296875, -1.03662109375, -0.7802734375, -0.52392578125, -0.267578125, -0.01123046875, 0.2451171875, 0.50146484375, 0.7578125, 1.01416015625, 1.2705078125, 1.52685546875, 1.783203125, 2.03955078125, 2.2958984375, 2.55224609375, 2.80859375, 3.06494140625, 3.3212890625, 3.57763671875, 3.833984375, 4.09033203125, 4.3466796875, 4.60302734375, 4.859375, 5.11572265625, 5.3720703125, 5.62841796875, 5.884765625, 6.14111328125, 6.3974609375, 6.65380859375, 6.91015625, 7.16650390625, 7.4228515625, 7.67919921875, 7.935546875, 8.19189453125, 8.4482421875, 8.70458984375, 8.9609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 12.0, 12.0, 9.0, 10.0, 11.0, 20.0, 34.0, 30.0, 61.0, 87.0, 121.0, 217.0, 293.0, 497.0, 1095.0, 9267.0, 2981498.0, 147223.0, 3147.0, 802.0, 429.0, 247.0, 158.0, 109.0, 86.0, 62.0, 37.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.46875, -21.783935546875, -21.09912109375, -20.414306640625, -19.7294921875, -19.044677734375, -18.35986328125, -17.675048828125, -16.990234375, -16.305419921875, -15.62060546875, -14.935791015625, -14.2509765625, -13.566162109375, -12.88134765625, -12.196533203125, -11.51171875, -10.826904296875, -10.14208984375, -9.457275390625, -8.7724609375, -8.087646484375, -7.40283203125, -6.718017578125, -6.033203125, -5.348388671875, -4.66357421875, -3.978759765625, -3.2939453125, -2.609130859375, -1.92431640625, -1.239501953125, -0.5546875, 0.130126953125, 0.81494140625, 1.499755859375, 2.1845703125, 2.869384765625, 3.55419921875, 4.239013671875, 4.923828125, 5.608642578125, 6.29345703125, 6.978271484375, 7.6630859375, 8.347900390625, 9.03271484375, 9.717529296875, 10.40234375, 11.087158203125, 11.77197265625, 12.456787109375, 13.1416015625, 13.826416015625, 14.51123046875, 15.196044921875, 15.880859375, 16.565673828125, 17.25048828125, 17.935302734375, 18.6201171875, 19.304931640625, 19.98974609375, 20.674560546875, 21.359375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 15.0, 34.0, 103.0, 142.0, 205.0, 192.0, 130.0, 88.0, 44.0, 18.0, 12.0, 3.0, 4.0], "bins": [-57.1346435546875, -56.117767333984375, -55.10089111328125, -54.08401107788086, -53.067134857177734, -52.05025863647461, -51.033382415771484, -50.01650619506836, -48.99962615966797, -47.982749938964844, -46.96587371826172, -45.94899368286133, -44.9321174621582, -43.91524124145508, -42.89836502075195, -41.88148880004883, -40.8646125793457, -39.84773635864258, -38.83086013793945, -37.81398010253906, -36.79710388183594, -35.78022766113281, -34.76335144042969, -33.74647521972656, -32.72959899902344, -31.712722778320312, -30.695844650268555, -29.67896842956543, -28.662090301513672, -27.645214080810547, -26.628337860107422, -25.611461639404297, -24.59458351135254, -23.577707290649414, -22.560829162597656, -21.54395294189453, -20.527076721191406, -19.51019859313965, -18.493322372436523, -17.476444244384766, -16.45956802368164, -15.4426908493042, -14.425813674926758, -13.408937454223633, -12.392060279846191, -11.37518310546875, -10.358306884765625, -9.341429710388184, -8.324552536010742, -7.307675361633301, -6.290798664093018, -5.273921966552734, -4.257044792175293, -3.2401676177978516, -2.2232909202575684, -1.2064142227172852, -0.18953657150268555, 0.8273403644561768, 1.844217300415039, 2.8610942363739014, 3.8779711723327637, 4.894848346710205, 5.911725044250488, 6.9286017417907715, 7.945478916168213]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 13.0, 14.0, 15.0, 19.0, 13.0, 24.0, 29.0, 26.0, 28.0, 24.0, 28.0, 37.0, 46.0, 36.0, 52.0, 39.0, 37.0, 37.0, 47.0, 41.0, 28.0, 38.0, 39.0, 34.0, 29.0, 26.0, 31.0, 19.0, 15.0, 19.0, 13.0, 17.0, 13.0, 5.0, 10.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.634201049804688, -22.898351669311523, -22.16250228881836, -21.426652908325195, -20.69080352783203, -19.9549560546875, -19.219104766845703, -18.483257293701172, -17.747407913208008, -17.011558532714844, -16.27570915222168, -15.539859771728516, -14.804011344909668, -14.068161964416504, -13.33231258392334, -12.596464157104492, -11.860613822937012, -11.124764442443848, -10.388915061950684, -9.653066635131836, -8.917217254638672, -8.181367874145508, -7.445518493652344, -6.709669589996338, -5.973820209503174, -5.23797082901001, -4.502121925354004, -3.76627254486084, -3.030423402786255, -2.29457426071167, -1.5587248802185059, -0.8228759765625, -0.08702659606933594, 0.6488226056098938, 1.3846718072891235, 2.120521068572998, 2.856370210647583, 3.592219352722168, 4.328068733215332, 5.063917636871338, 5.799767017364502, 6.535616397857666, 7.271465301513672, 8.007314682006836, 8.7431640625, 9.479013442993164, 10.214862823486328, 10.950711250305176, 11.68656063079834, 12.422410011291504, 13.158259391784668, 13.894107818603516, 14.62995719909668, 15.365806579589844, 16.101655960083008, 16.837505340576172, 17.573354721069336, 18.3092041015625, 19.045053482055664, 19.780902862548828, 20.516752243041992, 21.252601623535156, 21.988449096679688, 22.72429847717285, 23.460147857666016]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 14.0, 17.0, 17.0, 12.0, 17.0, 21.0, 25.0, 21.0, 33.0, 44.0, 42.0, 45.0, 40.0, 46.0, 55.0, 46.0, 47.0, 46.0, 50.0, 42.0, 37.0, 27.0, 36.0, 22.0, 26.0, 26.0, 18.0, 19.0, 12.0, 13.0, 20.0, 12.0, 10.0, 10.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20172119140625, -3.0909423828125, -2.98016357421875, -2.869384765625, -2.75860595703125, -2.6478271484375, -2.53704833984375, -2.42626953125, -2.31549072265625, -2.2047119140625, -2.09393310546875, -1.983154296875, -1.87237548828125, -1.7615966796875, -1.65081787109375, -1.5400390625, -1.42926025390625, -1.3184814453125, -1.20770263671875, -1.096923828125, -0.98614501953125, -0.8753662109375, -0.76458740234375, -0.65380859375, -0.54302978515625, -0.4322509765625, -0.32147216796875, -0.210693359375, -0.09991455078125, 0.0108642578125, 0.12164306640625, 0.232421875, 0.34320068359375, 0.4539794921875, 0.56475830078125, 0.675537109375, 0.78631591796875, 0.8970947265625, 1.00787353515625, 1.11865234375, 1.22943115234375, 1.3402099609375, 1.45098876953125, 1.561767578125, 1.67254638671875, 1.7833251953125, 1.89410400390625, 2.0048828125, 2.11566162109375, 2.2264404296875, 2.33721923828125, 2.447998046875, 2.55877685546875, 2.6695556640625, 2.78033447265625, 2.89111328125, 3.00189208984375, 3.1126708984375, 3.22344970703125, 3.334228515625, 3.44500732421875, 3.5557861328125, 3.66656494140625, 3.77734375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 11.0, 26.0, 26.0, 47.0, 53.0, 74.0, 117.0, 166.0, 315.0, 534.0, 1082.0, 2276.0, 5476.0, 19693.0, 511298.0, 3447242.0, 183814.0, 13588.0, 4378.0, 1870.0, 873.0, 465.0, 293.0, 166.0, 104.0, 72.0, 61.0, 36.0, 28.0, 17.0, 12.0, 12.0, 4.0, 16.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.15625, -12.8043212890625, -12.452392578125, -12.1004638671875, -11.74853515625, -11.3966064453125, -11.044677734375, -10.6927490234375, -10.3408203125, -9.9888916015625, -9.636962890625, -9.2850341796875, -8.93310546875, -8.5811767578125, -8.229248046875, -7.8773193359375, -7.525390625, -7.1734619140625, -6.821533203125, -6.4696044921875, -6.11767578125, -5.7657470703125, -5.413818359375, -5.0618896484375, -4.7099609375, -4.3580322265625, -4.006103515625, -3.6541748046875, -3.30224609375, -2.9503173828125, -2.598388671875, -2.2464599609375, -1.89453125, -1.5426025390625, -1.190673828125, -0.8387451171875, -0.48681640625, -0.1348876953125, 0.217041015625, 0.5689697265625, 0.9208984375, 1.2728271484375, 1.624755859375, 1.9766845703125, 2.32861328125, 2.6805419921875, 3.032470703125, 3.3843994140625, 3.736328125, 4.0882568359375, 4.440185546875, 4.7921142578125, 5.14404296875, 5.4959716796875, 5.847900390625, 6.1998291015625, 6.5517578125, 6.9036865234375, 7.255615234375, 7.6075439453125, 7.95947265625, 8.3114013671875, 8.663330078125, 9.0152587890625, 9.3671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 11.0, 12.0, 13.0, 25.0, 24.0, 58.0, 61.0, 77.0, 85.0, 123.0, 142.0, 208.0, 273.0, 392.0, 447.0, 487.0, 386.0, 319.0, 222.0, 171.0, 132.0, 93.0, 81.0, 62.0, 46.0, 35.0, 23.0, 13.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.06787109375, -3.9130859375, -3.75830078125, -3.603515625, -3.44873046875, -3.2939453125, -3.13916015625, -2.984375, -2.82958984375, -2.6748046875, -2.52001953125, -2.365234375, -2.21044921875, -2.0556640625, -1.90087890625, -1.74609375, -1.59130859375, -1.4365234375, -1.28173828125, -1.126953125, -0.97216796875, -0.8173828125, -0.66259765625, -0.5078125, -0.35302734375, -0.1982421875, -0.04345703125, 0.111328125, 0.26611328125, 0.4208984375, 0.57568359375, 0.73046875, 0.88525390625, 1.0400390625, 1.19482421875, 1.349609375, 1.50439453125, 1.6591796875, 1.81396484375, 1.96875, 2.12353515625, 2.2783203125, 2.43310546875, 2.587890625, 2.74267578125, 2.8974609375, 3.05224609375, 3.20703125, 3.36181640625, 3.5166015625, 3.67138671875, 3.826171875, 3.98095703125, 4.1357421875, 4.29052734375, 4.4453125, 4.60009765625, 4.7548828125, 4.90966796875, 5.064453125, 5.21923828125, 5.3740234375, 5.52880859375, 5.68359375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 12.0, 7.0, 22.0, 28.0, 48.0, 61.0, 85.0, 154.0, 246.0, 496.0, 1003.0, 2605.0, 9259.0, 86348.0, 3019085.0, 1025990.0, 38825.0, 5963.0, 1979.0, 918.0, 411.0, 266.0, 161.0, 88.0, 70.0, 42.0, 29.0, 22.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9140625, -12.5728759765625, -12.231689453125, -11.8905029296875, -11.54931640625, -11.2081298828125, -10.866943359375, -10.5257568359375, -10.1845703125, -9.8433837890625, -9.502197265625, -9.1610107421875, -8.81982421875, -8.4786376953125, -8.137451171875, -7.7962646484375, -7.455078125, -7.1138916015625, -6.772705078125, -6.4315185546875, -6.09033203125, -5.7491455078125, -5.407958984375, -5.0667724609375, -4.7255859375, -4.3843994140625, -4.043212890625, -3.7020263671875, -3.36083984375, -3.0196533203125, -2.678466796875, -2.3372802734375, -1.99609375, -1.6549072265625, -1.313720703125, -0.9725341796875, -0.63134765625, -0.2901611328125, 0.051025390625, 0.3922119140625, 0.7333984375, 1.0745849609375, 1.415771484375, 1.7569580078125, 2.09814453125, 2.4393310546875, 2.780517578125, 3.1217041015625, 3.462890625, 3.8040771484375, 4.145263671875, 4.4864501953125, 4.82763671875, 5.1688232421875, 5.510009765625, 5.8511962890625, 6.1923828125, 6.5335693359375, 6.874755859375, 7.2159423828125, 7.55712890625, 7.8983154296875, 8.239501953125, 8.5806884765625, 8.921875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 53.0, 312.0, 465.0, 137.0, 33.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.54766082763672, -120.54611206054688, -117.5445556640625, -114.54300689697266, -111.54145812988281, -108.53990173339844, -105.5383529663086, -102.53680419921875, -99.53524780273438, -96.53369903564453, -93.53214263916016, -90.53059387207031, -87.52904510498047, -84.5274887084961, -81.52593994140625, -78.52438354492188, -75.52284240722656, -72.52129364013672, -69.51973724365234, -66.5181884765625, -63.51663589477539, -60.51508331298828, -57.51353454589844, -54.51198196411133, -51.51042938232422, -48.50887680053711, -45.507328033447266, -42.505775451660156, -39.50422286987305, -36.50267028808594, -33.501121520996094, -30.499568939208984, -27.498016357421875, -24.4964656829834, -21.49491310119629, -18.493362426757812, -15.49181079864502, -12.490259170532227, -9.48870849609375, -6.487155914306641, -3.485605239868164, -0.4840538501739502, 2.5174975395202637, 5.519048690795898, 8.520600318908691, 11.522151947021484, 14.523702621459961, 17.52525520324707, 20.526805877685547, 23.528356552124023, 26.529909133911133, 29.53145980834961, 32.53301239013672, 35.53456115722656, 38.53611373901367, 41.53766632080078, 44.539215087890625, 47.540767669677734, 50.54231643676758, 53.54386901855469, 56.5454216003418, 59.546974182128906, 62.54852294921875, 65.55007934570312, 68.55162811279297]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 7.0, 15.0, 6.0, 11.0, 10.0, 17.0, 16.0, 21.0, 21.0, 34.0, 15.0, 35.0, 27.0, 28.0, 37.0, 37.0, 30.0, 39.0, 35.0, 29.0, 48.0, 43.0, 35.0, 41.0, 39.0, 30.0, 28.0, 36.0, 30.0, 25.0, 25.0, 24.0, 14.0, 15.0, 12.0, 15.0, 11.0, 12.0, 6.0, 10.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-21.14389419555664, -20.527685165405273, -19.911476135253906, -19.295265197753906, -18.67905616760254, -18.062847137451172, -17.446636199951172, -16.830427169799805, -16.214218139648438, -15.59800910949707, -14.981799125671387, -14.365589141845703, -13.749380111694336, -13.133171081542969, -12.516961097717285, -11.900751113891602, -11.284542083740234, -10.668333053588867, -10.052123069763184, -9.4359130859375, -8.819704055786133, -8.203495025634766, -7.587285041809082, -6.971075534820557, -6.354866027832031, -5.738656520843506, -5.1224470138549805, -4.506237506866455, -3.8900279998779297, -3.2738184928894043, -2.657608985900879, -2.0413994789123535, -1.4251899719238281, -0.8089804649353027, -0.19277095794677734, 0.42343854904174805, 1.0396480560302734, 1.6558575630187988, 2.272067070007324, 2.8882765769958496, 3.504486083984375, 4.1206955909729, 4.736905097961426, 5.353114604949951, 5.969324111938477, 6.585533618927002, 7.201743125915527, 7.817952632904053, 8.434162139892578, 9.050371170043945, 9.666581153869629, 10.282791137695312, 10.89900016784668, 11.515209197998047, 12.13141918182373, 12.747629165649414, 13.363838195800781, 13.980047225952148, 14.596257209777832, 15.212467193603516, 15.828676223754883, 16.44488525390625, 17.06109619140625, 17.677305221557617, 18.293514251708984]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 5.0, 8.0, 13.0, 17.0, 18.0, 23.0, 23.0, 32.0, 38.0, 28.0, 33.0, 49.0, 59.0, 43.0, 59.0, 57.0, 50.0, 54.0, 50.0, 45.0, 39.0, 38.0, 48.0, 24.0, 29.0, 23.0, 18.0, 19.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.099884033203125, -2.99859619140625, -2.897308349609375, -2.7960205078125, -2.694732666015625, -2.59344482421875, -2.492156982421875, -2.390869140625, -2.289581298828125, -2.18829345703125, -2.087005615234375, -1.9857177734375, -1.884429931640625, -1.78314208984375, -1.681854248046875, -1.58056640625, -1.479278564453125, -1.37799072265625, -1.276702880859375, -1.1754150390625, -1.074127197265625, -0.97283935546875, -0.871551513671875, -0.770263671875, -0.668975830078125, -0.56768798828125, -0.466400146484375, -0.3651123046875, -0.263824462890625, -0.16253662109375, -0.061248779296875, 0.0400390625, 0.141326904296875, 0.24261474609375, 0.343902587890625, 0.4451904296875, 0.546478271484375, 0.64776611328125, 0.749053955078125, 0.850341796875, 0.951629638671875, 1.05291748046875, 1.154205322265625, 1.2554931640625, 1.356781005859375, 1.45806884765625, 1.559356689453125, 1.66064453125, 1.761932373046875, 1.86322021484375, 1.964508056640625, 2.0657958984375, 2.167083740234375, 2.26837158203125, 2.369659423828125, 2.470947265625, 2.572235107421875, 2.67352294921875, 2.774810791015625, 2.8760986328125, 2.977386474609375, 3.07867431640625, 3.179962158203125, 3.28125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 10.0, 5.0, 8.0, 17.0, 11.0, 27.0, 60.0, 84.0, 116.0, 192.0, 277.0, 411.0, 639.0, 1125.0, 1806.0, 3001.0, 5433.0, 9860.0, 19505.0, 43727.0, 122384.0, 402828.0, 284987.0, 84734.0, 32958.0, 15175.0, 8073.0, 4439.0, 2553.0, 1571.0, 910.0, 554.0, 399.0, 247.0, 148.0, 90.0, 63.0, 35.0, 34.0, 13.0, 19.0, 7.0, 9.0, 9.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7116470336914062, -0.6869659423828125, -0.6622848510742188, -0.637603759765625, -0.6129226684570312, -0.5882415771484375, -0.5635604858398438, -0.53887939453125, -0.5141983032226562, -0.4895172119140625, -0.46483612060546875, -0.440155029296875, -0.41547393798828125, -0.3907928466796875, -0.36611175537109375, -0.3414306640625, -0.31674957275390625, -0.2920684814453125, -0.26738739013671875, -0.242706298828125, -0.21802520751953125, -0.1933441162109375, -0.16866302490234375, -0.14398193359375, -0.11930084228515625, -0.0946197509765625, -0.06993865966796875, -0.045257568359375, -0.02057647705078125, 0.0041046142578125, 0.02878570556640625, 0.053466796875, 0.07814788818359375, 0.1028289794921875, 0.12751007080078125, 0.152191162109375, 0.17687225341796875, 0.2015533447265625, 0.22623443603515625, 0.25091552734375, 0.27559661865234375, 0.3002777099609375, 0.32495880126953125, 0.349639892578125, 0.37432098388671875, 0.3990020751953125, 0.42368316650390625, 0.4483642578125, 0.47304534912109375, 0.4977264404296875, 0.5224075317382812, 0.547088623046875, 0.5717697143554688, 0.5964508056640625, 0.6211318969726562, 0.64581298828125, 0.6704940795898438, 0.6951751708984375, 0.7198562622070312, 0.744537353515625, 0.7692184448242188, 0.7938995361328125, 0.8185806274414062, 0.84326171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 18.0, 16.0, 17.0, 16.0, 12.0, 12.0, 19.0, 31.0, 33.0, 44.0, 51.0, 30.0, 41.0, 39.0, 52.0, 49.0, 1070.0, 38.0, 50.0, 47.0, 31.0, 38.0, 36.0, 32.0, 29.0, 30.0, 22.0, 27.0, 18.0, 7.0, 17.0, 11.0, 6.0, 6.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.33984375, -2.2772064208984375, -2.214569091796875, -2.1519317626953125, -2.08929443359375, -2.0266571044921875, -1.964019775390625, -1.9013824462890625, -1.8387451171875, -1.7761077880859375, -1.713470458984375, -1.6508331298828125, -1.58819580078125, -1.5255584716796875, -1.462921142578125, -1.4002838134765625, -1.337646484375, -1.2750091552734375, -1.212371826171875, -1.1497344970703125, -1.08709716796875, -1.0244598388671875, -0.961822509765625, -0.8991851806640625, -0.8365478515625, -0.7739105224609375, -0.711273193359375, -0.6486358642578125, -0.58599853515625, -0.5233612060546875, -0.460723876953125, -0.3980865478515625, -0.33544921875, -0.2728118896484375, -0.210174560546875, -0.1475372314453125, -0.08489990234375, -0.0222625732421875, 0.040374755859375, 0.1030120849609375, 0.1656494140625, 0.2282867431640625, 0.290924072265625, 0.3535614013671875, 0.41619873046875, 0.4788360595703125, 0.541473388671875, 0.6041107177734375, 0.666748046875, 0.7293853759765625, 0.792022705078125, 0.8546600341796875, 0.91729736328125, 0.9799346923828125, 1.042572021484375, 1.1052093505859375, 1.1678466796875, 1.2304840087890625, 1.293121337890625, 1.3557586669921875, 1.41839599609375, 1.4810333251953125, 1.543670654296875, 1.6063079833984375, 1.6689453125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 13.0, 9.0, 22.0, 33.0, 47.0, 69.0, 107.0, 144.0, 198.0, 283.0, 424.0, 630.0, 983.0, 1711.0, 3000.0, 5655.0, 12262.0, 30611.0, 100832.0, 623720.0, 1128978.0, 122917.0, 35879.0, 13728.0, 6422.0, 3326.0, 1815.0, 1153.0, 738.0, 429.0, 294.0, 203.0, 159.0, 76.0, 62.0, 43.0, 37.0, 28.0, 25.0, 13.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5236740112304688, -0.5068206787109375, -0.48996734619140625, -0.473114013671875, -0.45626068115234375, -0.4394073486328125, -0.42255401611328125, -0.40570068359375, -0.38884735107421875, -0.3719940185546875, -0.35514068603515625, -0.338287353515625, -0.32143402099609375, -0.3045806884765625, -0.28772735595703125, -0.2708740234375, -0.25402069091796875, -0.2371673583984375, -0.22031402587890625, -0.203460693359375, -0.18660736083984375, -0.1697540283203125, -0.15290069580078125, -0.13604736328125, -0.11919403076171875, -0.1023406982421875, -0.08548736572265625, -0.068634033203125, -0.05178070068359375, -0.0349273681640625, -0.01807403564453125, -0.001220703125, 0.01563262939453125, 0.0324859619140625, 0.04933929443359375, 0.066192626953125, 0.08304595947265625, 0.0998992919921875, 0.11675262451171875, 0.13360595703125, 0.15045928955078125, 0.1673126220703125, 0.18416595458984375, 0.201019287109375, 0.21787261962890625, 0.2347259521484375, 0.25157928466796875, 0.2684326171875, 0.28528594970703125, 0.3021392822265625, 0.31899261474609375, 0.335845947265625, 0.35269927978515625, 0.3695526123046875, 0.38640594482421875, 0.40325927734375, 0.42011260986328125, 0.4369659423828125, 0.45381927490234375, 0.470672607421875, 0.48752593994140625, 0.5043792724609375, 0.5212326049804688, 0.5380859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 15.0, 16.0, 15.0, 10.0, 22.0, 21.0, 37.0, 41.0, 90.0, 161.0, 186.0, 139.0, 55.0, 30.0, 21.0, 27.0, 18.0, 15.0, 16.0, 10.0, 8.0, 7.0, 1.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08339881896972656, -0.08110427856445312, -0.07880973815917969, -0.07651519775390625, -0.07422065734863281, -0.07192611694335938, -0.06963157653808594, -0.0673370361328125, -0.06504249572753906, -0.06274795532226562, -0.06045341491699219, -0.05815887451171875, -0.05586433410644531, -0.053569793701171875, -0.05127525329589844, -0.048980712890625, -0.04668617248535156, -0.044391632080078125, -0.04209709167480469, -0.03980255126953125, -0.03750801086425781, -0.035213470458984375, -0.03291893005371094, -0.0306243896484375, -0.028329849243164062, -0.026035308837890625, -0.023740768432617188, -0.02144622802734375, -0.019151687622070312, -0.016857147216796875, -0.014562606811523438, -0.01226806640625, -0.009973526000976562, -0.007678985595703125, -0.0053844451904296875, -0.00308990478515625, -0.0007953643798828125, 0.001499176025390625, 0.0037937164306640625, 0.0060882568359375, 0.008382797241210938, 0.010677337646484375, 0.012971878051757812, 0.01526641845703125, 0.017560958862304688, 0.019855499267578125, 0.022150039672851562, 0.024444580078125, 0.026739120483398438, 0.029033660888671875, 0.03132820129394531, 0.03362274169921875, 0.03591728210449219, 0.038211822509765625, 0.04050636291503906, 0.0428009033203125, 0.04509544372558594, 0.047389984130859375, 0.04968452453613281, 0.05197906494140625, 0.05427360534667969, 0.056568145751953125, 0.05886268615722656, 0.0611572265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 6.0, 11.0, 8.0, 14.0, 26.0, 26.0, 29.0, 48.0, 55.0, 74.0, 126.0, 212.0, 422.0, 2074.0, 1021993.0, 21895.0, 692.0, 274.0, 184.0, 86.0, 56.0, 48.0, 44.0, 40.0, 21.0, 17.0, 13.0, 12.0, 7.0, 7.0, 4.0, 6.0, 8.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1769256591796875, -1.131195068359375, -1.0854644775390625, -1.03973388671875, -0.9940032958984375, -0.948272705078125, -0.9025421142578125, -0.8568115234375, -0.8110809326171875, -0.765350341796875, -0.7196197509765625, -0.67388916015625, -0.6281585693359375, -0.582427978515625, -0.5366973876953125, -0.490966796875, -0.4452362060546875, -0.399505615234375, -0.3537750244140625, -0.30804443359375, -0.2623138427734375, -0.216583251953125, -0.1708526611328125, -0.1251220703125, -0.0793914794921875, -0.033660888671875, 0.0120697021484375, 0.05780029296875, 0.1035308837890625, 0.149261474609375, 0.1949920654296875, 0.24072265625, 0.2864532470703125, 0.332183837890625, 0.3779144287109375, 0.42364501953125, 0.4693756103515625, 0.515106201171875, 0.5608367919921875, 0.6065673828125, 0.6522979736328125, 0.698028564453125, 0.7437591552734375, 0.78948974609375, 0.8352203369140625, 0.880950927734375, 0.9266815185546875, 0.972412109375, 1.0181427001953125, 1.063873291015625, 1.1096038818359375, 1.15533447265625, 1.2010650634765625, 1.246795654296875, 1.2925262451171875, 1.3382568359375, 1.3839874267578125, 1.429718017578125, 1.4754486083984375, 1.52117919921875, 1.5669097900390625, 1.612640380859375, 1.6583709716796875, 1.7041015625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 48.0, 716.0, 239.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27755460143089294, -0.2641831934452057, -0.25081175565719604, -0.2374403476715088, -0.22406893968582153, -0.21069751679897308, -0.19732609391212463, -0.18395468592643738, -0.17058326303958893, -0.15721184015274048, -0.14384043216705322, -0.13046900928020477, -0.11709759384393692, -0.10372617840766907, -0.09035475552082062, -0.07698334008455276, -0.06361192464828491, -0.05024050921201706, -0.03686909005045891, -0.023497670888900757, -0.010126255452632904, 0.0032451599836349487, 0.0166165828704834, 0.02998799830675125, 0.043359413743019104, 0.05673082917928696, 0.07010224461555481, 0.08347366750240326, 0.09684508293867111, 0.11021649837493896, 0.12358792126178741, 0.13695934414863586, 0.15033072233200073, 0.16370214521884918, 0.17707355320453644, 0.1904449760913849, 0.20381638407707214, 0.2171878069639206, 0.23055922985076904, 0.2439306378364563, 0.25730204582214355, 0.2706734538078308, 0.28404489159584045, 0.2974162995815277, 0.31078770756721497, 0.3241591453552246, 0.33753055334091187, 0.3509019613265991, 0.36427339911460876, 0.377644807100296, 0.39101624488830566, 0.4043876528739929, 0.4177590608596802, 0.43113046884536743, 0.4445019066333771, 0.45787331461906433, 0.471244752407074, 0.48461616039276123, 0.4979875981807709, 0.5113589763641357, 0.5247304439544678, 0.538101851940155, 0.5514732599258423, 0.5648446679115295, 0.5782160758972168]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 11.0, 24.0, 19.0, 19.0, 25.0, 28.0, 31.0, 34.0, 32.0, 34.0, 38.0, 41.0, 39.0, 60.0, 45.0, 47.0, 48.0, 41.0, 37.0, 34.0, 44.0, 28.0, 29.0, 21.0, 20.0, 25.0, 20.0, 13.0, 13.0, 15.0, 16.0, 8.0, 4.0, 10.0, 6.0, 7.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-0.09314745664596558, -0.09059496223926544, -0.0880424752831459, -0.08548998087644577, -0.08293749392032623, -0.0803849995136261, -0.07783250510692596, -0.07528001070022583, -0.07272752374410629, -0.07017502933740616, -0.06762254238128662, -0.06507004797458649, -0.06251755356788635, -0.059965066611766815, -0.05741257220506668, -0.054860081523656845, -0.05230759084224701, -0.04975510016083717, -0.04720260947942734, -0.0446501150727272, -0.04209762439131737, -0.03954513370990753, -0.0369926393032074, -0.03444014862179756, -0.031887657940387726, -0.02933516725897789, -0.026782674714922905, -0.02423018217086792, -0.021677691489458084, -0.01912520080804825, -0.016572708263993263, -0.014020215719938278, -0.011467725038528442, -0.008915233425796032, -0.0063627418130636215, -0.003810250200331211, -0.0012577585875988007, 0.0012947330251336098, 0.00384722463786602, 0.006399717181921005, 0.008952207863330841, 0.011504699476063251, 0.014057191088795662, 0.016609683632850647, 0.019162174314260483, 0.02171466499567032, 0.024267157539725304, 0.02681965008378029, 0.029372140765190125, 0.03192463144659996, 0.034477122128009796, 0.03702961653470993, 0.039582107216119766, 0.0421345978975296, 0.044687092304229736, 0.04723958298563957, 0.04979207366704941, 0.052344564348459244, 0.05489705502986908, 0.057449549436569214, 0.06000204011797905, 0.06255453079938889, 0.06510702520608902, 0.06765951216220856, 0.07021200656890869]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 11.0, 8.0, 15.0, 17.0, 14.0, 17.0, 30.0, 21.0, 27.0, 32.0, 38.0, 42.0, 38.0, 51.0, 50.0, 60.0, 56.0, 53.0, 53.0, 39.0, 48.0, 39.0, 45.0, 39.0, 27.0, 25.0, 23.0, 15.0, 12.0, 15.0, 10.0, 11.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.443359375, -3.34259033203125, -3.2418212890625, -3.14105224609375, -3.040283203125, -2.93951416015625, -2.8387451171875, -2.73797607421875, -2.63720703125, -2.53643798828125, -2.4356689453125, -2.33489990234375, -2.234130859375, -2.13336181640625, -2.0325927734375, -1.93182373046875, -1.8310546875, -1.73028564453125, -1.6295166015625, -1.52874755859375, -1.427978515625, -1.32720947265625, -1.2264404296875, -1.12567138671875, -1.02490234375, -0.92413330078125, -0.8233642578125, -0.72259521484375, -0.621826171875, -0.52105712890625, -0.4202880859375, -0.31951904296875, -0.21875, -0.11798095703125, -0.0172119140625, 0.08355712890625, 0.184326171875, 0.28509521484375, 0.3858642578125, 0.48663330078125, 0.58740234375, 0.68817138671875, 0.7889404296875, 0.88970947265625, 0.990478515625, 1.09124755859375, 1.1920166015625, 1.29278564453125, 1.3935546875, 1.49432373046875, 1.5950927734375, 1.69586181640625, 1.796630859375, 1.89739990234375, 1.9981689453125, 2.09893798828125, 2.19970703125, 2.30047607421875, 2.4012451171875, 2.50201416015625, 2.602783203125, 2.70355224609375, 2.8043212890625, 2.90509033203125, 3.005859375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 9.0, 6.0, 8.0, 14.0, 18.0, 33.0, 41.0, 69.0, 78.0, 95.0, 167.0, 250.0, 374.0, 569.0, 905.0, 1574.0, 2725.0, 5337.0, 11255.0, 27577.0, 83778.0, 291965.0, 411097.0, 137682.0, 41363.0, 15774.0, 7082.0, 3625.0, 1993.0, 1104.0, 688.0, 433.0, 253.0, 182.0, 134.0, 85.0, 64.0, 34.0, 33.0, 27.0, 19.0, 6.0, 13.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.056640625, -2.967254638671875, -2.87786865234375, -2.788482666015625, -2.6990966796875, -2.609710693359375, -2.52032470703125, -2.430938720703125, -2.341552734375, -2.252166748046875, -2.16278076171875, -2.073394775390625, -1.9840087890625, -1.894622802734375, -1.80523681640625, -1.715850830078125, -1.62646484375, -1.537078857421875, -1.44769287109375, -1.358306884765625, -1.2689208984375, -1.179534912109375, -1.09014892578125, -1.000762939453125, -0.911376953125, -0.821990966796875, -0.73260498046875, -0.643218994140625, -0.5538330078125, -0.464447021484375, -0.37506103515625, -0.285675048828125, -0.1962890625, -0.106903076171875, -0.01751708984375, 0.071868896484375, 0.1612548828125, 0.250640869140625, 0.34002685546875, 0.429412841796875, 0.518798828125, 0.608184814453125, 0.69757080078125, 0.786956787109375, 0.8763427734375, 0.965728759765625, 1.05511474609375, 1.144500732421875, 1.23388671875, 1.323272705078125, 1.41265869140625, 1.502044677734375, 1.5914306640625, 1.680816650390625, 1.77020263671875, 1.859588623046875, 1.948974609375, 2.038360595703125, 2.12774658203125, 2.217132568359375, 2.3065185546875, 2.395904541015625, 2.48529052734375, 2.574676513671875, 2.6640625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 12.0, 17.0, 19.0, 18.0, 23.0, 22.0, 25.0, 35.0, 30.0, 50.0, 70.0, 65.0, 151.0, 342.0, 1516.0, 173.0, 88.0, 59.0, 47.0, 44.0, 38.0, 31.0, 25.0, 30.0, 20.0, 17.0, 20.0, 8.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.81170654296875, -7.5609130859375, -7.31011962890625, -7.059326171875, -6.80853271484375, -6.5577392578125, -6.30694580078125, -6.05615234375, -5.80535888671875, -5.5545654296875, -5.30377197265625, -5.052978515625, -4.80218505859375, -4.5513916015625, -4.30059814453125, -4.0498046875, -3.79901123046875, -3.5482177734375, -3.29742431640625, -3.046630859375, -2.79583740234375, -2.5450439453125, -2.29425048828125, -2.04345703125, -1.79266357421875, -1.5418701171875, -1.29107666015625, -1.040283203125, -0.78948974609375, -0.5386962890625, -0.28790283203125, -0.037109375, 0.21368408203125, 0.4644775390625, 0.71527099609375, 0.966064453125, 1.21685791015625, 1.4676513671875, 1.71844482421875, 1.96923828125, 2.22003173828125, 2.4708251953125, 2.72161865234375, 2.972412109375, 3.22320556640625, 3.4739990234375, 3.72479248046875, 3.9755859375, 4.22637939453125, 4.4771728515625, 4.72796630859375, 4.978759765625, 5.22955322265625, 5.4803466796875, 5.73114013671875, 5.98193359375, 6.23272705078125, 6.4835205078125, 6.73431396484375, 6.985107421875, 7.23590087890625, 7.4866943359375, 7.73748779296875, 7.98828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 7.0, 8.0, 9.0, 14.0, 17.0, 33.0, 32.0, 33.0, 61.0, 83.0, 95.0, 192.0, 281.0, 517.0, 1243.0, 49335.0, 3087497.0, 4384.0, 786.0, 393.0, 213.0, 133.0, 96.0, 60.0, 39.0, 36.0, 31.0, 20.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.671142578125, -16.17041015625, -15.669677734375, -15.1689453125, -14.668212890625, -14.16748046875, -13.666748046875, -13.166015625, -12.665283203125, -12.16455078125, -11.663818359375, -11.1630859375, -10.662353515625, -10.16162109375, -9.660888671875, -9.16015625, -8.659423828125, -8.15869140625, -7.657958984375, -7.1572265625, -6.656494140625, -6.15576171875, -5.655029296875, -5.154296875, -4.653564453125, -4.15283203125, -3.652099609375, -3.1513671875, -2.650634765625, -2.14990234375, -1.649169921875, -1.1484375, -0.647705078125, -0.14697265625, 0.353759765625, 0.8544921875, 1.355224609375, 1.85595703125, 2.356689453125, 2.857421875, 3.358154296875, 3.85888671875, 4.359619140625, 4.8603515625, 5.361083984375, 5.86181640625, 6.362548828125, 6.86328125, 7.364013671875, 7.86474609375, 8.365478515625, 8.8662109375, 9.366943359375, 9.86767578125, 10.368408203125, 10.869140625, 11.369873046875, 11.87060546875, 12.371337890625, 12.8720703125, 13.372802734375, 13.87353515625, 14.374267578125, 14.875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 88.0, 791.0, 132.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.147857666015625, -21.607765197753906, -19.06767463684082, -16.5275821685791, -13.9874906539917, -11.447399139404297, -8.907306671142578, -6.367216110229492, -3.8271236419677734, -1.287031888961792, 1.2530598640441895, 3.79315185546875, 6.333243370056152, 8.873334884643555, 11.413427352905273, 13.95351791381836, 16.493610382080078, 19.033702850341797, 21.573793411254883, 24.1138858795166, 26.653976440429688, 29.194068908691406, 31.734161376953125, 34.274253845214844, 36.81434631347656, 39.35443878173828, 41.89453125, 44.43462371826172, 46.97471237182617, 49.51480484008789, 52.05489730834961, 54.59498596191406, 57.13507843017578, 59.6751708984375, 62.21526336669922, 64.75535583496094, 67.29544830322266, 69.83554077148438, 72.37562561035156, 74.91571807861328, 77.455810546875, 79.99590301513672, 82.53599548339844, 85.07608795166016, 87.61618041992188, 90.15626525878906, 92.69636535644531, 95.2364501953125, 97.77655029296875, 100.31664276123047, 102.85673522949219, 105.3968276977539, 107.93692016601562, 110.47700500488281, 113.01710510253906, 115.55718994140625, 118.09728240966797, 120.63737487792969, 123.1774673461914, 125.71755981445312, 128.2576446533203, 130.79774475097656, 133.33782958984375, 135.8779296875, 138.4180145263672]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 5.0, 3.0, 5.0, 21.0, 10.0, 7.0, 16.0, 32.0, 20.0, 24.0, 34.0, 34.0, 40.0, 41.0, 44.0, 57.0, 45.0, 48.0, 32.0, 56.0, 46.0, 42.0, 42.0, 42.0, 37.0, 39.0, 31.0, 22.0, 22.0, 21.0, 15.0, 13.0, 9.0, 9.0, 7.0, 4.0, 8.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.396127700805664, -14.830148696899414, -14.264169692993164, -13.698189735412598, -13.132210731506348, -12.566231727600098, -12.000251770019531, -11.434272766113281, -10.868293762207031, -10.302314758300781, -9.736335754394531, -9.170355796813965, -8.604376792907715, -8.038397789001465, -7.472418308258057, -6.906438827514648, -6.340459823608398, -5.774480819702148, -5.20850133895874, -4.642521858215332, -4.076542854309082, -3.510563611984253, -2.944584369659424, -2.3786051273345947, -1.8126258850097656, -1.2466466426849365, -0.6806674003601074, -0.11468815803527832, 0.4512910842895508, 1.0172703266143799, 1.583249568939209, 2.149228811264038, 2.7152099609375, 3.281189203262329, 3.847168445587158, 4.413147926330566, 4.979126930236816, 5.545105934143066, 6.111085414886475, 6.677064895629883, 7.243043899536133, 7.809022903442383, 8.375001907348633, 8.9409818649292, 9.50696086883545, 10.0729398727417, 10.638919830322266, 11.204898834228516, 11.770877838134766, 12.336856842041016, 12.902835845947266, 13.468815803527832, 14.034794807434082, 14.600773811340332, 15.166753768920898, 15.732732772827148, 16.2987117767334, 16.86469078063965, 17.4306697845459, 17.99664878845215, 18.56262969970703, 19.12860870361328, 19.69458770751953, 20.26056671142578, 20.82654571533203]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 18.0, 15.0, 14.0, 20.0, 22.0, 30.0, 31.0, 46.0, 37.0, 35.0, 34.0, 53.0, 51.0, 47.0, 36.0, 31.0, 52.0, 34.0, 34.0, 47.0, 39.0, 36.0, 28.0, 30.0, 28.0, 19.0, 19.0, 13.0, 12.0, 15.0, 12.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.12890625, -3.03179931640625, -2.9346923828125, -2.83758544921875, -2.740478515625, -2.64337158203125, -2.5462646484375, -2.44915771484375, -2.35205078125, -2.25494384765625, -2.1578369140625, -2.06072998046875, -1.963623046875, -1.86651611328125, -1.7694091796875, -1.67230224609375, -1.5751953125, -1.47808837890625, -1.3809814453125, -1.28387451171875, -1.186767578125, -1.08966064453125, -0.9925537109375, -0.89544677734375, -0.79833984375, -0.70123291015625, -0.6041259765625, -0.50701904296875, -0.409912109375, -0.31280517578125, -0.2156982421875, -0.11859130859375, -0.021484375, 0.07562255859375, 0.1727294921875, 0.26983642578125, 0.366943359375, 0.46405029296875, 0.5611572265625, 0.65826416015625, 0.75537109375, 0.85247802734375, 0.9495849609375, 1.04669189453125, 1.143798828125, 1.24090576171875, 1.3380126953125, 1.43511962890625, 1.5322265625, 1.62933349609375, 1.7264404296875, 1.82354736328125, 1.920654296875, 2.01776123046875, 2.1148681640625, 2.21197509765625, 2.30908203125, 2.40618896484375, 2.5032958984375, 2.60040283203125, 2.697509765625, 2.79461669921875, 2.8917236328125, 2.98883056640625, 3.0859375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 5.0, 7.0, 19.0, 22.0, 26.0, 40.0, 50.0, 74.0, 98.0, 113.0, 173.0, 213.0, 292.0, 366.0, 518.0, 841.0, 1391.0, 3111.0, 8229.0, 33605.0, 969166.0, 3073720.0, 79142.0, 13253.0, 4460.0, 1955.0, 1020.0, 658.0, 450.0, 332.0, 235.0, 165.0, 139.0, 100.0, 60.0, 65.0, 39.0, 35.0, 24.0, 14.0, 9.0, 14.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.375, -13.928466796875, -13.48193359375, -13.035400390625, -12.5888671875, -12.142333984375, -11.69580078125, -11.249267578125, -10.802734375, -10.356201171875, -9.90966796875, -9.463134765625, -9.0166015625, -8.570068359375, -8.12353515625, -7.677001953125, -7.23046875, -6.783935546875, -6.33740234375, -5.890869140625, -5.4443359375, -4.997802734375, -4.55126953125, -4.104736328125, -3.658203125, -3.211669921875, -2.76513671875, -2.318603515625, -1.8720703125, -1.425537109375, -0.97900390625, -0.532470703125, -0.0859375, 0.360595703125, 0.80712890625, 1.253662109375, 1.7001953125, 2.146728515625, 2.59326171875, 3.039794921875, 3.486328125, 3.932861328125, 4.37939453125, 4.825927734375, 5.2724609375, 5.718994140625, 6.16552734375, 6.612060546875, 7.05859375, 7.505126953125, 7.95166015625, 8.398193359375, 8.8447265625, 9.291259765625, 9.73779296875, 10.184326171875, 10.630859375, 11.077392578125, 11.52392578125, 11.970458984375, 12.4169921875, 12.863525390625, 13.31005859375, 13.756591796875, 14.203125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 9.0, 11.0, 21.0, 13.0, 31.0, 46.0, 74.0, 143.0, 195.0, 335.0, 581.0, 730.0, 683.0, 442.0, 286.0, 160.0, 112.0, 59.0, 41.0, 31.0, 23.0, 16.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.08966064453125, -5.8629150390625, -5.63616943359375, -5.409423828125, -5.18267822265625, -4.9559326171875, -4.72918701171875, -4.50244140625, -4.27569580078125, -4.0489501953125, -3.82220458984375, -3.595458984375, -3.36871337890625, -3.1419677734375, -2.91522216796875, -2.6884765625, -2.46173095703125, -2.2349853515625, -2.00823974609375, -1.781494140625, -1.55474853515625, -1.3280029296875, -1.10125732421875, -0.87451171875, -0.64776611328125, -0.4210205078125, -0.19427490234375, 0.032470703125, 0.25921630859375, 0.4859619140625, 0.71270751953125, 0.939453125, 1.16619873046875, 1.3929443359375, 1.61968994140625, 1.846435546875, 2.07318115234375, 2.2999267578125, 2.52667236328125, 2.75341796875, 2.98016357421875, 3.2069091796875, 3.43365478515625, 3.660400390625, 3.88714599609375, 4.1138916015625, 4.34063720703125, 4.5673828125, 4.79412841796875, 5.0208740234375, 5.24761962890625, 5.474365234375, 5.70111083984375, 5.9278564453125, 6.15460205078125, 6.38134765625, 6.60809326171875, 6.8348388671875, 7.06158447265625, 7.288330078125, 7.51507568359375, 7.7418212890625, 7.96856689453125, 8.1953125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 26.0, 34.0, 97.0, 227.0, 639.0, 2397.0, 12262.0, 136039.0, 3671862.0, 345138.0, 20665.0, 3483.0, 886.0, 284.0, 121.0, 59.0, 16.0, 12.0, 5.0, 4.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.3397216796875, -13.937255859375, -13.5347900390625, -13.13232421875, -12.7298583984375, -12.327392578125, -11.9249267578125, -11.5224609375, -11.1199951171875, -10.717529296875, -10.3150634765625, -9.91259765625, -9.5101318359375, -9.107666015625, -8.7052001953125, -8.302734375, -7.9002685546875, -7.497802734375, -7.0953369140625, -6.69287109375, -6.2904052734375, -5.887939453125, -5.4854736328125, -5.0830078125, -4.6805419921875, -4.278076171875, -3.8756103515625, -3.47314453125, -3.0706787109375, -2.668212890625, -2.2657470703125, -1.86328125, -1.4608154296875, -1.058349609375, -0.6558837890625, -0.25341796875, 0.1490478515625, 0.551513671875, 0.9539794921875, 1.3564453125, 1.7589111328125, 2.161376953125, 2.5638427734375, 2.96630859375, 3.3687744140625, 3.771240234375, 4.1737060546875, 4.576171875, 4.9786376953125, 5.381103515625, 5.7835693359375, 6.18603515625, 6.5885009765625, 6.990966796875, 7.3934326171875, 7.7958984375, 8.1983642578125, 8.600830078125, 9.0032958984375, 9.40576171875, 9.8082275390625, 10.210693359375, 10.6131591796875, 11.015625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 3.0, 14.0, 20.0, 41.0, 64.0, 88.0, 95.0, 96.0, 124.0, 106.0, 105.0, 82.0, 48.0, 29.0, 33.0, 14.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.936784744262695, -19.583702087402344, -18.230619430541992, -16.87753677368164, -15.524456024169922, -14.17137336730957, -12.818290710449219, -11.465209007263184, -10.112126350402832, -8.75904369354248, -7.405961990356445, -6.052879333496094, -4.6997971534729, -3.346714973449707, -1.9936323165893555, -0.6405506134033203, 0.7125320434570312, 2.0656142234802246, 3.418696641921997, 4.7717790603637695, 6.124861240386963, 7.477943420410156, 8.831026077270508, 10.184107780456543, 11.537190437316895, 12.890273094177246, 14.243354797363281, 15.596437454223633, 16.949520111083984, 18.302600860595703, 19.655685424804688, 21.008766174316406, 22.36185073852539, 23.714933395385742, 25.068016052246094, 26.421096801757812, 27.774179458618164, 29.127262115478516, 30.480344772338867, 31.83342742919922, 33.18650817871094, 34.539588928222656, 35.89267349243164, 37.24575424194336, 38.598838806152344, 39.95191955566406, 41.30500030517578, 42.658084869384766, 44.01116943359375, 45.36425018310547, 46.71733474731445, 48.07041549682617, 49.423500061035156, 50.776580810546875, 52.129661560058594, 53.48274612426758, 54.8358268737793, 56.188907623291016, 57.5419921875, 58.89507293701172, 60.2481575012207, 61.60123825073242, 62.954322814941406, 64.30740356445312, 65.66048431396484]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 11.0, 12.0, 16.0, 17.0, 13.0, 26.0, 16.0, 27.0, 31.0, 34.0, 37.0, 47.0, 41.0, 44.0, 43.0, 43.0, 55.0, 34.0, 48.0, 33.0, 34.0, 40.0, 29.0, 31.0, 37.0, 34.0, 22.0, 16.0, 23.0, 10.0, 10.0, 12.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.79792594909668, -19.13520050048828, -18.47247314453125, -17.80974578857422, -17.14702033996582, -16.484294891357422, -15.82156753540039, -15.158841133117676, -14.496114730834961, -13.833388328552246, -13.170661926269531, -12.507935523986816, -11.845209121704102, -11.182482719421387, -10.519756317138672, -9.857029914855957, -9.194303512573242, -8.531577110290527, -7.8688507080078125, -7.206124305725098, -6.543397903442383, -5.880671501159668, -5.217945098876953, -4.555218696594238, -3.8924922943115234, -3.2297658920288086, -2.5670394897460938, -1.904313087463379, -1.241586685180664, -0.5788602828979492, 0.08386611938476562, 0.7465925216674805, 1.4093189239501953, 2.07204532623291, 2.734771728515625, 3.39749813079834, 4.060224533081055, 4.7229509353637695, 5.385677337646484, 6.048403739929199, 6.711130142211914, 7.373856544494629, 8.036582946777344, 8.699309349060059, 9.362035751342773, 10.024762153625488, 10.687488555908203, 11.350214958190918, 12.012941360473633, 12.675667762756348, 13.338394165039062, 14.001120567321777, 14.663846969604492, 15.326573371887207, 15.989299774169922, 16.652027130126953, 17.31475257873535, 17.97747802734375, 18.64020538330078, 19.302932739257812, 19.96565818786621, 20.62838363647461, 21.29111099243164, 21.953838348388672, 22.61656379699707]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 10.0, 22.0, 20.0, 20.0, 25.0, 26.0, 34.0, 40.0, 29.0, 41.0, 43.0, 51.0, 49.0, 60.0, 56.0, 58.0, 48.0, 43.0, 33.0, 43.0, 33.0, 34.0, 27.0, 21.0, 20.0, 15.0, 18.0, 13.0, 8.0, 9.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.81884765625, -45.2001953125, -43.58154296875, -41.962890625, -40.34423828125, -38.7255859375, -37.10693359375, -35.48828125, -33.86962890625, -32.2509765625, -30.63232421875, -29.013671875, -27.39501953125, -25.7763671875, -24.15771484375, -22.5390625, -20.92041015625, -19.3017578125, -17.68310546875, -16.064453125, -14.44580078125, -12.8271484375, -11.20849609375, -9.58984375, -7.97119140625, -6.3525390625, -4.73388671875, -3.115234375, -1.49658203125, 0.1220703125, 1.74072265625, 3.359375, 4.97802734375, 6.5966796875, 8.21533203125, 9.833984375, 11.45263671875, 13.0712890625, 14.68994140625, 16.30859375, 17.92724609375, 19.5458984375, 21.16455078125, 22.783203125, 24.40185546875, 26.0205078125, 27.63916015625, 29.2578125, 30.87646484375, 32.4951171875, 34.11376953125, 35.732421875, 37.35107421875, 38.9697265625, 40.58837890625, 42.20703125, 43.82568359375, 45.4443359375, 47.06298828125, 48.681640625, 50.30029296875, 51.9189453125, 53.53759765625, 55.15625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 24.0, 32.0, 53.0, 65.0, 103.0, 131.0, 215.0, 332.0, 467.0, 612.0, 926.0, 1371.0, 2107.0, 3306.0, 5035.0, 7847.0, 12210.0, 19513.0, 31071.0, 49947.0, 80042.0, 127820.0, 189079.0, 185208.0, 123221.0, 76773.0, 48549.0, 30078.0, 18694.0, 11881.0, 7554.0, 4762.0, 3141.0, 2128.0, 1383.0, 927.0, 613.0, 410.0, 270.0, 186.0, 149.0, 92.0, 60.0, 46.0, 33.0, 25.0, 15.0, 15.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.409027099609375, -1.36199951171875, -1.314971923828125, -1.2679443359375, -1.220916748046875, -1.17388916015625, -1.126861572265625, -1.079833984375, -1.032806396484375, -0.98577880859375, -0.938751220703125, -0.8917236328125, -0.844696044921875, -0.79766845703125, -0.750640869140625, -0.70361328125, -0.656585693359375, -0.60955810546875, -0.562530517578125, -0.5155029296875, -0.468475341796875, -0.42144775390625, -0.374420166015625, -0.327392578125, -0.280364990234375, -0.23333740234375, -0.186309814453125, -0.1392822265625, -0.092254638671875, -0.04522705078125, 0.001800537109375, 0.048828125, 0.095855712890625, 0.14288330078125, 0.189910888671875, 0.2369384765625, 0.283966064453125, 0.33099365234375, 0.378021240234375, 0.425048828125, 0.472076416015625, 0.51910400390625, 0.566131591796875, 0.6131591796875, 0.660186767578125, 0.70721435546875, 0.754241943359375, 0.80126953125, 0.848297119140625, 0.89532470703125, 0.942352294921875, 0.9893798828125, 1.036407470703125, 1.08343505859375, 1.130462646484375, 1.177490234375, 1.224517822265625, 1.27154541015625, 1.318572998046875, 1.3656005859375, 1.412628173828125, 1.45965576171875, 1.506683349609375, 1.5537109375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 10.0, 13.0, 12.0, 23.0, 16.0, 27.0, 18.0, 24.0, 30.0, 42.0, 40.0, 38.0, 46.0, 36.0, 46.0, 40.0, 1062.0, 46.0, 37.0, 36.0, 37.0, 37.0, 42.0, 26.0, 31.0, 31.0, 22.0, 23.0, 27.0, 15.0, 14.0, 12.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.078125, -28.218505859375, -27.35888671875, -26.499267578125, -25.6396484375, -24.780029296875, -23.92041015625, -23.060791015625, -22.201171875, -21.341552734375, -20.48193359375, -19.622314453125, -18.7626953125, -17.903076171875, -17.04345703125, -16.183837890625, -15.32421875, -14.464599609375, -13.60498046875, -12.745361328125, -11.8857421875, -11.026123046875, -10.16650390625, -9.306884765625, -8.447265625, -7.587646484375, -6.72802734375, -5.868408203125, -5.0087890625, -4.149169921875, -3.28955078125, -2.429931640625, -1.5703125, -0.710693359375, 0.14892578125, 1.008544921875, 1.8681640625, 2.727783203125, 3.58740234375, 4.447021484375, 5.306640625, 6.166259765625, 7.02587890625, 7.885498046875, 8.7451171875, 9.604736328125, 10.46435546875, 11.323974609375, 12.18359375, 13.043212890625, 13.90283203125, 14.762451171875, 15.6220703125, 16.481689453125, 17.34130859375, 18.200927734375, 19.060546875, 19.920166015625, 20.77978515625, 21.639404296875, 22.4990234375, 23.358642578125, 24.21826171875, 25.077880859375, 25.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 17.0, 31.0, 41.0, 72.0, 111.0, 174.0, 271.0, 362.0, 574.0, 896.0, 1350.0, 2141.0, 3227.0, 4941.0, 7400.0, 11538.0, 17318.0, 26223.0, 40243.0, 60883.0, 92070.0, 140712.0, 1173072.0, 199507.0, 106519.0, 70916.0, 46974.0, 30595.0, 20261.0, 13395.0, 8761.0, 5805.0, 3790.0, 2330.0, 1548.0, 1067.0, 695.0, 438.0, 304.0, 184.0, 122.0, 70.0, 57.0, 43.0, 20.0, 12.0, 15.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.220703125, -1.1795806884765625, -1.138458251953125, -1.0973358154296875, -1.05621337890625, -1.0150909423828125, -0.973968505859375, -0.9328460693359375, -0.8917236328125, -0.8506011962890625, -0.809478759765625, -0.7683563232421875, -0.72723388671875, -0.6861114501953125, -0.644989013671875, -0.6038665771484375, -0.562744140625, -0.5216217041015625, -0.480499267578125, -0.4393768310546875, -0.39825439453125, -0.3571319580078125, -0.316009521484375, -0.2748870849609375, -0.2337646484375, -0.1926422119140625, -0.151519775390625, -0.1103973388671875, -0.06927490234375, -0.0281524658203125, 0.012969970703125, 0.0540924072265625, 0.09521484375, 0.1363372802734375, 0.177459716796875, 0.2185821533203125, 0.25970458984375, 0.3008270263671875, 0.341949462890625, 0.3830718994140625, 0.4241943359375, 0.4653167724609375, 0.506439208984375, 0.5475616455078125, 0.58868408203125, 0.6298065185546875, 0.670928955078125, 0.7120513916015625, 0.753173828125, 0.7942962646484375, 0.835418701171875, 0.8765411376953125, 0.91766357421875, 0.9587860107421875, 0.999908447265625, 1.0410308837890625, 1.0821533203125, 1.1232757568359375, 1.164398193359375, 1.2055206298828125, 1.24664306640625, 1.2877655029296875, 1.328887939453125, 1.3700103759765625, 1.4111328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 13.0, 10.0, 8.0, 18.0, 12.0, 16.0, 19.0, 19.0, 25.0, 34.0, 27.0, 49.0, 51.0, 42.0, 64.0, 54.0, 50.0, 62.0, 55.0, 48.0, 43.0, 40.0, 30.0, 25.0, 22.0, 26.0, 12.0, 14.0, 13.0, 13.0, 12.0, 10.0, 5.0, 10.0, 6.0, 3.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.027862548828125, -0.027006864547729492, -0.026151180267333984, -0.025295495986938477, -0.02443981170654297, -0.02358412742614746, -0.022728443145751953, -0.021872758865356445, -0.021017074584960938, -0.02016139030456543, -0.019305706024169922, -0.018450021743774414, -0.017594337463378906, -0.0167386531829834, -0.01588296890258789, -0.015027284622192383, -0.014171600341796875, -0.013315916061401367, -0.01246023178100586, -0.011604547500610352, -0.010748863220214844, -0.009893178939819336, -0.009037494659423828, -0.00818181037902832, -0.0073261260986328125, -0.006470441818237305, -0.005614757537841797, -0.004759073257446289, -0.0039033889770507812, -0.0030477046966552734, -0.0021920204162597656, -0.0013363361358642578, -0.00048065185546875, 0.0003750324249267578, 0.0012307167053222656, 0.0020864009857177734, 0.0029420852661132812, 0.003797769546508789, 0.004653453826904297, 0.005509138107299805, 0.0063648223876953125, 0.00722050666809082, 0.008076190948486328, 0.008931875228881836, 0.009787559509277344, 0.010643243789672852, 0.01149892807006836, 0.012354612350463867, 0.013210296630859375, 0.014065980911254883, 0.01492166519165039, 0.0157773494720459, 0.016633033752441406, 0.017488718032836914, 0.018344402313232422, 0.01920008659362793, 0.020055770874023438, 0.020911455154418945, 0.021767139434814453, 0.02262282371520996, 0.02347850799560547, 0.024334192276000977, 0.025189876556396484, 0.026045560836791992, 0.0269012451171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 11.0, 18.0, 29.0, 41.0, 67.0, 78.0, 133.0, 160.0, 286.0, 484.0, 819.0, 1410.0, 2950.0, 6612.0, 16926.0, 52741.0, 200815.0, 475048.0, 205228.0, 54140.0, 17193.0, 6655.0, 3048.0, 1468.0, 818.0, 468.0, 298.0, 182.0, 121.0, 97.0, 48.0, 37.0, 29.0, 25.0, 18.0, 10.0, 7.0, 5.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1968212127685547, -0.19015121459960938, -0.18348121643066406, -0.17681121826171875, -0.17014122009277344, -0.16347122192382812, -0.1568012237548828, -0.1501312255859375, -0.1434612274169922, -0.13679122924804688, -0.13012123107910156, -0.12345123291015625, -0.11678123474121094, -0.11011123657226562, -0.10344123840332031, -0.096771240234375, -0.09010124206542969, -0.08343124389648438, -0.07676124572753906, -0.07009124755859375, -0.06342124938964844, -0.056751251220703125, -0.05008125305175781, -0.0434112548828125, -0.03674125671386719, -0.030071258544921875, -0.023401260375976562, -0.01673126220703125, -0.010061264038085938, -0.003391265869140625, 0.0032787322998046875, 0.00994873046875, 0.016618728637695312, 0.023288726806640625, 0.029958724975585938, 0.03662872314453125, 0.04329872131347656, 0.049968719482421875, 0.05663871765136719, 0.0633087158203125, 0.06997871398925781, 0.07664871215820312, 0.08331871032714844, 0.08998870849609375, 0.09665870666503906, 0.10332870483398438, 0.10999870300292969, 0.116668701171875, 0.12333869934082031, 0.13000869750976562, 0.13667869567871094, 0.14334869384765625, 0.15001869201660156, 0.15668869018554688, 0.1633586883544922, 0.1700286865234375, 0.1766986846923828, 0.18336868286132812, 0.19003868103027344, 0.19670867919921875, 0.20337867736816406, 0.21004867553710938, 0.2167186737060547, 0.223388671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 19.0, 47.0, 81.0, 168.0, 253.0, 201.0, 94.0, 56.0, 31.0, 18.0, 9.0, 9.0, 8.0, 0.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073527030646801, -0.0676354467868805, -0.061743855476379395, -0.055852267891168594, -0.049960680305957794, -0.044069092720746994, -0.038177505135536194, -0.032285917550325394, -0.026394329965114594, -0.020502742379903793, -0.014611154794692993, -0.008719567209482193, -0.002827979624271393, 0.0030636079609394073, 0.008955195546150208, 0.014846783131361008, 0.020738370716571808, 0.026629958301782608, 0.03252154588699341, 0.03841313347220421, 0.04430472105741501, 0.05019630864262581, 0.05608789622783661, 0.06197948381304741, 0.06787107139825821, 0.07376265525817871, 0.07965424656867981, 0.08554583787918091, 0.09143742173910141, 0.09732900559902191, 0.10322059690952301, 0.10911218822002411, 0.11500376462936401, 0.12089535593986511, 0.1267869472503662, 0.13267852365970612, 0.13857011497020721, 0.1444617062807083, 0.15035328269004822, 0.15624487400054932, 0.16213646531105042, 0.1680280566215515, 0.1739196479320526, 0.17981122434139252, 0.18570281565189362, 0.19159440696239471, 0.19748598337173462, 0.20337757468223572, 0.20926916599273682, 0.21516075730323792, 0.221052348613739, 0.22694392502307892, 0.23283551633358002, 0.23872710764408112, 0.24461868405342102, 0.2505102753639221, 0.2564018666744232, 0.2622934579849243, 0.2681850492954254, 0.2740766406059265, 0.2799682021141052, 0.2858597934246063, 0.2917513847351074, 0.2976429760456085, 0.3035345673561096]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 8.0, 19.0, 17.0, 17.0, 20.0, 13.0, 28.0, 28.0, 33.0, 27.0, 32.0, 41.0, 32.0, 30.0, 41.0, 31.0, 37.0, 35.0, 50.0, 45.0, 39.0, 30.0, 33.0, 36.0, 28.0, 22.0, 27.0, 18.0, 22.0, 16.0, 21.0, 17.0, 15.0, 8.0, 12.0, 5.0, 14.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04460030794143677, -0.0431242436170578, -0.041648175567388535, -0.04017210751771927, -0.0386960431933403, -0.037219978868961334, -0.03574391081929207, -0.0342678427696228, -0.032791778445243835, -0.03131571412086487, -0.029839646071195602, -0.028363579884171486, -0.02688751369714737, -0.025411447510123253, -0.023935381323099136, -0.02245931513607502, -0.020983248949050903, -0.019507182762026787, -0.01803111657500267, -0.016555050387978554, -0.015078984200954437, -0.01360291801393032, -0.012126851826906204, -0.010650785639882088, -0.009174719452857971, -0.007698653265833855, -0.006222587078809738, -0.004746520891785622, -0.003270454704761505, -0.0017943885177373886, -0.0003183223307132721, 0.0011577438563108444, 0.002633810043334961, 0.0041098762303590775, 0.005585942417383194, 0.0070620086044073105, 0.008538074791431427, 0.010014140978455544, 0.01149020716547966, 0.012966273352503777, 0.014442339539527893, 0.01591840572655201, 0.017394471913576126, 0.018870538100600243, 0.02034660428762436, 0.021822670474648476, 0.023298736661672592, 0.02477480284869671, 0.026250869035720825, 0.02772693522274494, 0.029203001409769058, 0.030679067596793175, 0.03215513378381729, 0.03363119810819626, 0.035107266157865524, 0.03658333420753479, 0.03805939853191376, 0.039535462856292725, 0.04101153090596199, 0.042487598955631256, 0.04396366328001022, 0.04543972760438919, 0.046915795654058456, 0.04839186370372772, 0.04986792802810669]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 10.0, 12.0, 14.0, 9.0, 10.0, 19.0, 23.0, 21.0, 25.0, 30.0, 39.0, 46.0, 41.0, 48.0, 37.0, 48.0, 53.0, 57.0, 45.0, 51.0, 42.0, 36.0, 43.0, 40.0, 32.0, 26.0, 23.0, 29.0, 16.0, 15.0, 7.0, 11.0, 10.0, 10.0, 2.0, 1.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.71875, -46.12744140625, -44.5361328125, -42.94482421875, -41.353515625, -39.76220703125, -38.1708984375, -36.57958984375, -34.98828125, -33.39697265625, -31.8056640625, -30.21435546875, -28.623046875, -27.03173828125, -25.4404296875, -23.84912109375, -22.2578125, -20.66650390625, -19.0751953125, -17.48388671875, -15.892578125, -14.30126953125, -12.7099609375, -11.11865234375, -9.52734375, -7.93603515625, -6.3447265625, -4.75341796875, -3.162109375, -1.57080078125, 0.0205078125, 1.61181640625, 3.203125, 4.79443359375, 6.3857421875, 7.97705078125, 9.568359375, 11.15966796875, 12.7509765625, 14.34228515625, 15.93359375, 17.52490234375, 19.1162109375, 20.70751953125, 22.298828125, 23.89013671875, 25.4814453125, 27.07275390625, 28.6640625, 30.25537109375, 31.8466796875, 33.43798828125, 35.029296875, 36.62060546875, 38.2119140625, 39.80322265625, 41.39453125, 42.98583984375, 44.5771484375, 46.16845703125, 47.759765625, 49.35107421875, 50.9423828125, 52.53369140625, 54.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 16.0, 22.0, 26.0, 25.0, 43.0, 32.0, 67.0, 79.0, 112.0, 190.0, 430.0, 1066.0, 4057.0, 22589.0, 171148.0, 636515.0, 181928.0, 23756.0, 4189.0, 1145.0, 406.0, 202.0, 113.0, 72.0, 60.0, 43.0, 41.0, 29.0, 25.0, 20.0, 20.0, 17.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.98046875, -7.71893310546875, -7.4573974609375, -7.19586181640625, -6.934326171875, -6.67279052734375, -6.4112548828125, -6.14971923828125, -5.88818359375, -5.62664794921875, -5.3651123046875, -5.10357666015625, -4.842041015625, -4.58050537109375, -4.3189697265625, -4.05743408203125, -3.7958984375, -3.53436279296875, -3.2728271484375, -3.01129150390625, -2.749755859375, -2.48822021484375, -2.2266845703125, -1.96514892578125, -1.70361328125, -1.44207763671875, -1.1805419921875, -0.91900634765625, -0.657470703125, -0.39593505859375, -0.1343994140625, 0.12713623046875, 0.388671875, 0.65020751953125, 0.9117431640625, 1.17327880859375, 1.434814453125, 1.69635009765625, 1.9578857421875, 2.21942138671875, 2.48095703125, 2.74249267578125, 3.0040283203125, 3.26556396484375, 3.527099609375, 3.78863525390625, 4.0501708984375, 4.31170654296875, 4.5732421875, 4.83477783203125, 5.0963134765625, 5.35784912109375, 5.619384765625, 5.88092041015625, 6.1424560546875, 6.40399169921875, 6.66552734375, 6.92706298828125, 7.1885986328125, 7.45013427734375, 7.711669921875, 7.97320556640625, 8.2347412109375, 8.49627685546875, 8.7578125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 5.0, 13.0, 15.0, 19.0, 26.0, 44.0, 45.0, 52.0, 49.0, 61.0, 52.0, 75.0, 2117.0, 75.0, 80.0, 66.0, 51.0, 46.0, 33.0, 27.0, 27.0, 15.0, 15.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-105.4375, -102.5517578125, -99.666015625, -96.7802734375, -93.89453125, -91.0087890625, -88.123046875, -85.2373046875, -82.3515625, -79.4658203125, -76.580078125, -73.6943359375, -70.80859375, -67.9228515625, -65.037109375, -62.1513671875, -59.265625, -56.3798828125, -53.494140625, -50.6083984375, -47.72265625, -44.8369140625, -41.951171875, -39.0654296875, -36.1796875, -33.2939453125, -30.408203125, -27.5224609375, -24.63671875, -21.7509765625, -18.865234375, -15.9794921875, -13.09375, -10.2080078125, -7.322265625, -4.4365234375, -1.55078125, 1.3349609375, 4.220703125, 7.1064453125, 9.9921875, 12.8779296875, 15.763671875, 18.6494140625, 21.53515625, 24.4208984375, 27.306640625, 30.1923828125, 33.078125, 35.9638671875, 38.849609375, 41.7353515625, 44.62109375, 47.5068359375, 50.392578125, 53.2783203125, 56.1640625, 59.0498046875, 61.935546875, 64.8212890625, 67.70703125, 70.5927734375, 73.478515625, 76.3642578125, 79.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 19.0, 34.0, 43.0, 46.0, 92.0, 162.0, 315.0, 446.0, 877.0, 1976.0, 5950.0, 29657.0, 228575.0, 2731176.0, 121407.0, 17484.0, 4072.0, 1487.0, 761.0, 407.0, 247.0, 143.0, 90.0, 63.0, 34.0, 35.0, 14.0, 13.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40264892578125, -6.1685791015625, -5.93450927734375, -5.700439453125, -5.46636962890625, -5.2322998046875, -4.99822998046875, -4.76416015625, -4.53009033203125, -4.2960205078125, -4.06195068359375, -3.827880859375, -3.59381103515625, -3.3597412109375, -3.12567138671875, -2.8916015625, -2.65753173828125, -2.4234619140625, -2.18939208984375, -1.955322265625, -1.72125244140625, -1.4871826171875, -1.25311279296875, -1.01904296875, -0.78497314453125, -0.5509033203125, -0.31683349609375, -0.082763671875, 0.15130615234375, 0.3853759765625, 0.61944580078125, 0.853515625, 1.08758544921875, 1.3216552734375, 1.55572509765625, 1.789794921875, 2.02386474609375, 2.2579345703125, 2.49200439453125, 2.72607421875, 2.96014404296875, 3.1942138671875, 3.42828369140625, 3.662353515625, 3.89642333984375, 4.1304931640625, 4.36456298828125, 4.5986328125, 4.83270263671875, 5.0667724609375, 5.30084228515625, 5.534912109375, 5.76898193359375, 6.0030517578125, 6.23712158203125, 6.47119140625, 6.70526123046875, 6.9393310546875, 7.17340087890625, 7.407470703125, 7.64154052734375, 7.8756103515625, 8.10968017578125, 8.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 34.0, 96.0, 342.0, 331.0, 102.0, 39.0, 23.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.48118591308594, -124.69154357910156, -116.90190124511719, -109.11225891113281, -101.32261657714844, -93.53297424316406, -85.74333190917969, -77.95368957519531, -70.16404724121094, -62.37440490722656, -54.58476257324219, -46.79512023925781, -39.00547790527344, -31.215835571289062, -23.426193237304688, -15.636550903320312, -7.8469085693359375, -0.0572662353515625, 7.7323760986328125, 15.522018432617188, 23.311660766601562, 31.101303100585938, 38.89094543457031, 46.68058776855469, 54.47023010253906, 62.25987243652344, 70.04951477050781, 77.83915710449219, 85.62879943847656, 93.41844177246094, 101.20808410644531, 108.99772644042969, 116.787353515625, 124.57699584960938, 132.36663818359375, 140.15628051757812, 147.9459228515625, 155.73556518554688, 163.52520751953125, 171.31484985351562, 179.1044921875, 186.89413452148438, 194.68377685546875, 202.47341918945312, 210.2630615234375, 218.05270385742188, 225.84234619140625, 233.63198852539062, 241.421630859375, 249.21127319335938, 257.00091552734375, 264.7905578613281, 272.5802001953125, 280.3698425292969, 288.15948486328125, 295.9491271972656, 303.73876953125, 311.5284118652344, 319.31805419921875, 327.1076965332031, 334.8973388671875, 342.6869812011719, 350.47662353515625, 358.2662658691406, 366.055908203125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 11.0, 12.0, 12.0, 14.0, 16.0, 23.0, 25.0, 28.0, 26.0, 36.0, 46.0, 37.0, 47.0, 46.0, 46.0, 52.0, 48.0, 31.0, 42.0, 33.0, 26.0, 44.0, 40.0, 29.0, 25.0, 23.0, 24.0, 15.0, 22.0, 26.0, 10.0, 11.0, 6.0, 11.0, 9.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.71125030517578, -78.79401397705078, -75.87677001953125, -72.95953369140625, -70.04229736328125, -67.12506103515625, -64.20781707763672, -61.29058074951172, -58.37334442138672, -55.45610427856445, -52.53886795043945, -49.62162780761719, -46.70439147949219, -43.78715133666992, -40.869911193847656, -37.952674865722656, -35.03543472290039, -32.118194580078125, -29.200958251953125, -26.28371810913086, -23.36648178100586, -20.449241638183594, -17.53200340270996, -14.614765167236328, -11.697526931762695, -8.780288696289062, -5.8630499839782715, -2.9458112716674805, -0.028573036193847656, 2.888665199279785, 5.805904388427734, 8.723142623901367, 11.640380859375, 14.557619094848633, 17.474857330322266, 20.39209747314453, 23.30933380126953, 26.226573944091797, 29.14381217956543, 32.06105041503906, 34.97828674316406, 37.89552688598633, 40.81276321411133, 43.730003356933594, 46.647239685058594, 49.56447982788086, 52.481719970703125, 55.398956298828125, 58.31619644165039, 61.233436584472656, 64.15067291259766, 67.06790924072266, 69.98515319824219, 72.90238952636719, 75.81962585449219, 78.73686218261719, 81.65410614013672, 84.57134246826172, 87.48858642578125, 90.40582275390625, 93.32305908203125, 96.24029541015625, 99.15753936767578, 102.07477569580078, 104.99201202392578]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 9.0, 13.0, 20.0, 16.0, 15.0, 22.0, 35.0, 43.0, 56.0, 78.0, 103.0, 127.0, 185.0, 285.0, 475.0, 731.0, 1338.0, 3104.0, 1025392.0, 11026.0, 2426.0, 1023.0, 634.0, 398.0, 293.0, 168.0, 126.0, 85.0, 65.0, 48.0, 53.0, 32.0, 27.0, 21.0, 23.0, 14.0, 12.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.460712432861328, -25.603782653808594, -24.74685287475586, -23.889923095703125, -23.032995223999023, -22.17606544494629, -21.319135665893555, -20.46220588684082, -19.60527801513672, -18.748348236083984, -17.89141845703125, -17.034488677978516, -16.177560806274414, -15.32063102722168, -14.463701248168945, -13.606771469116211, -12.749841690063477, -11.892911911010742, -11.035983085632324, -10.17905330657959, -9.322124481201172, -8.465194702148438, -7.608264923095703, -6.751335620880127, -5.894406318664551, -5.037477016448975, -4.180547714233398, -3.323617935180664, -2.466688632965088, -1.6097593307495117, -0.7528295516967773, 0.10409975051879883, 0.9610271453857422, 1.817956566810608, 2.6748859882354736, 3.531815528869629, 4.388744831085205, 5.245674133300781, 6.102603912353516, 6.959533214569092, 7.816462516784668, 8.673392295837402, 9.53032112121582, 10.387250900268555, 11.244180679321289, 12.101109504699707, 12.958039283752441, 13.81496810913086, 14.671897888183594, 15.528827667236328, 16.385757446289062, 17.242687225341797, 18.0996150970459, 18.956544876098633, 19.813474655151367, 20.6704044342041, 21.527332305908203, 22.384262084960938, 23.241191864013672, 24.098121643066406, 24.955049514770508, 25.811979293823242, 26.668909072875977, 27.52583885192871, 28.382768630981445]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 39.0, 596.0, 51462116.0, 354.0, 23.0, 9.0, 0.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3868.11083984375, -3772.389892578125, -3676.668701171875, -3580.94775390625, -3485.226806640625, -3389.505859375, -3293.78466796875, -3198.063720703125, -3102.3427734375, -3006.621826171875, -2910.900634765625, -2815.1796875, -2719.458740234375, -2623.73779296875, -2528.0166015625, -2432.295654296875, -2336.574462890625, -2240.853515625, -2145.13232421875, -2049.411376953125, -1953.6904296875, -1857.9693603515625, -1762.248291015625, -1666.52734375, -1570.8062744140625, -1475.085205078125, -1379.3642578125, -1283.6431884765625, -1187.922119140625, -1092.201171875, -996.4801025390625, -900.7590942382812, -805.037841796875, -709.3168334960938, -613.5958251953125, -517.874755859375, -422.15374755859375, -326.4327392578125, -230.711669921875, -134.99066162109375, -39.2696533203125, 56.45137023925781, 152.17239379882812, 247.8934326171875, 343.61444091796875, 439.33544921875, 535.0565185546875, 630.7775268554688, 726.49853515625, 822.2195434570312, 917.9405517578125, 1013.66162109375, 1109.382568359375, 1205.1036376953125, 1300.82470703125, 1396.545654296875, 1492.2667236328125, 1587.98779296875, 1683.708740234375, 1779.4298095703125, 1875.15087890625, 1970.871826171875, 2066.5927734375, 2162.31396484375, 2258.034912109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 21.0, 36.0, 50.0, 81.0, 133.0, 181.0, 272.0, 431.0, 680.0, 1070.0, 1775.0, 2839.0, 4880.0, 8802.0, 15621.0, 29268.0, 58469.0, 125211.0, 297986.0, 919622.0, 3504103.0, 808701.0, 275663.0, 117125.0, 54991.0, 27986.0, 14940.0, 8423.0, 4700.0, 2698.0, 1703.0, 1092.0, 639.0, 429.0, 236.0, 182.0, 113.0, 77.0, 58.0, 28.0, 24.0, 17.0, 14.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.265625, -15.71337890625, -15.1611328125, -14.60888671875, -14.056640625, -13.50439453125, -12.9521484375, -12.39990234375, -11.84765625, -11.29541015625, -10.7431640625, -10.19091796875, -9.638671875, -9.08642578125, -8.5341796875, -7.98193359375, -7.4296875, -6.87744140625, -6.3251953125, -5.77294921875, -5.220703125, -4.66845703125, -4.1162109375, -3.56396484375, -3.01171875, -2.45947265625, -1.9072265625, -1.35498046875, -0.802734375, -0.25048828125, 0.3017578125, 0.85400390625, 1.40625, 1.95849609375, 2.5107421875, 3.06298828125, 3.615234375, 4.16748046875, 4.7197265625, 5.27197265625, 5.82421875, 6.37646484375, 6.9287109375, 7.48095703125, 8.033203125, 8.58544921875, 9.1376953125, 9.68994140625, 10.2421875, 10.79443359375, 11.3466796875, 11.89892578125, 12.451171875, 13.00341796875, 13.5556640625, 14.10791015625, 14.66015625, 15.21240234375, 15.7646484375, 16.31689453125, 16.869140625, 17.42138671875, 17.9736328125, 18.52587890625, 19.078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 10.0, 5.0, 12.0, 21.0, 18.0, 11.0, 20.0, 18.0, 32.0, 34.0, 21.0, 25.0, 31.0, 39.0, 45.0, 72.0, 130.0, 296.0, 459.0, 207.0, 93.0, 58.0, 42.0, 38.0, 32.0, 40.0, 34.0, 28.0, 20.0, 19.0, 23.0, 18.0, 13.0, 12.0, 9.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.625, -21.96484375, -21.3046875, -20.64453125, -19.984375, -19.32421875, -18.6640625, -18.00390625, -17.34375, -16.68359375, -16.0234375, -15.36328125, -14.703125, -14.04296875, -13.3828125, -12.72265625, -12.0625, -11.40234375, -10.7421875, -10.08203125, -9.421875, -8.76171875, -8.1015625, -7.44140625, -6.78125, -6.12109375, -5.4609375, -4.80078125, -4.140625, -3.48046875, -2.8203125, -2.16015625, -1.5, -0.83984375, -0.1796875, 0.48046875, 1.140625, 1.80078125, 2.4609375, 3.12109375, 3.78125, 4.44140625, 5.1015625, 5.76171875, 6.421875, 7.08203125, 7.7421875, 8.40234375, 9.0625, 9.72265625, 10.3828125, 11.04296875, 11.703125, 12.36328125, 13.0234375, 13.68359375, 14.34375, 15.00390625, 15.6640625, 16.32421875, 16.984375, 17.64453125, 18.3046875, 18.96484375, 19.625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 13.0, 26.0, 36.0, 55.0, 73.0, 93.0, 146.0, 207.0, 327.0, 408.0, 621.0, 870.0, 1382.0, 2039.0, 3249.0, 4947.0, 7784.0, 12736.0, 20596.0, 34537.0, 58981.0, 100216.0, 173628.0, 296755.0, 556631.0, 2300921.0, 1597311.0, 475200.0, 264279.0, 153846.0, 89678.0, 52171.0, 31039.0, 18677.0, 11342.0, 7031.0, 4501.0, 2861.0, 1966.0, 1322.0, 896.0, 615.0, 419.0, 307.0, 213.0, 148.0, 96.0, 91.0, 52.0, 37.0, 20.0, 17.0, 3.0, 8.0, 5.0, 1.0, 4.0], "bins": [-7.18359375, -6.96514892578125, -6.7467041015625, -6.52825927734375, -6.309814453125, -6.09136962890625, -5.8729248046875, -5.65447998046875, -5.43603515625, -5.21759033203125, -4.9991455078125, -4.78070068359375, -4.562255859375, -4.34381103515625, -4.1253662109375, -3.90692138671875, -3.6884765625, -3.47003173828125, -3.2515869140625, -3.03314208984375, -2.814697265625, -2.59625244140625, -2.3778076171875, -2.15936279296875, -1.94091796875, -1.72247314453125, -1.5040283203125, -1.28558349609375, -1.067138671875, -0.84869384765625, -0.6302490234375, -0.41180419921875, -0.193359375, 0.02508544921875, 0.2435302734375, 0.46197509765625, 0.680419921875, 0.89886474609375, 1.1173095703125, 1.33575439453125, 1.55419921875, 1.77264404296875, 1.9910888671875, 2.20953369140625, 2.427978515625, 2.64642333984375, 2.8648681640625, 3.08331298828125, 3.3017578125, 3.52020263671875, 3.7386474609375, 3.95709228515625, 4.175537109375, 4.39398193359375, 4.6124267578125, 4.83087158203125, 5.04931640625, 5.26776123046875, 5.4862060546875, 5.70465087890625, 5.923095703125, 6.14154052734375, 6.3599853515625, 6.57843017578125, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 8.0, 5.0, 19.0, 21.0, 22.0, 29.0, 24.0, 35.0, 34.0, 45.0, 36.0, 55.0, 68.0, 174.0, 542.0, 351.0, 114.0, 60.0, 50.0, 38.0, 36.0, 34.0, 35.0, 34.0, 25.0, 28.0, 16.0, 14.0, 15.0, 13.0, 5.0, 3.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.24853515625, -35.9970703125, -34.74560546875, -33.494140625, -32.24267578125, -30.9912109375, -29.73974609375, -28.48828125, -27.23681640625, -25.9853515625, -24.73388671875, -23.482421875, -22.23095703125, -20.9794921875, -19.72802734375, -18.4765625, -17.22509765625, -15.9736328125, -14.72216796875, -13.470703125, -12.21923828125, -10.9677734375, -9.71630859375, -8.46484375, -7.21337890625, -5.9619140625, -4.71044921875, -3.458984375, -2.20751953125, -0.9560546875, 0.29541015625, 1.546875, 2.79833984375, 4.0498046875, 5.30126953125, 6.552734375, 7.80419921875, 9.0556640625, 10.30712890625, 11.55859375, 12.81005859375, 14.0615234375, 15.31298828125, 16.564453125, 17.81591796875, 19.0673828125, 20.31884765625, 21.5703125, 22.82177734375, 24.0732421875, 25.32470703125, 26.576171875, 27.82763671875, 29.0791015625, 30.33056640625, 31.58203125, 32.83349609375, 34.0849609375, 35.33642578125, 36.587890625, 37.83935546875, 39.0908203125, 40.34228515625, 41.59375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 14.0, 16.0, 12.0, 35.0, 48.0, 81.0, 108.0, 126.0, 190.0, 258.0, 377.0, 542.0, 773.0, 1241.0, 1934.0, 3044.0, 5519.0, 11276.0, 26282.0, 67939.0, 227579.0, 5735172.0, 126301.0, 44862.0, 17998.0, 8226.0, 4295.0, 2454.0, 1506.0, 989.0, 651.0, 469.0, 312.0, 212.0, 177.0, 110.0, 83.0, 43.0, 42.0, 26.0, 26.0, 18.0, 14.0, 8.0, 4.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0], "bins": [-39.90625, -38.67041015625, -37.4345703125, -36.19873046875, -34.962890625, -33.72705078125, -32.4912109375, -31.25537109375, -30.01953125, -28.78369140625, -27.5478515625, -26.31201171875, -25.076171875, -23.84033203125, -22.6044921875, -21.36865234375, -20.1328125, -18.89697265625, -17.6611328125, -16.42529296875, -15.189453125, -13.95361328125, -12.7177734375, -11.48193359375, -10.24609375, -9.01025390625, -7.7744140625, -6.53857421875, -5.302734375, -4.06689453125, -2.8310546875, -1.59521484375, -0.359375, 0.87646484375, 2.1123046875, 3.34814453125, 4.583984375, 5.81982421875, 7.0556640625, 8.29150390625, 9.52734375, 10.76318359375, 11.9990234375, 13.23486328125, 14.470703125, 15.70654296875, 16.9423828125, 18.17822265625, 19.4140625, 20.64990234375, 21.8857421875, 23.12158203125, 24.357421875, 25.59326171875, 26.8291015625, 28.06494140625, 29.30078125, 30.53662109375, 31.7724609375, 33.00830078125, 34.244140625, 35.47998046875, 36.7158203125, 37.95166015625, 39.1875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 7.0, 4.0, 4.0, 6.0, 10.0, 8.0, 18.0, 6.0, 19.0, 14.0, 16.0, 17.0, 29.0, 31.0, 39.0, 28.0, 32.0, 27.0, 33.0, 56.0, 119.0, 703.0, 291.0, 81.0, 36.0, 31.0, 36.0, 40.0, 28.0, 26.0, 26.0, 20.0, 22.0, 22.0, 25.0, 19.0, 8.0, 9.0, 23.0, 11.0, 9.0, 9.0, 5.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3388671875, -60.240234375, -58.1416015625, -56.04296875, -53.9443359375, -51.845703125, -49.7470703125, -47.6484375, -45.5498046875, -43.451171875, -41.3525390625, -39.25390625, -37.1552734375, -35.056640625, -32.9580078125, -30.859375, -28.7607421875, -26.662109375, -24.5634765625, -22.46484375, -20.3662109375, -18.267578125, -16.1689453125, -14.0703125, -11.9716796875, -9.873046875, -7.7744140625, -5.67578125, -3.5771484375, -1.478515625, 0.6201171875, 2.71875, 4.8173828125, 6.916015625, 9.0146484375, 11.11328125, 13.2119140625, 15.310546875, 17.4091796875, 19.5078125, 21.6064453125, 23.705078125, 25.8037109375, 27.90234375, 30.0009765625, 32.099609375, 34.1982421875, 36.296875, 38.3955078125, 40.494140625, 42.5927734375, 44.69140625, 46.7900390625, 48.888671875, 50.9873046875, 53.0859375, 55.1845703125, 57.283203125, 59.3818359375, 61.48046875, 63.5791015625, 65.677734375, 67.7763671875, 69.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 35.0, 461.0, 433.0, 29.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.9376831054688, -490.0948486328125, -461.25201416015625, -432.4091796875, -403.56634521484375, -374.7235107421875, -345.8807067871094, -317.0378723144531, -288.1950378417969, -259.3522033691406, -230.50936889648438, -201.6665496826172, -172.82371520996094, -143.9808807373047, -115.1380615234375, -86.29522705078125, -57.452392578125, -28.609561920166016, 0.23326873779296875, 29.076095581054688, 57.91893005371094, 86.76176452636719, 115.60458374023438, 144.44741821289062, 173.29025268554688, 202.13308715820312, 230.97592163085938, 259.8187255859375, 288.66156005859375, 317.50439453125, 346.34722900390625, 375.1900634765625, 404.0328369140625, 432.87567138671875, 461.718505859375, 490.56134033203125, 519.4041748046875, 548.2470092773438, 577.08984375, 605.9326171875, 634.7755126953125, 663.6183471679688, 692.461181640625, 721.3040161132812, 750.1468505859375, 778.9896850585938, 807.83251953125, 836.67529296875, 865.5181274414062, 894.3609619140625, 923.2037963867188, 952.046630859375, 980.8894653320312, 1009.7322998046875, 1038.5750732421875, 1067.41796875, 1096.2607421875, 1125.103515625, 1153.9464111328125, 1182.7891845703125, 1211.632080078125, 1240.474853515625, 1269.3177490234375, 1298.1605224609375, 1327.00341796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 8.0, 12.0, 15.0, 17.0, 18.0, 24.0, 71.0, 425.0, 234.0, 37.0, 24.0, 14.0, 20.0, 10.0, 7.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-519.654296875, -503.79681396484375, -487.9393310546875, -472.08184814453125, -456.224365234375, -440.36688232421875, -424.5093994140625, -408.65191650390625, -392.79443359375, -376.93695068359375, -361.0794677734375, -345.22198486328125, -329.364501953125, -313.50701904296875, -297.6495361328125, -281.79205322265625, -265.9345703125, -250.07708740234375, -234.2196044921875, -218.36212158203125, -202.504638671875, -186.64715576171875, -170.7896728515625, -154.93218994140625, -139.07467651367188, -123.21719360351562, -107.35971069335938, -91.50222778320312, -75.64474487304688, -59.787254333496094, -43.929771423339844, -28.072288513183594, -12.214813232421875, 3.6426706314086914, 19.500154495239258, 35.35763931274414, 51.21512222290039, 67.0726089477539, 82.93009185791016, 98.7875747680664, 114.64505767822266, 130.50254821777344, 146.3600311279297, 162.21751403808594, 178.0749969482422, 193.93247985839844, 209.7899627685547, 225.64744567871094, 241.5049285888672, 257.3624267578125, 273.21990966796875, 289.077392578125, 304.93487548828125, 320.7923583984375, 336.64984130859375, 352.50732421875, 368.36480712890625, 384.2222900390625, 400.07977294921875, 415.937255859375, 431.79473876953125, 447.6522216796875, 463.50970458984375, 479.3671875, 495.22467041015625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 16.0, 14.0, 18.0, 38.0, 52.0, 74.0, 98.0, 163.0, 242.0, 392.0, 673.0, 1194.0, 2144.0, 4426.0, 11405.0, 63006.0, 4059775.0, 33895.0, 8474.0, 3643.0, 1737.0, 1028.0, 602.0, 414.0, 259.0, 146.0, 94.0, 74.0, 55.0, 34.0, 35.0, 19.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8590087890625, -2.764892578125, -2.6707763671875, -2.57666015625, -2.4825439453125, -2.388427734375, -2.2943115234375, -2.2001953125, -2.1060791015625, -2.011962890625, -1.9178466796875, -1.82373046875, -1.7296142578125, -1.635498046875, -1.5413818359375, -1.447265625, -1.3531494140625, -1.259033203125, -1.1649169921875, -1.07080078125, -0.9766845703125, -0.882568359375, -0.7884521484375, -0.6943359375, -0.6002197265625, -0.506103515625, -0.4119873046875, -0.31787109375, -0.2237548828125, -0.129638671875, -0.0355224609375, 0.05859375, 0.1527099609375, 0.246826171875, 0.3409423828125, 0.43505859375, 0.5291748046875, 0.623291015625, 0.7174072265625, 0.8115234375, 0.9056396484375, 0.999755859375, 1.0938720703125, 1.18798828125, 1.2821044921875, 1.376220703125, 1.4703369140625, 1.564453125, 1.6585693359375, 1.752685546875, 1.8468017578125, 1.94091796875, 2.0350341796875, 2.129150390625, 2.2232666015625, 2.3173828125, 2.4114990234375, 2.505615234375, 2.5997314453125, 2.69384765625, 2.7879638671875, 2.882080078125, 2.9761962890625, 3.0703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 9.0, 12.0, 13.0, 12.0, 17.0, 113.0, 649.0, 35.0, 14.0, 10.0, 9.0, 5.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8466796875, -0.814453125, -0.7822265625, -0.75, -0.7177734375, -0.685546875, -0.6533203125, -0.62109375, -0.5888671875, -0.556640625, -0.5244140625, -0.4921875, -0.4599609375, -0.427734375, -0.3955078125, -0.36328125, -0.3310546875, -0.298828125, -0.2666015625, -0.234375, -0.2021484375, -0.169921875, -0.1376953125, -0.10546875, -0.0732421875, -0.041015625, -0.0087890625, 0.0234375, 0.0556640625, 0.087890625, 0.1201171875, 0.15234375, 0.1845703125, 0.216796875, 0.2490234375, 0.28125, 0.3134765625, 0.345703125, 0.3779296875, 0.41015625, 0.4423828125, 0.474609375, 0.5068359375, 0.5390625, 0.5712890625, 0.603515625, 0.6357421875, 0.66796875, 0.7001953125, 0.732421875, 0.7646484375, 0.796875, 0.8291015625, 0.861328125, 0.8935546875, 0.92578125, 0.9580078125, 0.990234375, 1.0224609375, 1.0546875, 1.0869140625, 1.119140625, 1.1513671875, 1.18359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 17.0, 24.0, 18.0, 28.0, 46.0, 71.0, 128.0, 214.0, 381.0, 684.0, 1344.0, 2533.0, 5148.0, 11090.0, 28513.0, 101133.0, 3090342.0, 831353.0, 77627.0, 23925.0, 9816.0, 4644.0, 2338.0, 1192.0, 689.0, 359.0, 222.0, 128.0, 80.0, 61.0, 40.0, 19.0, 12.0, 10.0, 11.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.816009521484375, -2.72186279296875, -2.627716064453125, -2.5335693359375, -2.439422607421875, -2.34527587890625, -2.251129150390625, -2.156982421875, -2.062835693359375, -1.96868896484375, -1.874542236328125, -1.7803955078125, -1.686248779296875, -1.59210205078125, -1.497955322265625, -1.40380859375, -1.309661865234375, -1.21551513671875, -1.121368408203125, -1.0272216796875, -0.933074951171875, -0.83892822265625, -0.744781494140625, -0.650634765625, -0.556488037109375, -0.46234130859375, -0.368194580078125, -0.2740478515625, -0.179901123046875, -0.08575439453125, 0.008392333984375, 0.1025390625, 0.196685791015625, 0.29083251953125, 0.384979248046875, 0.4791259765625, 0.573272705078125, 0.66741943359375, 0.761566162109375, 0.855712890625, 0.949859619140625, 1.04400634765625, 1.138153076171875, 1.2322998046875, 1.326446533203125, 1.42059326171875, 1.514739990234375, 1.60888671875, 1.703033447265625, 1.79718017578125, 1.891326904296875, 1.9854736328125, 2.079620361328125, 2.17376708984375, 2.267913818359375, 2.362060546875, 2.456207275390625, 2.55035400390625, 2.644500732421875, 2.7386474609375, 2.832794189453125, 2.92694091796875, 3.021087646484375, 3.115234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 9.0, 6.0, 9.0, 14.0, 19.0, 25.0, 35.0, 34.0, 56.0, 84.0, 115.0, 229.0, 802.0, 1739.0, 337.0, 154.0, 101.0, 67.0, 40.0, 34.0, 23.0, 27.0, 15.0, 11.0, 14.0, 12.0, 5.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.896484375, -0.8677520751953125, -0.839019775390625, -0.8102874755859375, -0.78155517578125, -0.7528228759765625, -0.724090576171875, -0.6953582763671875, -0.6666259765625, -0.6378936767578125, -0.609161376953125, -0.5804290771484375, -0.55169677734375, -0.5229644775390625, -0.494232177734375, -0.4654998779296875, -0.436767578125, -0.4080352783203125, -0.379302978515625, -0.3505706787109375, -0.32183837890625, -0.2931060791015625, -0.264373779296875, -0.2356414794921875, -0.2069091796875, -0.1781768798828125, -0.149444580078125, -0.1207122802734375, -0.09197998046875, -0.0632476806640625, -0.034515380859375, -0.0057830810546875, 0.02294921875, 0.0516815185546875, 0.080413818359375, 0.1091461181640625, 0.13787841796875, 0.1666107177734375, 0.195343017578125, 0.2240753173828125, 0.2528076171875, 0.2815399169921875, 0.310272216796875, 0.3390045166015625, 0.36773681640625, 0.3964691162109375, 0.425201416015625, 0.4539337158203125, 0.482666015625, 0.5113983154296875, 0.540130615234375, 0.5688629150390625, 0.59759521484375, 0.6263275146484375, 0.655059814453125, 0.6837921142578125, 0.7125244140625, 0.7412567138671875, 0.769989013671875, 0.7987213134765625, 0.82745361328125, 0.8561859130859375, 0.884918212890625, 0.9136505126953125, 0.9423828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 12.0, 114.0, 493.0, 328.0, 40.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.387290000915527, -10.665428161621094, -9.943567276000977, -9.221705436706543, -8.49984359741211, -7.777982711791992, -7.056120872497559, -6.334259510040283, -5.612398147583008, -4.890536785125732, -4.168675422668457, -3.4468135833740234, -2.724952220916748, -2.0030908584594727, -1.281229019165039, -0.5593676567077637, 0.16249370574951172, 0.8843551874160767, 1.6062166690826416, 2.328078269958496, 3.0499396324157715, 3.771800994873047, 4.4936628341674805, 5.215524196624756, 5.937385559082031, 6.659246921539307, 7.381108283996582, 8.102970123291016, 8.824831008911133, 9.546692848205566, 10.2685546875, 10.990415573120117, 11.712276458740234, 12.434138298034668, 13.155999183654785, 13.877861022949219, 14.599721908569336, 15.32158374786377, 16.043445587158203, 16.76530647277832, 17.487167358398438, 18.209028244018555, 18.930891036987305, 19.652751922607422, 20.37461280822754, 21.096473693847656, 21.818336486816406, 22.540197372436523, 23.262060165405273, 23.98392105102539, 24.70578384399414, 25.427644729614258, 26.149505615234375, 26.871368408203125, 27.593229293823242, 28.31509017944336, 29.03695297241211, 29.758813858032227, 30.480676651000977, 31.202537536621094, 31.92439842224121, 32.64625930786133, 33.36812210083008, 34.08998489379883, 34.81184387207031]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 3.0, 9.0, 5.0, 6.0, 16.0, 17.0, 20.0, 24.0, 29.0, 35.0, 62.0, 51.0, 49.0, 30.0, 51.0, 59.0, 60.0, 54.0, 53.0, 56.0, 52.0, 42.0, 31.0, 44.0, 39.0, 22.0, 21.0, 16.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.881981134414673, -2.762664556503296, -2.643348217010498, -2.524031639099121, -2.4047152996063232, -2.2853987216949463, -2.1660823822021484, -2.0467658042907715, -1.927449345588684, -1.8081328868865967, -1.6888164281845093, -1.5694999694824219, -1.450183391571045, -1.330867052078247, -1.2115504741668701, -1.0922340154647827, -0.9729175567626953, -0.8536010980606079, -0.7342846393585205, -0.6149681210517883, -0.4956516623497009, -0.3763352036476135, -0.25701868534088135, -0.13770222663879395, -0.018385767936706543, 0.10093070566654205, 0.22024717926979065, 0.33956366777420044, 0.45888012647628784, 0.5781965851783752, 0.6975131034851074, 0.8168295621871948, 0.9361462593078613, 1.0554627180099487, 1.1747791767120361, 1.294095754623413, 1.413412094116211, 1.532728672027588, 1.6520451307296753, 1.7713615894317627, 1.89067804813385, 2.0099945068359375, 2.1293110847473145, 2.2486274242401123, 2.3679440021514893, 2.487260341644287, 2.606576919555664, 2.725893497467041, 2.845209836959839, 2.964526414871216, 3.0838427543640137, 3.2031593322753906, 3.3224756717681885, 3.4417922496795654, 3.5611085891723633, 3.6804251670837402, 3.799741744995117, 3.919058322906494, 4.038374900817871, 4.15769100189209, 4.277007579803467, 4.396324157714844, 4.515640735626221, 4.634957313537598, 4.754273414611816]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 11.0, 12.0, 15.0, 25.0, 36.0, 44.0, 87.0, 96.0, 146.0, 213.0, 347.0, 496.0, 746.0, 1116.0, 1710.0, 2821.0, 4319.0, 7288.0, 12899.0, 25208.0, 72145.0, 835237.0, 39005.0, 18473.0, 10201.0, 5763.0, 3567.0, 2166.0, 1491.0, 973.0, 566.0, 424.0, 330.0, 199.0, 123.0, 76.0, 61.0, 44.0, 29.0, 17.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.591796875, -2.52227783203125, -2.4527587890625, -2.38323974609375, -2.313720703125, -2.24420166015625, -2.1746826171875, -2.10516357421875, -2.03564453125, -1.96612548828125, -1.8966064453125, -1.82708740234375, -1.757568359375, -1.68804931640625, -1.6185302734375, -1.54901123046875, -1.4794921875, -1.40997314453125, -1.3404541015625, -1.27093505859375, -1.201416015625, -1.13189697265625, -1.0623779296875, -0.99285888671875, -0.92333984375, -0.85382080078125, -0.7843017578125, -0.71478271484375, -0.645263671875, -0.57574462890625, -0.5062255859375, -0.43670654296875, -0.3671875, -0.29766845703125, -0.2281494140625, -0.15863037109375, -0.089111328125, -0.01959228515625, 0.0499267578125, 0.11944580078125, 0.18896484375, 0.25848388671875, 0.3280029296875, 0.39752197265625, 0.467041015625, 0.53656005859375, 0.6060791015625, 0.67559814453125, 0.7451171875, 0.81463623046875, 0.8841552734375, 0.95367431640625, 1.023193359375, 1.09271240234375, 1.1622314453125, 1.23175048828125, 1.30126953125, 1.37078857421875, 1.4403076171875, 1.50982666015625, 1.579345703125, 1.64886474609375, 1.7183837890625, 1.78790283203125, 1.857421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 11.0, 11.0, 129.0, 553.0, 116.0, 12.0, 13.0, 12.0, 6.0, 7.0, 5.0, 4.0, 8.0, 6.0, 2.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8037109375, -0.773284912109375, -0.74285888671875, -0.712432861328125, -0.6820068359375, -0.651580810546875, -0.62115478515625, -0.590728759765625, -0.560302734375, -0.529876708984375, -0.49945068359375, -0.469024658203125, -0.4385986328125, -0.408172607421875, -0.37774658203125, -0.347320556640625, -0.31689453125, -0.286468505859375, -0.25604248046875, -0.225616455078125, -0.1951904296875, -0.164764404296875, -0.13433837890625, -0.103912353515625, -0.073486328125, -0.043060302734375, -0.01263427734375, 0.017791748046875, 0.0482177734375, 0.078643798828125, 0.10906982421875, 0.139495849609375, 0.169921875, 0.200347900390625, 0.23077392578125, 0.261199951171875, 0.2916259765625, 0.322052001953125, 0.35247802734375, 0.382904052734375, 0.413330078125, 0.443756103515625, 0.47418212890625, 0.504608154296875, 0.5350341796875, 0.565460205078125, 0.59588623046875, 0.626312255859375, 0.65673828125, 0.687164306640625, 0.71759033203125, 0.748016357421875, 0.7784423828125, 0.808868408203125, 0.83929443359375, 0.869720458984375, 0.900146484375, 0.930572509765625, 0.96099853515625, 0.991424560546875, 1.0218505859375, 1.052276611328125, 1.08270263671875, 1.113128662109375, 1.1435546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 10.0, 6.0, 14.0, 17.0, 18.0, 22.0, 35.0, 53.0, 87.0, 119.0, 189.0, 351.0, 753.0, 1618.0, 3931.0, 11433.0, 39126.0, 176126.0, 576732.0, 179234.0, 39854.0, 11497.0, 3995.0, 1606.0, 714.0, 371.0, 213.0, 145.0, 92.0, 44.0, 31.0, 29.0, 19.0, 21.0, 11.0, 7.0, 8.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.4671630859375, -2.383544921875, -2.2999267578125, -2.21630859375, -2.1326904296875, -2.049072265625, -1.9654541015625, -1.8818359375, -1.7982177734375, -1.714599609375, -1.6309814453125, -1.54736328125, -1.4637451171875, -1.380126953125, -1.2965087890625, -1.212890625, -1.1292724609375, -1.045654296875, -0.9620361328125, -0.87841796875, -0.7947998046875, -0.711181640625, -0.6275634765625, -0.5439453125, -0.4603271484375, -0.376708984375, -0.2930908203125, -0.20947265625, -0.1258544921875, -0.042236328125, 0.0413818359375, 0.125, 0.2086181640625, 0.292236328125, 0.3758544921875, 0.45947265625, 0.5430908203125, 0.626708984375, 0.7103271484375, 0.7939453125, 0.8775634765625, 0.961181640625, 1.0447998046875, 1.12841796875, 1.2120361328125, 1.295654296875, 1.3792724609375, 1.462890625, 1.5465087890625, 1.630126953125, 1.7137451171875, 1.79736328125, 1.8809814453125, 1.964599609375, 2.0482177734375, 2.1318359375, 2.2154541015625, 2.299072265625, 2.3826904296875, 2.46630859375, 2.5499267578125, 2.633544921875, 2.7171630859375, 2.80078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 17.0, 31.0, 20.0, 20.0, 36.0, 24.0, 37.0, 29.0, 35.0, 34.0, 39.0, 42.0, 43.0, 43.0, 55.0, 55.0, 39.0, 52.0, 33.0, 42.0, 29.0, 28.0, 32.0, 25.0, 25.0, 25.0, 9.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0], "bins": [-4.734375, -4.611480712890625, -4.48858642578125, -4.365692138671875, -4.2427978515625, -4.119903564453125, -3.99700927734375, -3.874114990234375, -3.751220703125, -3.628326416015625, -3.50543212890625, -3.382537841796875, -3.2596435546875, -3.136749267578125, -3.01385498046875, -2.890960693359375, -2.76806640625, -2.645172119140625, -2.52227783203125, -2.399383544921875, -2.2764892578125, -2.153594970703125, -2.03070068359375, -1.907806396484375, -1.784912109375, -1.662017822265625, -1.53912353515625, -1.416229248046875, -1.2933349609375, -1.170440673828125, -1.04754638671875, -0.924652099609375, -0.8017578125, -0.678863525390625, -0.55596923828125, -0.433074951171875, -0.3101806640625, -0.187286376953125, -0.06439208984375, 0.058502197265625, 0.181396484375, 0.304290771484375, 0.42718505859375, 0.550079345703125, 0.6729736328125, 0.795867919921875, 0.91876220703125, 1.041656494140625, 1.16455078125, 1.287445068359375, 1.41033935546875, 1.533233642578125, 1.6561279296875, 1.779022216796875, 1.90191650390625, 2.024810791015625, 2.147705078125, 2.270599365234375, 2.39349365234375, 2.516387939453125, 2.6392822265625, 2.762176513671875, 2.88507080078125, 3.007965087890625, 3.130859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 14.0, 17.0, 31.0, 35.0, 62.0, 93.0, 150.0, 303.0, 522.0, 1226.0, 2982.0, 8955.0, 36460.0, 327064.0, 590653.0, 60423.0, 12429.0, 3998.0, 1610.0, 722.0, 342.0, 164.0, 114.0, 54.0, 26.0, 29.0, 24.0, 10.0, 8.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.340484619140625, -2.24737548828125, -2.154266357421875, -2.0611572265625, -1.968048095703125, -1.87493896484375, -1.781829833984375, -1.688720703125, -1.595611572265625, -1.50250244140625, -1.409393310546875, -1.3162841796875, -1.223175048828125, -1.13006591796875, -1.036956787109375, -0.94384765625, -0.850738525390625, -0.75762939453125, -0.664520263671875, -0.5714111328125, -0.478302001953125, -0.38519287109375, -0.292083740234375, -0.198974609375, -0.105865478515625, -0.01275634765625, 0.080352783203125, 0.1734619140625, 0.266571044921875, 0.35968017578125, 0.452789306640625, 0.5458984375, 0.639007568359375, 0.73211669921875, 0.825225830078125, 0.9183349609375, 1.011444091796875, 1.10455322265625, 1.197662353515625, 1.290771484375, 1.383880615234375, 1.47698974609375, 1.570098876953125, 1.6632080078125, 1.756317138671875, 1.84942626953125, 1.942535400390625, 2.03564453125, 2.128753662109375, 2.22186279296875, 2.314971923828125, 2.4080810546875, 2.501190185546875, 2.59429931640625, 2.687408447265625, 2.780517578125, 2.873626708984375, 2.96673583984375, 3.059844970703125, 3.1529541015625, 3.246063232421875, 3.33917236328125, 3.432281494140625, 3.525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 5.0, 11.0, 15.0, 23.0, 28.0, 39.0, 52.0, 62.0, 79.0, 68.0, 94.0, 91.0, 86.0, 60.0, 61.0, 41.0, 36.0, 40.0, 23.0, 14.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011790171265602112, -0.00011301785707473755, -0.00010813400149345398, -0.00010325014591217041, -9.836629033088684e-05, -9.348243474960327e-05, -8.85985791683197e-05, -8.371472358703613e-05, -7.883086800575256e-05, -7.3947012424469e-05, -6.906315684318542e-05, -6.417930126190186e-05, -5.9295445680618286e-05, -5.441159009933472e-05, -4.952773451805115e-05, -4.464387893676758e-05, -3.976002335548401e-05, -3.487616777420044e-05, -2.999231219291687e-05, -2.51084566116333e-05, -2.022460103034973e-05, -1.5340745449066162e-05, -1.0456889867782593e-05, -5.5730342864990234e-06, -6.891787052154541e-07, 4.194676876068115e-06, 9.078532457351685e-06, 1.3962388038635254e-05, 1.8846243619918823e-05, 2.3730099201202393e-05, 2.8613954782485962e-05, 3.349781036376953e-05, 3.83816659450531e-05, 4.326552152633667e-05, 4.814937710762024e-05, 5.303323268890381e-05, 5.791708827018738e-05, 6.280094385147095e-05, 6.768479943275452e-05, 7.256865501403809e-05, 7.745251059532166e-05, 8.233636617660522e-05, 8.72202217578888e-05, 9.210407733917236e-05, 9.698793292045593e-05, 0.0001018717885017395, 0.00010675564408302307, 0.00011163949966430664, 0.00011652335524559021, 0.00012140721082687378, 0.00012629106640815735, 0.00013117492198944092, 0.0001360587775707245, 0.00014094263315200806, 0.00014582648873329163, 0.0001507103443145752, 0.00015559419989585876, 0.00016047805547714233, 0.0001653619110584259, 0.00017024576663970947, 0.00017512962222099304, 0.0001800134778022766, 0.00018489733338356018, 0.00018978118896484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 16.0, 12.0, 24.0, 31.0, 64.0, 113.0, 197.0, 446.0, 1017.0, 2667.0, 9912.0, 73714.0, 773111.0, 164765.0, 16152.0, 3893.0, 1268.0, 544.0, 257.0, 142.0, 81.0, 46.0, 30.0, 12.0, 10.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.593963623046875, -4.46136474609375, -4.328765869140625, -4.1961669921875, -4.063568115234375, -3.93096923828125, -3.798370361328125, -3.665771484375, -3.533172607421875, -3.40057373046875, -3.267974853515625, -3.1353759765625, -3.002777099609375, -2.87017822265625, -2.737579345703125, -2.60498046875, -2.472381591796875, -2.33978271484375, -2.207183837890625, -2.0745849609375, -1.941986083984375, -1.80938720703125, -1.676788330078125, -1.544189453125, -1.411590576171875, -1.27899169921875, -1.146392822265625, -1.0137939453125, -0.881195068359375, -0.74859619140625, -0.615997314453125, -0.4833984375, -0.350799560546875, -0.21820068359375, -0.085601806640625, 0.0469970703125, 0.179595947265625, 0.31219482421875, 0.444793701171875, 0.577392578125, 0.709991455078125, 0.84259033203125, 0.975189208984375, 1.1077880859375, 1.240386962890625, 1.37298583984375, 1.505584716796875, 1.63818359375, 1.770782470703125, 1.90338134765625, 2.035980224609375, 2.1685791015625, 2.301177978515625, 2.43377685546875, 2.566375732421875, 2.698974609375, 2.831573486328125, 2.96417236328125, 3.096771240234375, 3.2293701171875, 3.361968994140625, 3.49456787109375, 3.627166748046875, 3.759765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 11.0, 20.0, 23.0, 38.0, 43.0, 47.0, 76.0, 86.0, 86.0, 114.0, 104.0, 89.0, 62.0, 47.0, 38.0, 33.0, 17.0, 18.0, 11.0, 13.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.326080322265625, -2.26153564453125, -2.196990966796875, -2.1324462890625, -2.067901611328125, -2.00335693359375, -1.938812255859375, -1.874267578125, -1.809722900390625, -1.74517822265625, -1.680633544921875, -1.6160888671875, -1.551544189453125, -1.48699951171875, -1.422454833984375, -1.35791015625, -1.293365478515625, -1.22882080078125, -1.164276123046875, -1.0997314453125, -1.035186767578125, -0.97064208984375, -0.906097412109375, -0.841552734375, -0.777008056640625, -0.71246337890625, -0.647918701171875, -0.5833740234375, -0.518829345703125, -0.45428466796875, -0.389739990234375, -0.3251953125, -0.260650634765625, -0.19610595703125, -0.131561279296875, -0.0670166015625, -0.002471923828125, 0.06207275390625, 0.126617431640625, 0.191162109375, 0.255706787109375, 0.32025146484375, 0.384796142578125, 0.4493408203125, 0.513885498046875, 0.57843017578125, 0.642974853515625, 0.70751953125, 0.772064208984375, 0.83660888671875, 0.901153564453125, 0.9656982421875, 1.030242919921875, 1.09478759765625, 1.159332275390625, 1.223876953125, 1.288421630859375, 1.35296630859375, 1.417510986328125, 1.4820556640625, 1.546600341796875, 1.61114501953125, 1.675689697265625, 1.740234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 16.0, 52.0, 371.0, 491.0, 59.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.24732971191406, -120.71041107177734, -117.17349243164062, -113.63656616210938, -110.09964752197266, -106.56272888183594, -103.02580261230469, -99.48888397216797, -95.95196533203125, -92.41504669189453, -88.87812805175781, -85.34120178222656, -81.80428314208984, -78.26736450195312, -74.73043823242188, -71.19351959228516, -67.65660095214844, -64.11968231201172, -60.582759857177734, -57.04583740234375, -53.50891876220703, -49.97200012207031, -46.43507766723633, -42.898155212402344, -39.361236572265625, -35.824317932128906, -32.28739547729492, -28.75047492980957, -25.21355438232422, -21.676633834838867, -18.139713287353516, -14.602792739868164, -11.065872192382812, -7.528951644897461, -3.9920310974121094, -0.4551105499267578, 3.0818099975585938, 6.618730545043945, 10.155651092529297, 13.692571640014648, 17.2294921875, 20.76641273498535, 24.303333282470703, 27.840253829956055, 31.377174377441406, 34.914093017578125, 38.45101547241211, 41.987937927246094, 45.52485656738281, 49.06177520751953, 52.598697662353516, 56.1356201171875, 59.67253875732422, 63.20945739746094, 66.74638366699219, 70.2833023071289, 73.82022094726562, 77.35713958740234, 80.89405822753906, 84.43098449707031, 87.96790313720703, 91.50482177734375, 95.041748046875, 98.57866668701172, 102.11558532714844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 3.0, 7.0, 9.0, 12.0, 20.0, 29.0, 38.0, 64.0, 109.0, 123.0, 150.0, 117.0, 87.0, 72.0, 36.0, 16.0, 12.0, 12.0, 15.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.0882339477539, -61.97610855102539, -59.863983154296875, -57.751861572265625, -55.63973617553711, -53.527610778808594, -51.41548538208008, -49.30335998535156, -47.19123840332031, -45.0791130065918, -42.96698760986328, -40.85486602783203, -38.742740631103516, -36.630615234375, -34.518489837646484, -32.40636444091797, -30.294239044189453, -28.182113647460938, -26.069990158081055, -23.95786476135254, -21.845741271972656, -19.73361587524414, -17.621490478515625, -15.509366035461426, -13.397241592407227, -11.285117149353027, -9.172992706298828, -7.0608673095703125, -4.948742866516113, -2.836618423461914, -0.7244930267333984, 1.3876314163208008, 3.499755859375, 5.611880302429199, 7.724005222320557, 9.836130142211914, 11.948254585266113, 14.060379028320312, 16.172504425048828, 18.284629821777344, 20.396753311157227, 22.508878707885742, 24.621002197265625, 26.73312759399414, 28.845252990722656, 30.95737648010254, 33.06950378417969, 35.18162536621094, 37.29375076293945, 39.40587615966797, 41.518001556396484, 43.630126953125, 45.74224853515625, 47.854373931884766, 49.96649932861328, 52.0786247253418, 54.19075012207031, 56.30287551879883, 58.415000915527344, 60.527122497558594, 62.63924789428711, 64.75137329101562, 66.86349487304688, 68.97562408447266, 71.0877456665039]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 6.0, 10.0, 14.0, 23.0, 46.0, 46.0, 71.0, 98.0, 121.0, 202.0, 299.0, 429.0, 677.0, 1101.0, 1763.0, 3029.0, 5592.0, 12177.0, 35067.0, 3594586.0, 486835.0, 29786.0, 10367.0, 4822.0, 2644.0, 1499.0, 941.0, 588.0, 432.0, 298.0, 203.0, 148.0, 77.0, 71.0, 44.0, 37.0, 29.0, 23.0, 17.0, 8.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.87890625, -7.65972900390625, -7.4405517578125, -7.22137451171875, -7.002197265625, -6.78302001953125, -6.5638427734375, -6.34466552734375, -6.12548828125, -5.90631103515625, -5.6871337890625, -5.46795654296875, -5.248779296875, -5.02960205078125, -4.8104248046875, -4.59124755859375, -4.3720703125, -4.15289306640625, -3.9337158203125, -3.71453857421875, -3.495361328125, -3.27618408203125, -3.0570068359375, -2.83782958984375, -2.61865234375, -2.39947509765625, -2.1802978515625, -1.96112060546875, -1.741943359375, -1.52276611328125, -1.3035888671875, -1.08441162109375, -0.865234375, -0.64605712890625, -0.4268798828125, -0.20770263671875, 0.011474609375, 0.23065185546875, 0.4498291015625, 0.66900634765625, 0.88818359375, 1.10736083984375, 1.3265380859375, 1.54571533203125, 1.764892578125, 1.98406982421875, 2.2032470703125, 2.42242431640625, 2.6416015625, 2.86077880859375, 3.0799560546875, 3.29913330078125, 3.518310546875, 3.73748779296875, 3.9566650390625, 4.17584228515625, 4.39501953125, 4.61419677734375, 4.8333740234375, 5.05255126953125, 5.271728515625, 5.49090576171875, 5.7100830078125, 5.92926025390625, 6.1484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 16.0, 14.0, 9.0, 19.0, 22.0, 140.0, 357.0, 244.0, 61.0, 19.0, 12.0, 12.0, 7.0, 8.0, 9.0, 6.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6816787719726562, -0.6529083251953125, -0.6241378784179688, -0.595367431640625, -0.5665969848632812, -0.5378265380859375, -0.5090560913085938, -0.48028564453125, -0.45151519775390625, -0.4227447509765625, -0.39397430419921875, -0.365203857421875, -0.33643341064453125, -0.3076629638671875, -0.27889251708984375, -0.2501220703125, -0.22135162353515625, -0.1925811767578125, -0.16381072998046875, -0.135040283203125, -0.10626983642578125, -0.0774993896484375, -0.04872894287109375, -0.01995849609375, 0.00881195068359375, 0.0375823974609375, 0.06635284423828125, 0.095123291015625, 0.12389373779296875, 0.1526641845703125, 0.18143463134765625, 0.210205078125, 0.23897552490234375, 0.2677459716796875, 0.29651641845703125, 0.325286865234375, 0.35405731201171875, 0.3828277587890625, 0.41159820556640625, 0.44036865234375, 0.46913909912109375, 0.4979095458984375, 0.5266799926757812, 0.555450439453125, 0.5842208862304688, 0.6129913330078125, 0.6417617797851562, 0.6705322265625, 0.6993026733398438, 0.7280731201171875, 0.7568435668945312, 0.785614013671875, 0.8143844604492188, 0.8431549072265625, 0.8719253540039062, 0.90069580078125, 0.9294662475585938, 0.9582366943359375, 0.9870071411132812, 1.015777587890625, 1.0445480346679688, 1.0733184814453125, 1.1020889282226562, 1.130859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 7.0, 17.0, 25.0, 33.0, 51.0, 61.0, 138.0, 222.0, 448.0, 988.0, 2234.0, 5843.0, 17948.0, 84015.0, 3640573.0, 383782.0, 40267.0, 10724.0, 3909.0, 1570.0, 654.0, 361.0, 167.0, 90.0, 48.0, 36.0, 22.0, 12.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.59552001953125, -7.3707275390625, -7.14593505859375, -6.921142578125, -6.69635009765625, -6.4715576171875, -6.24676513671875, -6.02197265625, -5.79718017578125, -5.5723876953125, -5.34759521484375, -5.122802734375, -4.89801025390625, -4.6732177734375, -4.44842529296875, -4.2236328125, -3.99884033203125, -3.7740478515625, -3.54925537109375, -3.324462890625, -3.09967041015625, -2.8748779296875, -2.65008544921875, -2.42529296875, -2.20050048828125, -1.9757080078125, -1.75091552734375, -1.526123046875, -1.30133056640625, -1.0765380859375, -0.85174560546875, -0.626953125, -0.40216064453125, -0.1773681640625, 0.04742431640625, 0.272216796875, 0.49700927734375, 0.7218017578125, 0.94659423828125, 1.17138671875, 1.39617919921875, 1.6209716796875, 1.84576416015625, 2.070556640625, 2.29534912109375, 2.5201416015625, 2.74493408203125, 2.9697265625, 3.19451904296875, 3.4193115234375, 3.64410400390625, 3.868896484375, 4.09368896484375, 4.3184814453125, 4.54327392578125, 4.76806640625, 4.99285888671875, 5.2176513671875, 5.44244384765625, 5.667236328125, 5.89202880859375, 6.1168212890625, 6.34161376953125, 6.56640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 14.0, 18.0, 14.0, 19.0, 33.0, 59.0, 93.0, 178.0, 325.0, 2147.0, 615.0, 214.0, 134.0, 66.0, 37.0, 30.0, 24.0, 20.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2167816162109375, -1.184539794921875, -1.1522979736328125, -1.12005615234375, -1.0878143310546875, -1.055572509765625, -1.0233306884765625, -0.9910888671875, -0.9588470458984375, -0.926605224609375, -0.8943634033203125, -0.86212158203125, -0.8298797607421875, -0.797637939453125, -0.7653961181640625, -0.733154296875, -0.7009124755859375, -0.668670654296875, -0.6364288330078125, -0.60418701171875, -0.5719451904296875, -0.539703369140625, -0.5074615478515625, -0.4752197265625, -0.4429779052734375, -0.410736083984375, -0.3784942626953125, -0.34625244140625, -0.3140106201171875, -0.281768798828125, -0.2495269775390625, -0.21728515625, -0.1850433349609375, -0.152801513671875, -0.1205596923828125, -0.08831787109375, -0.0560760498046875, -0.023834228515625, 0.0084075927734375, 0.0406494140625, 0.0728912353515625, 0.105133056640625, 0.1373748779296875, 0.16961669921875, 0.2018585205078125, 0.234100341796875, 0.2663421630859375, 0.298583984375, 0.3308258056640625, 0.363067626953125, 0.3953094482421875, 0.42755126953125, 0.4597930908203125, 0.492034912109375, 0.5242767333984375, 0.5565185546875, 0.5887603759765625, 0.621002197265625, 0.6532440185546875, 0.68548583984375, 0.7177276611328125, 0.749969482421875, 0.7822113037109375, 0.814453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 48.0, 169.0, 450.0, 246.0, 56.0, 16.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.364155769348145, -9.9586820602417, -9.553208351135254, -9.147734642028809, -8.742260932922363, -8.336787223815918, -7.9313130378723145, -7.525839328765869, -7.120365619659424, -6.7148919105529785, -6.309418201446533, -5.90394401550293, -5.498470306396484, -5.092996597290039, -4.687522888183594, -4.282049179077148, -3.876575469970703, -3.471101760864258, -3.0656280517578125, -2.660154104232788, -2.2546803951263428, -1.8492066860198975, -1.443732738494873, -1.0382590293884277, -0.6327853202819824, -0.22731155157089233, 0.17816221714019775, 0.5836360454559326, 0.9891097545623779, 1.3945834636688232, 1.8000574111938477, 2.205531120300293, 2.611003875732422, 3.016477584838867, 3.4219512939453125, 3.827425241470337, 4.232898712158203, 4.638372421264648, 5.043846607208252, 5.449320316314697, 5.854794025421143, 6.260267734527588, 6.665741443634033, 7.071215629577637, 7.476689338684082, 7.882163047790527, 8.287636756896973, 8.693110466003418, 9.098584175109863, 9.504057884216309, 9.909531593322754, 10.3150053024292, 10.720479011535645, 11.12595272064209, 11.531427383422852, 11.936901092529297, 12.342374801635742, 12.747848510742188, 13.153322219848633, 13.558795928955078, 13.964269638061523, 14.369743347167969, 14.775217056274414, 15.18069076538086, 15.586164474487305]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 10.0, 8.0, 11.0, 16.0, 15.0, 34.0, 34.0, 34.0, 44.0, 63.0, 80.0, 65.0, 75.0, 68.0, 55.0, 79.0, 43.0, 58.0, 37.0, 28.0, 24.0, 25.0, 19.0, 16.0, 11.0, 9.0, 2.0, 4.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.959841251373291, -3.85481333732605, -3.7497856616973877, -3.6447577476501465, -3.5397298336029053, -3.434701919555664, -3.329674243927002, -3.2246463298797607, -3.1196184158325195, -3.0145905017852783, -2.909562826156616, -2.804534912109375, -2.699506998062134, -2.5944790840148926, -2.4894514083862305, -2.3844234943389893, -2.279395818710327, -2.174367904663086, -2.069340229034424, -1.9643123149871826, -1.8592844009399414, -1.7542566061019897, -1.649228811264038, -1.5442008972167969, -1.4391731023788452, -1.3341453075408936, -1.2291173934936523, -1.1240895986557007, -1.019061803817749, -0.9140338897705078, -0.8090060949325562, -0.7039782404899597, -0.5989501476287842, -0.49392229318618774, -0.3888944685459137, -0.28386664390563965, -0.1788387894630432, -0.07381093502044678, 0.031216859817504883, 0.13624471426010132, 0.24127256870269775, 0.3463004231452942, 0.45132824778556824, 0.5563560724258423, 0.6613839268684387, 0.7664117813110352, 0.8714395761489868, 0.9764674305915833, 1.0814952850341797, 1.1865230798721313, 1.2915509939193726, 1.3965787887573242, 1.5016067028045654, 1.606634497642517, 1.7116622924804688, 1.81669020652771, 1.9217180013656616, 2.0267457962036133, 2.1317737102508545, 2.2368016242980957, 2.341829299926758, 2.446857213973999, 2.5518851280212402, 2.6569128036499023, 2.7619407176971436]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 12.0, 8.0, 12.0, 16.0, 21.0, 24.0, 30.0, 46.0, 55.0, 94.0, 142.0, 164.0, 233.0, 374.0, 569.0, 936.0, 1510.0, 2494.0, 4326.0, 8399.0, 19191.0, 71619.0, 816896.0, 81192.0, 20206.0, 8621.0, 4401.0, 2520.0, 1565.0, 1001.0, 620.0, 359.0, 273.0, 193.0, 120.0, 93.0, 64.0, 38.0, 29.0, 28.0, 17.0, 13.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.9375, -4.79022216796875, -4.6429443359375, -4.49566650390625, -4.348388671875, -4.20111083984375, -4.0538330078125, -3.90655517578125, -3.75927734375, -3.61199951171875, -3.4647216796875, -3.31744384765625, -3.170166015625, -3.02288818359375, -2.8756103515625, -2.72833251953125, -2.5810546875, -2.43377685546875, -2.2864990234375, -2.13922119140625, -1.991943359375, -1.84466552734375, -1.6973876953125, -1.55010986328125, -1.40283203125, -1.25555419921875, -1.1082763671875, -0.96099853515625, -0.813720703125, -0.66644287109375, -0.5191650390625, -0.37188720703125, -0.224609375, -0.07733154296875, 0.0699462890625, 0.21722412109375, 0.364501953125, 0.51177978515625, 0.6590576171875, 0.80633544921875, 0.95361328125, 1.10089111328125, 1.2481689453125, 1.39544677734375, 1.542724609375, 1.69000244140625, 1.8372802734375, 1.98455810546875, 2.1318359375, 2.27911376953125, 2.4263916015625, 2.57366943359375, 2.720947265625, 2.86822509765625, 3.0155029296875, 3.16278076171875, 3.31005859375, 3.45733642578125, 3.6046142578125, 3.75189208984375, 3.899169921875, 4.04644775390625, 4.1937255859375, 4.34100341796875, 4.48828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 10.0, 3.0, 7.0, 18.0, 13.0, 27.0, 80.0, 221.0, 335.0, 161.0, 35.0, 19.0, 8.0, 11.0, 13.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7085494995117188, -0.6793060302734375, -0.6500625610351562, -0.620819091796875, -0.5915756225585938, -0.5623321533203125, -0.5330886840820312, -0.50384521484375, -0.47460174560546875, -0.4453582763671875, -0.41611480712890625, -0.386871337890625, -0.35762786865234375, -0.3283843994140625, -0.29914093017578125, -0.2698974609375, -0.24065399169921875, -0.2114105224609375, -0.18216705322265625, -0.152923583984375, -0.12368011474609375, -0.0944366455078125, -0.06519317626953125, -0.03594970703125, -0.00670623779296875, 0.0225372314453125, 0.05178070068359375, 0.081024169921875, 0.11026763916015625, 0.1395111083984375, 0.16875457763671875, 0.197998046875, 0.22724151611328125, 0.2564849853515625, 0.28572845458984375, 0.314971923828125, 0.34421539306640625, 0.3734588623046875, 0.40270233154296875, 0.43194580078125, 0.46118927001953125, 0.4904327392578125, 0.5196762084960938, 0.548919677734375, 0.5781631469726562, 0.6074066162109375, 0.6366500854492188, 0.6658935546875, 0.6951370239257812, 0.7243804931640625, 0.7536239624023438, 0.782867431640625, 0.8121109008789062, 0.8413543701171875, 0.8705978393554688, 0.89984130859375, 0.9290847778320312, 0.9583282470703125, 0.9875717163085938, 1.016815185546875, 1.0460586547851562, 1.0753021240234375, 1.1045455932617188, 1.1337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 11.0, 28.0, 39.0, 50.0, 93.0, 130.0, 266.0, 508.0, 1103.0, 2501.0, 6683.0, 23871.0, 171364.0, 706805.0, 109010.0, 17475.0, 4996.0, 1870.0, 804.0, 399.0, 209.0, 116.0, 74.0, 50.0, 24.0, 9.0, 13.0, 15.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.33843994140625, -4.2003173828125, -4.06219482421875, -3.924072265625, -3.78594970703125, -3.6478271484375, -3.50970458984375, -3.37158203125, -3.23345947265625, -3.0953369140625, -2.95721435546875, -2.819091796875, -2.68096923828125, -2.5428466796875, -2.40472412109375, -2.2666015625, -2.12847900390625, -1.9903564453125, -1.85223388671875, -1.714111328125, -1.57598876953125, -1.4378662109375, -1.29974365234375, -1.16162109375, -1.02349853515625, -0.8853759765625, -0.74725341796875, -0.609130859375, -0.47100830078125, -0.3328857421875, -0.19476318359375, -0.056640625, 0.08148193359375, 0.2196044921875, 0.35772705078125, 0.495849609375, 0.63397216796875, 0.7720947265625, 0.91021728515625, 1.04833984375, 1.18646240234375, 1.3245849609375, 1.46270751953125, 1.600830078125, 1.73895263671875, 1.8770751953125, 2.01519775390625, 2.1533203125, 2.29144287109375, 2.4295654296875, 2.56768798828125, 2.705810546875, 2.84393310546875, 2.9820556640625, 3.12017822265625, 3.25830078125, 3.39642333984375, 3.5345458984375, 3.67266845703125, 3.810791015625, 3.94891357421875, 4.0870361328125, 4.22515869140625, 4.36328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 10.0, 7.0, 17.0, 20.0, 29.0, 33.0, 30.0, 59.0, 46.0, 50.0, 54.0, 50.0, 56.0, 57.0, 49.0, 59.0, 57.0, 52.0, 55.0, 33.0, 38.0, 24.0, 20.0, 13.0, 17.0, 9.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.311767578125, -2.23095703125, -2.150146484375, -2.0693359375, -1.988525390625, -1.90771484375, -1.826904296875, -1.74609375, -1.665283203125, -1.58447265625, -1.503662109375, -1.4228515625, -1.342041015625, -1.26123046875, -1.180419921875, -1.099609375, -1.018798828125, -0.93798828125, -0.857177734375, -0.7763671875, -0.695556640625, -0.61474609375, -0.533935546875, -0.453125, -0.372314453125, -0.29150390625, -0.210693359375, -0.1298828125, -0.049072265625, 0.03173828125, 0.112548828125, 0.193359375, 0.274169921875, 0.35498046875, 0.435791015625, 0.5166015625, 0.597412109375, 0.67822265625, 0.759033203125, 0.83984375, 0.920654296875, 1.00146484375, 1.082275390625, 1.1630859375, 1.243896484375, 1.32470703125, 1.405517578125, 1.486328125, 1.567138671875, 1.64794921875, 1.728759765625, 1.8095703125, 1.890380859375, 1.97119140625, 2.052001953125, 2.1328125, 2.213623046875, 2.29443359375, 2.375244140625, 2.4560546875, 2.536865234375, 2.61767578125, 2.698486328125, 2.779296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 2.0, 4.0, 6.0, 13.0, 16.0, 27.0, 33.0, 42.0, 83.0, 96.0, 158.0, 200.0, 344.0, 504.0, 855.0, 1437.0, 2501.0, 5119.0, 10919.0, 28276.0, 93382.0, 376147.0, 382392.0, 94680.0, 28702.0, 11088.0, 5105.0, 2602.0, 1454.0, 860.0, 455.0, 328.0, 231.0, 145.0, 90.0, 72.0, 41.0, 30.0, 31.0, 22.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.865234375, -2.769744873046875, -2.67425537109375, -2.578765869140625, -2.4832763671875, -2.387786865234375, -2.29229736328125, -2.196807861328125, -2.101318359375, -2.005828857421875, -1.91033935546875, -1.814849853515625, -1.7193603515625, -1.623870849609375, -1.52838134765625, -1.432891845703125, -1.33740234375, -1.241912841796875, -1.14642333984375, -1.050933837890625, -0.9554443359375, -0.859954833984375, -0.76446533203125, -0.668975830078125, -0.573486328125, -0.477996826171875, -0.38250732421875, -0.287017822265625, -0.1915283203125, -0.096038818359375, -0.00054931640625, 0.094940185546875, 0.1904296875, 0.285919189453125, 0.38140869140625, 0.476898193359375, 0.5723876953125, 0.667877197265625, 0.76336669921875, 0.858856201171875, 0.954345703125, 1.049835205078125, 1.14532470703125, 1.240814208984375, 1.3363037109375, 1.431793212890625, 1.52728271484375, 1.622772216796875, 1.71826171875, 1.813751220703125, 1.90924072265625, 2.004730224609375, 2.1002197265625, 2.195709228515625, 2.29119873046875, 2.386688232421875, 2.482177734375, 2.577667236328125, 2.67315673828125, 2.768646240234375, 2.8641357421875, 2.959625244140625, 3.05511474609375, 3.150604248046875, 3.24609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 10.0, 15.0, 18.0, 32.0, 63.0, 120.0, 213.0, 187.0, 140.0, 76.0, 41.0, 24.0, 14.0, 9.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006275177001953125, -0.0006133057177066803, -0.0005990937352180481, -0.0005848817527294159, -0.0005706697702407837, -0.0005564577877521515, -0.0005422458052635193, -0.0005280338227748871, -0.0005138218402862549, -0.0004996098577976227, -0.0004853978753089905, -0.0004711858928203583, -0.0004569739103317261, -0.00044276192784309387, -0.00042854994535446167, -0.00041433796286582947, -0.00040012598037719727, -0.00038591399788856506, -0.00037170201539993286, -0.00035749003291130066, -0.00034327805042266846, -0.00032906606793403625, -0.00031485408544540405, -0.00030064210295677185, -0.00028643012046813965, -0.00027221813797950745, -0.00025800615549087524, -0.00024379417300224304, -0.00022958219051361084, -0.00021537020802497864, -0.00020115822553634644, -0.00018694624304771423, -0.00017273426055908203, -0.00015852227807044983, -0.00014431029558181763, -0.00013009831309318542, -0.00011588633060455322, -0.00010167434811592102, -8.746236562728882e-05, -7.325038313865662e-05, -5.9038400650024414e-05, -4.482641816139221e-05, -3.061443567276001e-05, -1.6402453184127808e-05, -2.1904706954956055e-06, 1.2021511793136597e-05, 2.62334942817688e-05, 4.0445476770401e-05, 5.46574592590332e-05, 6.88694417476654e-05, 8.308142423629761e-05, 9.729340672492981e-05, 0.00011150538921356201, 0.00012571737170219421, 0.00013992935419082642, 0.00015414133667945862, 0.00016835331916809082, 0.00018256530165672302, 0.00019677728414535522, 0.00021098926663398743, 0.00022520124912261963, 0.00023941323161125183, 0.00025362521409988403, 0.00026783719658851624, 0.00028204917907714844]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 6.0, 6.0, 9.0, 21.0, 24.0, 28.0, 27.0, 60.0, 98.0, 135.0, 220.0, 373.0, 653.0, 1156.0, 2226.0, 4661.0, 10747.0, 30802.0, 114591.0, 448379.0, 320218.0, 75375.0, 22356.0, 8429.0, 3635.0, 1818.0, 1024.0, 544.0, 312.0, 190.0, 119.0, 85.0, 53.0, 45.0, 30.0, 24.0, 16.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.2236328125, -3.119140625, -3.0146484375, -2.91015625, -2.8056640625, -2.701171875, -2.5966796875, -2.4921875, -2.3876953125, -2.283203125, -2.1787109375, -2.07421875, -1.9697265625, -1.865234375, -1.7607421875, -1.65625, -1.5517578125, -1.447265625, -1.3427734375, -1.23828125, -1.1337890625, -1.029296875, -0.9248046875, -0.8203125, -0.7158203125, -0.611328125, -0.5068359375, -0.40234375, -0.2978515625, -0.193359375, -0.0888671875, 0.015625, 0.1201171875, 0.224609375, 0.3291015625, 0.43359375, 0.5380859375, 0.642578125, 0.7470703125, 0.8515625, 0.9560546875, 1.060546875, 1.1650390625, 1.26953125, 1.3740234375, 1.478515625, 1.5830078125, 1.6875, 1.7919921875, 1.896484375, 2.0009765625, 2.10546875, 2.2099609375, 2.314453125, 2.4189453125, 2.5234375, 2.6279296875, 2.732421875, 2.8369140625, 2.94140625, 3.0458984375, 3.150390625, 3.2548828125, 3.359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 8.0, 11.0, 11.0, 9.0, 25.0, 19.0, 38.0, 43.0, 48.0, 59.0, 58.0, 97.0, 82.0, 70.0, 70.0, 54.0, 46.0, 47.0, 37.0, 35.0, 26.0, 21.0, 21.0, 9.0, 9.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.79913330078125, -1.7388916015625, -1.67864990234375, -1.618408203125, -1.55816650390625, -1.4979248046875, -1.43768310546875, -1.37744140625, -1.31719970703125, -1.2569580078125, -1.19671630859375, -1.136474609375, -1.07623291015625, -1.0159912109375, -0.95574951171875, -0.8955078125, -0.83526611328125, -0.7750244140625, -0.71478271484375, -0.654541015625, -0.59429931640625, -0.5340576171875, -0.47381591796875, -0.41357421875, -0.35333251953125, -0.2930908203125, -0.23284912109375, -0.172607421875, -0.11236572265625, -0.0521240234375, 0.00811767578125, 0.068359375, 0.12860107421875, 0.1888427734375, 0.24908447265625, 0.309326171875, 0.36956787109375, 0.4298095703125, 0.49005126953125, 0.55029296875, 0.61053466796875, 0.6707763671875, 0.73101806640625, 0.791259765625, 0.85150146484375, 0.9117431640625, 0.97198486328125, 1.0322265625, 1.09246826171875, 1.1527099609375, 1.21295166015625, 1.273193359375, 1.33343505859375, 1.3936767578125, 1.45391845703125, 1.51416015625, 1.57440185546875, 1.6346435546875, 1.69488525390625, 1.755126953125, 1.81536865234375, 1.8756103515625, 1.93585205078125, 1.99609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 24.0, 46.0, 92.0, 181.0, 258.0, 190.0, 110.0, 47.0, 24.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.348005294799805, -16.413665771484375, -15.479326248168945, -14.544986724853516, -13.610647201538086, -12.676307678222656, -11.741968154907227, -10.807628631591797, -9.873289108276367, -8.938949584960938, -8.004610061645508, -7.070270538330078, -6.135931015014648, -5.201591491699219, -4.267251968383789, -3.3329124450683594, -2.3985729217529297, -1.4642333984375, -0.5298938751220703, 0.4044456481933594, 1.338785171508789, 2.2731246948242188, 3.2074642181396484, 4.141803741455078, 5.076143264770508, 6.0104827880859375, 6.944822311401367, 7.879161834716797, 8.813501358032227, 9.747840881347656, 10.682180404663086, 11.616519927978516, 12.550857543945312, 13.485197067260742, 14.419536590576172, 15.353876113891602, 16.28821563720703, 17.22255516052246, 18.15689468383789, 19.09123420715332, 20.02557373046875, 20.95991325378418, 21.89425277709961, 22.82859230041504, 23.76293182373047, 24.6972713470459, 25.631610870361328, 26.565950393676758, 27.500289916992188, 28.434629440307617, 29.368968963623047, 30.303308486938477, 31.237648010253906, 32.17198944091797, 33.106327056884766, 34.04066467285156, 34.975006103515625, 35.90934753417969, 36.843685150146484, 37.77802276611328, 38.712364196777344, 39.646705627441406, 40.5810432434082, 41.515380859375, 42.44972229003906]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 12.0, 11.0, 11.0, 15.0, 22.0, 31.0, 34.0, 48.0, 43.0, 50.0, 63.0, 81.0, 68.0, 64.0, 69.0, 61.0, 57.0, 71.0, 40.0, 28.0, 26.0, 28.0, 13.0, 10.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.886821746826172, -17.308025360107422, -16.729228973388672, -16.150432586669922, -15.571636199951172, -14.992839813232422, -14.414044380187988, -13.835247993469238, -13.256451606750488, -12.677655220031738, -12.098858833312988, -11.520062446594238, -10.941267013549805, -10.362470626831055, -9.783674240112305, -9.204877853393555, -8.626081466674805, -8.047285079956055, -7.468488693237305, -6.889692783355713, -6.310896396636963, -5.732100009918213, -5.153304100036621, -4.574507713317871, -3.995711326599121, -3.416914939880371, -2.8381187915802, -2.2593226432800293, -1.6805262565612793, -1.1017298698425293, -0.5229337215423584, 0.0558624267578125, 0.6346588134765625, 1.213455080986023, 1.7922513484954834, 2.3710474967956543, 2.9498438835144043, 3.5286402702331543, 4.107436180114746, 4.686232566833496, 5.265028953552246, 5.843825340270996, 6.422621726989746, 7.001417636871338, 7.580214023590088, 8.15900993347168, 8.73780632019043, 9.31660270690918, 9.89539909362793, 10.47419548034668, 11.05299186706543, 11.63178825378418, 12.21058464050293, 12.78938102722168, 13.368176460266113, 13.946972846984863, 14.525769233703613, 15.104565620422363, 15.683362007141113, 16.262157440185547, 16.840953826904297, 17.419750213623047, 17.998546600341797, 18.577342987060547, 19.156139373779297]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 22.0, 21.0, 42.0, 51.0, 77.0, 100.0, 145.0, 225.0, 355.0, 448.0, 753.0, 1253.0, 2364.0, 4718.0, 11505.0, 45814.0, 3873722.0, 217062.0, 20971.0, 7079.0, 3088.0, 1709.0, 954.0, 607.0, 369.0, 256.0, 156.0, 111.0, 72.0, 65.0, 35.0, 22.0, 22.0, 12.0, 19.0, 6.0, 9.0, 3.0, 4.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9921875, -11.6370849609375, -11.281982421875, -10.9268798828125, -10.57177734375, -10.2166748046875, -9.861572265625, -9.5064697265625, -9.1513671875, -8.7962646484375, -8.441162109375, -8.0860595703125, -7.73095703125, -7.3758544921875, -7.020751953125, -6.6656494140625, -6.310546875, -5.9554443359375, -5.600341796875, -5.2452392578125, -4.89013671875, -4.5350341796875, -4.179931640625, -3.8248291015625, -3.4697265625, -3.1146240234375, -2.759521484375, -2.4044189453125, -2.04931640625, -1.6942138671875, -1.339111328125, -0.9840087890625, -0.62890625, -0.2738037109375, 0.081298828125, 0.4364013671875, 0.79150390625, 1.1466064453125, 1.501708984375, 1.8568115234375, 2.2119140625, 2.5670166015625, 2.922119140625, 3.2772216796875, 3.63232421875, 3.9874267578125, 4.342529296875, 4.6976318359375, 5.052734375, 5.4078369140625, 5.762939453125, 6.1180419921875, 6.47314453125, 6.8282470703125, 7.183349609375, 7.5384521484375, 7.8935546875, 8.2486572265625, 8.603759765625, 8.9588623046875, 9.31396484375, 9.6690673828125, 10.024169921875, 10.3792724609375, 10.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 11.0, 7.0, 18.0, 31.0, 54.0, 171.0, 287.0, 208.0, 101.0, 31.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7702255249023438, -0.7401580810546875, -0.7100906372070312, -0.680023193359375, -0.6499557495117188, -0.6198883056640625, -0.5898208618164062, -0.55975341796875, -0.5296859741210938, -0.4996185302734375, -0.46955108642578125, -0.439483642578125, -0.40941619873046875, -0.3793487548828125, -0.34928131103515625, -0.3192138671875, -0.28914642333984375, -0.2590789794921875, -0.22901153564453125, -0.198944091796875, -0.16887664794921875, -0.1388092041015625, -0.10874176025390625, -0.07867431640625, -0.04860687255859375, -0.0185394287109375, 0.01152801513671875, 0.041595458984375, 0.07166290283203125, 0.1017303466796875, 0.13179779052734375, 0.161865234375, 0.19193267822265625, 0.2220001220703125, 0.25206756591796875, 0.282135009765625, 0.31220245361328125, 0.3422698974609375, 0.37233734130859375, 0.40240478515625, 0.43247222900390625, 0.4625396728515625, 0.49260711669921875, 0.522674560546875, 0.5527420043945312, 0.5828094482421875, 0.6128768920898438, 0.6429443359375, 0.6730117797851562, 0.7030792236328125, 0.7331466674804688, 0.763214111328125, 0.7932815551757812, 0.8233489990234375, 0.8534164428710938, 0.88348388671875, 0.9135513305664062, 0.9436187744140625, 0.9736862182617188, 1.003753662109375, 1.0338211059570312, 1.0638885498046875, 1.0939559936523438, 1.1240234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 19.0, 34.0, 48.0, 86.0, 181.0, 335.0, 702.0, 1723.0, 4663.0, 15274.0, 63631.0, 653954.0, 3311489.0, 108230.0, 22858.0, 6786.0, 2382.0, 972.0, 400.0, 211.0, 118.0, 68.0, 36.0, 25.0, 10.0, 5.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.6072998046875, -8.339599609375, -8.0718994140625, -7.80419921875, -7.5364990234375, -7.268798828125, -7.0010986328125, -6.7333984375, -6.4656982421875, -6.197998046875, -5.9302978515625, -5.66259765625, -5.3948974609375, -5.127197265625, -4.8594970703125, -4.591796875, -4.3240966796875, -4.056396484375, -3.7886962890625, -3.52099609375, -3.2532958984375, -2.985595703125, -2.7178955078125, -2.4501953125, -2.1824951171875, -1.914794921875, -1.6470947265625, -1.37939453125, -1.1116943359375, -0.843994140625, -0.5762939453125, -0.30859375, -0.0408935546875, 0.226806640625, 0.4945068359375, 0.76220703125, 1.0299072265625, 1.297607421875, 1.5653076171875, 1.8330078125, 2.1007080078125, 2.368408203125, 2.6361083984375, 2.90380859375, 3.1715087890625, 3.439208984375, 3.7069091796875, 3.974609375, 4.2423095703125, 4.510009765625, 4.7777099609375, 5.04541015625, 5.3131103515625, 5.580810546875, 5.8485107421875, 6.1162109375, 6.3839111328125, 6.651611328125, 6.9193115234375, 7.18701171875, 7.4547119140625, 7.722412109375, 7.9901123046875, 8.2578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 7.0, 13.0, 20.0, 11.0, 25.0, 33.0, 50.0, 58.0, 112.0, 172.0, 293.0, 640.0, 1705.0, 383.0, 157.0, 111.0, 69.0, 45.0, 43.0, 27.0, 21.0, 11.0, 15.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.203125, -1.169891357421875, -1.13665771484375, -1.103424072265625, -1.0701904296875, -1.036956787109375, -1.00372314453125, -0.970489501953125, -0.937255859375, -0.904022216796875, -0.87078857421875, -0.837554931640625, -0.8043212890625, -0.771087646484375, -0.73785400390625, -0.704620361328125, -0.67138671875, -0.638153076171875, -0.60491943359375, -0.571685791015625, -0.5384521484375, -0.505218505859375, -0.47198486328125, -0.438751220703125, -0.405517578125, -0.372283935546875, -0.33905029296875, -0.305816650390625, -0.2725830078125, -0.239349365234375, -0.20611572265625, -0.172882080078125, -0.1396484375, -0.106414794921875, -0.07318115234375, -0.039947509765625, -0.0067138671875, 0.026519775390625, 0.05975341796875, 0.092987060546875, 0.126220703125, 0.159454345703125, 0.19268798828125, 0.225921630859375, 0.2591552734375, 0.292388916015625, 0.32562255859375, 0.358856201171875, 0.39208984375, 0.425323486328125, 0.45855712890625, 0.491790771484375, 0.5250244140625, 0.558258056640625, 0.59149169921875, 0.624725341796875, 0.657958984375, 0.691192626953125, 0.72442626953125, 0.757659912109375, 0.7908935546875, 0.824127197265625, 0.85736083984375, 0.890594482421875, 0.923828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 12.0, 30.0, 42.0, 113.0, 169.0, 245.0, 185.0, 96.0, 51.0, 26.0, 15.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.81429672241211, -16.46824836730957, -16.1221981048584, -15.776148796081543, -15.430099487304688, -15.084050178527832, -14.738000869750977, -14.391952514648438, -14.045902252197266, -13.69985294342041, -13.353803634643555, -13.0077543258667, -12.661705017089844, -12.315655708312988, -11.969606399536133, -11.623558044433594, -11.277508735656738, -10.931459426879883, -10.585410118103027, -10.239360809326172, -9.893311500549316, -9.547262191772461, -9.201213836669922, -8.85516357421875, -8.509115219116211, -8.163065910339355, -7.8170166015625, -7.4709672927856445, -7.124917984008789, -6.778868675231934, -6.432819843292236, -6.086770534515381, -5.740721702575684, -5.394672393798828, -5.048623085021973, -4.702573776245117, -4.356524467468262, -4.010475158691406, -3.664426326751709, -3.3183770179748535, -2.972327709197998, -2.6262784004211426, -2.280229091644287, -1.9341800212860107, -1.5881307125091553, -1.2420814037322998, -0.8960323333740234, -0.549983024597168, -0.2039337158203125, 0.1421155333518982, 0.4881647825241089, 0.8342139720916748, 1.1802632808685303, 1.5263125896453857, 1.872361660003662, 2.2184109687805176, 2.564460277557373, 2.9105095863342285, 3.256558895111084, 3.6026079654693604, 3.948657274246216, 4.294706344604492, 4.640755653381348, 4.986804962158203, 5.332854270935059]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 7.0, 6.0, 10.0, 14.0, 13.0, 14.0, 24.0, 21.0, 34.0, 28.0, 25.0, 27.0, 36.0, 40.0, 36.0, 47.0, 43.0, 34.0, 40.0, 35.0, 40.0, 46.0, 34.0, 34.0, 32.0, 42.0, 41.0, 23.0, 25.0, 20.0, 28.0, 14.0, 14.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2092902660369873, -3.1037561893463135, -2.9982218742370605, -2.8926877975463867, -2.787153720855713, -2.681619644165039, -2.5760855674743652, -2.4705512523651123, -2.3650171756744385, -2.2594830989837646, -2.1539487838745117, -2.048414707183838, -1.942880630493164, -1.8373465538024902, -1.7318123579025269, -1.6262781620025635, -1.5207440853118896, -1.4152100086212158, -1.3096758127212524, -1.204141616821289, -1.0986075401306152, -0.9930734038352966, -0.887539267539978, -0.7820051312446594, -0.6764709949493408, -0.5709368586540222, -0.4654027223587036, -0.359868586063385, -0.2543344497680664, -0.1488003134727478, -0.0432661771774292, 0.062267959117889404, 0.1678023338317871, 0.2733364701271057, 0.3788706064224243, 0.4844047427177429, 0.5899388790130615, 0.6954730153083801, 0.8010071516036987, 0.9065412878990173, 1.012075424194336, 1.1176095008850098, 1.2231436967849731, 1.3286778926849365, 1.4342119693756104, 1.5397460460662842, 1.6452802419662476, 1.750814437866211, 1.8563485145568848, 1.9618825912475586, 2.0674166679382324, 2.1729509830474854, 2.278485059738159, 2.384019136428833, 2.489553451538086, 2.5950875282287598, 2.7006216049194336, 2.8061556816101074, 2.9116897583007812, 3.017224073410034, 3.122758150100708, 3.228292226791382, 3.3338265419006348, 3.4393606185913086, 3.5448946952819824]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 13.0, 16.0, 19.0, 24.0, 31.0, 54.0, 73.0, 87.0, 109.0, 153.0, 238.0, 350.0, 523.0, 720.0, 1019.0, 1721.0, 2740.0, 5000.0, 10529.0, 28765.0, 145161.0, 653135.0, 145427.0, 28923.0, 10583.0, 5234.0, 2829.0, 1640.0, 1092.0, 681.0, 472.0, 340.0, 252.0, 166.0, 129.0, 90.0, 56.0, 38.0, 37.0, 22.0, 16.0, 13.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.953125, -5.76995849609375, -5.5867919921875, -5.40362548828125, -5.220458984375, -5.03729248046875, -4.8541259765625, -4.67095947265625, -4.48779296875, -4.30462646484375, -4.1214599609375, -3.93829345703125, -3.755126953125, -3.57196044921875, -3.3887939453125, -3.20562744140625, -3.0224609375, -2.83929443359375, -2.6561279296875, -2.47296142578125, -2.289794921875, -2.10662841796875, -1.9234619140625, -1.74029541015625, -1.55712890625, -1.37396240234375, -1.1907958984375, -1.00762939453125, -0.824462890625, -0.64129638671875, -0.4581298828125, -0.27496337890625, -0.091796875, 0.09136962890625, 0.2745361328125, 0.45770263671875, 0.640869140625, 0.82403564453125, 1.0072021484375, 1.19036865234375, 1.37353515625, 1.55670166015625, 1.7398681640625, 1.92303466796875, 2.106201171875, 2.28936767578125, 2.4725341796875, 2.65570068359375, 2.8388671875, 3.02203369140625, 3.2052001953125, 3.38836669921875, 3.571533203125, 3.75469970703125, 3.9378662109375, 4.12103271484375, 4.30419921875, 4.48736572265625, 4.6705322265625, 4.85369873046875, 5.036865234375, 5.22003173828125, 5.4031982421875, 5.58636474609375, 5.76953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 8.0, 23.0, 39.0, 100.0, 181.0, 232.0, 184.0, 106.0, 40.0, 22.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.771484375, -0.74224853515625, -0.7130126953125, -0.68377685546875, -0.654541015625, -0.62530517578125, -0.5960693359375, -0.56683349609375, -0.53759765625, -0.50836181640625, -0.4791259765625, -0.44989013671875, -0.420654296875, -0.39141845703125, -0.3621826171875, -0.33294677734375, -0.3037109375, -0.27447509765625, -0.2452392578125, -0.21600341796875, -0.186767578125, -0.15753173828125, -0.1282958984375, -0.09906005859375, -0.06982421875, -0.04058837890625, -0.0113525390625, 0.01788330078125, 0.047119140625, 0.07635498046875, 0.1055908203125, 0.13482666015625, 0.1640625, 0.19329833984375, 0.2225341796875, 0.25177001953125, 0.281005859375, 0.31024169921875, 0.3394775390625, 0.36871337890625, 0.39794921875, 0.42718505859375, 0.4564208984375, 0.48565673828125, 0.514892578125, 0.54412841796875, 0.5733642578125, 0.60260009765625, 0.6318359375, 0.66107177734375, 0.6903076171875, 0.71954345703125, 0.748779296875, 0.77801513671875, 0.8072509765625, 0.83648681640625, 0.86572265625, 0.89495849609375, 0.9241943359375, 0.95343017578125, 0.982666015625, 1.01190185546875, 1.0411376953125, 1.07037353515625, 1.099609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 2.0, 9.0, 9.0, 12.0, 15.0, 29.0, 34.0, 36.0, 81.0, 99.0, 124.0, 249.0, 370.0, 654.0, 1230.0, 2689.0, 6844.0, 21901.0, 87491.0, 390794.0, 407232.0, 93030.0, 22956.0, 6888.0, 2684.0, 1278.0, 681.0, 363.0, 239.0, 175.0, 93.0, 64.0, 48.0, 44.0, 25.0, 17.0, 12.0, 11.0, 9.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.48046875, -6.29541015625, -6.1103515625, -5.92529296875, -5.740234375, -5.55517578125, -5.3701171875, -5.18505859375, -5.0, -4.81494140625, -4.6298828125, -4.44482421875, -4.259765625, -4.07470703125, -3.8896484375, -3.70458984375, -3.51953125, -3.33447265625, -3.1494140625, -2.96435546875, -2.779296875, -2.59423828125, -2.4091796875, -2.22412109375, -2.0390625, -1.85400390625, -1.6689453125, -1.48388671875, -1.298828125, -1.11376953125, -0.9287109375, -0.74365234375, -0.55859375, -0.37353515625, -0.1884765625, -0.00341796875, 0.181640625, 0.36669921875, 0.5517578125, 0.73681640625, 0.921875, 1.10693359375, 1.2919921875, 1.47705078125, 1.662109375, 1.84716796875, 2.0322265625, 2.21728515625, 2.40234375, 2.58740234375, 2.7724609375, 2.95751953125, 3.142578125, 3.32763671875, 3.5126953125, 3.69775390625, 3.8828125, 4.06787109375, 4.2529296875, 4.43798828125, 4.623046875, 4.80810546875, 4.9931640625, 5.17822265625, 5.36328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 5.0, 13.0, 9.0, 19.0, 23.0, 13.0, 29.0, 29.0, 30.0, 38.0, 54.0, 45.0, 61.0, 51.0, 47.0, 39.0, 52.0, 53.0, 45.0, 42.0, 47.0, 39.0, 27.0, 19.0, 38.0, 18.0, 19.0, 16.0, 14.0, 8.0, 10.0, 4.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.95703125, -2.875640869140625, -2.79425048828125, -2.712860107421875, -2.6314697265625, -2.550079345703125, -2.46868896484375, -2.387298583984375, -2.305908203125, -2.224517822265625, -2.14312744140625, -2.061737060546875, -1.9803466796875, -1.898956298828125, -1.81756591796875, -1.736175537109375, -1.65478515625, -1.573394775390625, -1.49200439453125, -1.410614013671875, -1.3292236328125, -1.247833251953125, -1.16644287109375, -1.085052490234375, -1.003662109375, -0.922271728515625, -0.84088134765625, -0.759490966796875, -0.6781005859375, -0.596710205078125, -0.51531982421875, -0.433929443359375, -0.3525390625, -0.271148681640625, -0.18975830078125, -0.108367919921875, -0.0269775390625, 0.054412841796875, 0.13580322265625, 0.217193603515625, 0.298583984375, 0.379974365234375, 0.46136474609375, 0.542755126953125, 0.6241455078125, 0.705535888671875, 0.78692626953125, 0.868316650390625, 0.94970703125, 1.031097412109375, 1.11248779296875, 1.193878173828125, 1.2752685546875, 1.356658935546875, 1.43804931640625, 1.519439697265625, 1.600830078125, 1.682220458984375, 1.76361083984375, 1.845001220703125, 1.9263916015625, 2.007781982421875, 2.08917236328125, 2.170562744140625, 2.251953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 18.0, 21.0, 33.0, 59.0, 81.0, 131.0, 174.0, 293.0, 490.0, 840.0, 1589.0, 3063.0, 6688.0, 15785.0, 48731.0, 234242.0, 568875.0, 116137.0, 30152.0, 10957.0, 4837.0, 2325.0, 1213.0, 670.0, 405.0, 241.0, 155.0, 104.0, 62.0, 39.0, 32.0, 21.0, 19.0, 8.0, 12.0, 4.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.54296875, -6.36273193359375, -6.1824951171875, -6.00225830078125, -5.822021484375, -5.64178466796875, -5.4615478515625, -5.28131103515625, -5.10107421875, -4.92083740234375, -4.7406005859375, -4.56036376953125, -4.380126953125, -4.19989013671875, -4.0196533203125, -3.83941650390625, -3.6591796875, -3.47894287109375, -3.2987060546875, -3.11846923828125, -2.938232421875, -2.75799560546875, -2.5777587890625, -2.39752197265625, -2.21728515625, -2.03704833984375, -1.8568115234375, -1.67657470703125, -1.496337890625, -1.31610107421875, -1.1358642578125, -0.95562744140625, -0.775390625, -0.59515380859375, -0.4149169921875, -0.23468017578125, -0.054443359375, 0.12579345703125, 0.3060302734375, 0.48626708984375, 0.66650390625, 0.84674072265625, 1.0269775390625, 1.20721435546875, 1.387451171875, 1.56768798828125, 1.7479248046875, 1.92816162109375, 2.1083984375, 2.28863525390625, 2.4688720703125, 2.64910888671875, 2.829345703125, 3.00958251953125, 3.1898193359375, 3.37005615234375, 3.55029296875, 3.73052978515625, 3.9107666015625, 4.09100341796875, 4.271240234375, 4.45147705078125, 4.6317138671875, 4.81195068359375, 4.9921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 10.0, 20.0, 30.0, 47.0, 66.0, 125.0, 172.0, 162.0, 101.0, 57.0, 49.0, 41.0, 16.0, 21.0, 13.0, 7.0, 6.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000965118408203125, -0.0009358823299407959, -0.0009066462516784668, -0.0008774101734161377, -0.0008481740951538086, -0.0008189380168914795, -0.0007897019386291504, -0.0007604658603668213, -0.0007312297821044922, -0.0007019937038421631, -0.000672757625579834, -0.0006435215473175049, -0.0006142854690551758, -0.0005850493907928467, -0.0005558133125305176, -0.0005265772342681885, -0.0004973411560058594, -0.0004681050777435303, -0.00043886899948120117, -0.00040963292121887207, -0.00038039684295654297, -0.00035116076469421387, -0.00032192468643188477, -0.00029268860816955566, -0.00026345252990722656, -0.00023421645164489746, -0.00020498037338256836, -0.00017574429512023926, -0.00014650821685791016, -0.00011727213859558105, -8.803606033325195e-05, -5.879998207092285e-05, -2.956390380859375e-05, -3.2782554626464844e-07, 2.8908252716064453e-05, 5.8144330978393555e-05, 8.738040924072266e-05, 0.00011661648750305176, 0.00014585256576538086, 0.00017508864402770996, 0.00020432472229003906, 0.00023356080055236816, 0.00026279687881469727, 0.00029203295707702637, 0.00032126903533935547, 0.00035050511360168457, 0.00037974119186401367, 0.0004089772701263428, 0.0004382133483886719, 0.000467449426651001, 0.0004966855049133301, 0.0005259215831756592, 0.0005551576614379883, 0.0005843937397003174, 0.0006136298179626465, 0.0006428658962249756, 0.0006721019744873047, 0.0007013380527496338, 0.0007305741310119629, 0.000759810209274292, 0.0007890462875366211, 0.0008182823657989502, 0.0008475184440612793, 0.0008767545223236084, 0.0009059906005859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 11.0, 14.0, 15.0, 19.0, 21.0, 38.0, 64.0, 90.0, 105.0, 202.0, 323.0, 558.0, 1041.0, 2177.0, 4694.0, 12211.0, 41054.0, 301913.0, 593989.0, 62293.0, 16286.0, 5886.0, 2580.0, 1188.0, 711.0, 366.0, 233.0, 131.0, 79.0, 69.0, 52.0, 28.0, 35.0, 13.0, 13.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.947998046875, -7.70068359375, -7.453369140625, -7.2060546875, -6.958740234375, -6.71142578125, -6.464111328125, -6.216796875, -5.969482421875, -5.72216796875, -5.474853515625, -5.2275390625, -4.980224609375, -4.73291015625, -4.485595703125, -4.23828125, -3.990966796875, -3.74365234375, -3.496337890625, -3.2490234375, -3.001708984375, -2.75439453125, -2.507080078125, -2.259765625, -2.012451171875, -1.76513671875, -1.517822265625, -1.2705078125, -1.023193359375, -0.77587890625, -0.528564453125, -0.28125, -0.033935546875, 0.21337890625, 0.460693359375, 0.7080078125, 0.955322265625, 1.20263671875, 1.449951171875, 1.697265625, 1.944580078125, 2.19189453125, 2.439208984375, 2.6865234375, 2.933837890625, 3.18115234375, 3.428466796875, 3.67578125, 3.923095703125, 4.17041015625, 4.417724609375, 4.6650390625, 4.912353515625, 5.15966796875, 5.406982421875, 5.654296875, 5.901611328125, 6.14892578125, 6.396240234375, 6.6435546875, 6.890869140625, 7.13818359375, 7.385498046875, 7.6328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 13.0, 11.0, 14.0, 14.0, 22.0, 28.0, 26.0, 60.0, 86.0, 102.0, 126.0, 120.0, 94.0, 66.0, 33.0, 32.0, 23.0, 21.0, 14.0, 16.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.265625, -3.165283203125, -3.06494140625, -2.964599609375, -2.8642578125, -2.763916015625, -2.66357421875, -2.563232421875, -2.462890625, -2.362548828125, -2.26220703125, -2.161865234375, -2.0615234375, -1.961181640625, -1.86083984375, -1.760498046875, -1.66015625, -1.559814453125, -1.45947265625, -1.359130859375, -1.2587890625, -1.158447265625, -1.05810546875, -0.957763671875, -0.857421875, -0.757080078125, -0.65673828125, -0.556396484375, -0.4560546875, -0.355712890625, -0.25537109375, -0.155029296875, -0.0546875, 0.045654296875, 0.14599609375, 0.246337890625, 0.3466796875, 0.447021484375, 0.54736328125, 0.647705078125, 0.748046875, 0.848388671875, 0.94873046875, 1.049072265625, 1.1494140625, 1.249755859375, 1.35009765625, 1.450439453125, 1.55078125, 1.651123046875, 1.75146484375, 1.851806640625, 1.9521484375, 2.052490234375, 2.15283203125, 2.253173828125, 2.353515625, 2.453857421875, 2.55419921875, 2.654541015625, 2.7548828125, 2.855224609375, 2.95556640625, 3.055908203125, 3.15625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 9.0, 8.0, 13.0, 23.0, 56.0, 136.0, 213.0, 258.0, 169.0, 60.0, 34.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.481258392333984, -39.60136795043945, -37.721473693847656, -35.841583251953125, -33.961692810058594, -32.08180236816406, -30.201908111572266, -28.322017669677734, -26.44212532043457, -24.562232971191406, -22.682342529296875, -20.80245018005371, -18.922557830810547, -17.042667388916016, -15.162775039672852, -13.282883644104004, -11.402992248535156, -9.523100852966309, -7.643208980560303, -5.763317108154297, -3.883425712585449, -2.0035343170166016, -0.1236419677734375, 1.7562494277954102, 3.636140823364258, 5.5160322189331055, 7.395924091339111, 9.275815963745117, 11.155707359313965, 13.035598754882812, 14.915491104125977, 16.79538345336914, 18.675270080566406, 20.55516242980957, 22.4350528717041, 24.314945220947266, 26.194835662841797, 28.07472801208496, 29.954620361328125, 31.834510803222656, 33.71440124511719, 35.59429168701172, 37.474185943603516, 39.35407638549805, 41.23396682739258, 43.113861083984375, 44.993751525878906, 46.87364196777344, 48.753536224365234, 50.633426666259766, 52.51332092285156, 54.393211364746094, 56.273101806640625, 58.152992248535156, 60.03288650512695, 61.912776947021484, 63.79267120361328, 65.67256164550781, 67.55245208740234, 69.43234252929688, 71.31224060058594, 73.19213104248047, 75.072021484375, 76.95191192626953, 78.83180236816406]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 10.0, 12.0, 10.0, 27.0, 14.0, 31.0, 44.0, 42.0, 36.0, 37.0, 62.0, 59.0, 49.0, 62.0, 51.0, 62.0, 72.0, 49.0, 35.0, 39.0, 38.0, 30.0, 27.0, 18.0, 22.0, 9.0, 11.0, 13.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.923093795776367, -19.154081344604492, -18.385068893432617, -17.616056442260742, -16.847043991088867, -16.078033447265625, -15.309020042419434, -14.540008544921875, -13.77099609375, -13.001983642578125, -12.23297119140625, -11.463958740234375, -10.694947242736816, -9.925934791564941, -9.156922340393066, -8.387910842895508, -7.618897438049316, -6.849884986877441, -6.080873012542725, -5.31186056137085, -4.542848587036133, -3.773836135864258, -3.004823684692383, -2.235811710357666, -1.466799259185791, -0.6977869868278503, 0.07122528553009033, 0.8402376174926758, 1.6092498302459717, 2.3782620429992676, 3.1472744941711426, 3.9162864685058594, 4.685298919677734, 5.454311370849609, 6.223323345184326, 6.992335796356201, 7.761347770690918, 8.530360221862793, 9.299372673034668, 10.068384170532227, 10.837396621704102, 11.606409072875977, 12.375421524047852, 13.144433975219727, 13.913445472717285, 14.68245792388916, 15.451470375061035, 16.220481872558594, 16.98949432373047, 17.758506774902344, 18.52751922607422, 19.296531677246094, 20.06554412841797, 20.834556579589844, 21.60356903076172, 22.37257957458496, 23.14159393310547, 23.910606384277344, 24.67961883544922, 25.448631286621094, 26.21764373779297, 26.986656188964844, 27.75566864013672, 28.52467918395996, 29.293691635131836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 59.0, 103.0, 188.0, 462.0, 1393.0, 6387.0, 145844.0, 4020212.0, 16420.0, 2106.0, 592.0, 244.0, 111.0, 43.0, 25.0, 15.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.372314453125, -20.55712890625, -19.741943359375, -18.9267578125, -18.111572265625, -17.29638671875, -16.481201171875, -15.666015625, -14.850830078125, -14.03564453125, -13.220458984375, -12.4052734375, -11.590087890625, -10.77490234375, -9.959716796875, -9.14453125, -8.329345703125, -7.51416015625, -6.698974609375, -5.8837890625, -5.068603515625, -4.25341796875, -3.438232421875, -2.623046875, -1.807861328125, -0.99267578125, -0.177490234375, 0.6376953125, 1.452880859375, 2.26806640625, 3.083251953125, 3.8984375, 4.713623046875, 5.52880859375, 6.343994140625, 7.1591796875, 7.974365234375, 8.78955078125, 9.604736328125, 10.419921875, 11.235107421875, 12.05029296875, 12.865478515625, 13.6806640625, 14.495849609375, 15.31103515625, 16.126220703125, 16.94140625, 17.756591796875, 18.57177734375, 19.386962890625, 20.2021484375, 21.017333984375, 21.83251953125, 22.647705078125, 23.462890625, 24.278076171875, 25.09326171875, 25.908447265625, 26.7236328125, 27.538818359375, 28.35400390625, 29.169189453125, 29.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 10.0, 29.0, 54.0, 83.0, 153.0, 202.0, 184.0, 127.0, 57.0, 41.0, 21.0, 5.0, 5.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06781005859375, -1.0291748046875, -0.99053955078125, -0.951904296875, -0.91326904296875, -0.8746337890625, -0.83599853515625, -0.79736328125, -0.75872802734375, -0.7200927734375, -0.68145751953125, -0.642822265625, -0.60418701171875, -0.5655517578125, -0.52691650390625, -0.48828125, -0.44964599609375, -0.4110107421875, -0.37237548828125, -0.333740234375, -0.29510498046875, -0.2564697265625, -0.21783447265625, -0.17919921875, -0.14056396484375, -0.1019287109375, -0.06329345703125, -0.024658203125, 0.01397705078125, 0.0526123046875, 0.09124755859375, 0.1298828125, 0.16851806640625, 0.2071533203125, 0.24578857421875, 0.284423828125, 0.32305908203125, 0.3616943359375, 0.40032958984375, 0.43896484375, 0.47760009765625, 0.5162353515625, 0.55487060546875, 0.593505859375, 0.63214111328125, 0.6707763671875, 0.70941162109375, 0.748046875, 0.78668212890625, 0.8253173828125, 0.86395263671875, 0.902587890625, 0.94122314453125, 0.9798583984375, 1.01849365234375, 1.05712890625, 1.09576416015625, 1.1343994140625, 1.17303466796875, 1.211669921875, 1.25030517578125, 1.2889404296875, 1.32757568359375, 1.3662109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 14.0, 15.0, 24.0, 31.0, 47.0, 92.0, 122.0, 252.0, 467.0, 893.0, 2000.0, 5125.0, 14209.0, 49329.0, 265451.0, 3451968.0, 322015.0, 56395.0, 16041.0, 5547.0, 2209.0, 960.0, 484.0, 240.0, 127.0, 90.0, 41.0, 38.0, 22.0, 17.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.6640625, -8.43328857421875, -8.2025146484375, -7.97174072265625, -7.740966796875, -7.51019287109375, -7.2794189453125, -7.04864501953125, -6.81787109375, -6.58709716796875, -6.3563232421875, -6.12554931640625, -5.894775390625, -5.66400146484375, -5.4332275390625, -5.20245361328125, -4.9716796875, -4.74090576171875, -4.5101318359375, -4.27935791015625, -4.048583984375, -3.81781005859375, -3.5870361328125, -3.35626220703125, -3.12548828125, -2.89471435546875, -2.6639404296875, -2.43316650390625, -2.202392578125, -1.97161865234375, -1.7408447265625, -1.51007080078125, -1.279296875, -1.04852294921875, -0.8177490234375, -0.58697509765625, -0.356201171875, -0.12542724609375, 0.1053466796875, 0.33612060546875, 0.56689453125, 0.79766845703125, 1.0284423828125, 1.25921630859375, 1.489990234375, 1.72076416015625, 1.9515380859375, 2.18231201171875, 2.4130859375, 2.64385986328125, 2.8746337890625, 3.10540771484375, 3.336181640625, 3.56695556640625, 3.7977294921875, 4.02850341796875, 4.25927734375, 4.49005126953125, 4.7208251953125, 4.95159912109375, 5.182373046875, 5.41314697265625, 5.6439208984375, 5.87469482421875, 6.10546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 12.0, 11.0, 13.0, 15.0, 36.0, 44.0, 74.0, 84.0, 132.0, 222.0, 452.0, 1610.0, 575.0, 288.0, 141.0, 102.0, 58.0, 48.0, 31.0, 31.0, 14.0, 11.0, 15.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5686492919921875, -1.526947021484375, -1.4852447509765625, -1.44354248046875, -1.4018402099609375, -1.360137939453125, -1.3184356689453125, -1.2767333984375, -1.2350311279296875, -1.193328857421875, -1.1516265869140625, -1.10992431640625, -1.0682220458984375, -1.026519775390625, -0.9848175048828125, -0.943115234375, -0.9014129638671875, -0.859710693359375, -0.8180084228515625, -0.77630615234375, -0.7346038818359375, -0.692901611328125, -0.6511993408203125, -0.6094970703125, -0.5677947998046875, -0.526092529296875, -0.4843902587890625, -0.44268798828125, -0.4009857177734375, -0.359283447265625, -0.3175811767578125, -0.27587890625, -0.2341766357421875, -0.192474365234375, -0.1507720947265625, -0.10906982421875, -0.0673675537109375, -0.025665283203125, 0.0160369873046875, 0.0577392578125, 0.0994415283203125, 0.141143798828125, 0.1828460693359375, 0.22454833984375, 0.2662506103515625, 0.307952880859375, 0.3496551513671875, 0.391357421875, 0.4330596923828125, 0.474761962890625, 0.5164642333984375, 0.55816650390625, 0.5998687744140625, 0.641571044921875, 0.6832733154296875, 0.7249755859375, 0.7666778564453125, 0.808380126953125, 0.8500823974609375, 0.89178466796875, 0.9334869384765625, 0.975189208984375, 1.0168914794921875, 1.05859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 8.0, 18.0, 30.0, 81.0, 100.0, 177.0, 197.0, 165.0, 104.0, 62.0, 28.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.885089874267578, -17.483036041259766, -17.080982208251953, -16.678926467895508, -16.276872634887695, -15.874818801879883, -15.47276496887207, -15.070710182189941, -14.668655395507812, -14.2666015625, -13.864546775817871, -13.462492942810059, -13.06043815612793, -12.658384323120117, -12.256330490112305, -11.854275703430176, -11.452221870422363, -11.05016803741455, -10.648113250732422, -10.24605941772461, -9.84400463104248, -9.441950798034668, -9.039896011352539, -8.637842178344727, -8.235788345336914, -7.833734035491943, -7.431679725646973, -7.02962589263916, -6.627571105957031, -6.225517272949219, -5.823462963104248, -5.421408653259277, -5.019352912902832, -4.617298603057861, -4.215244293212891, -3.813190221786499, -3.4111359119415283, -3.0090816020965576, -2.607027530670166, -2.2049732208251953, -1.8029189109802246, -1.400864601135254, -0.9988104104995728, -0.5967562198638916, -0.1947019100189209, 0.2073523998260498, 0.6094064712524414, 1.011460781097412, 1.4135150909423828, 1.8155694007873535, 2.217623710632324, 2.619677782058716, 3.0217320919036865, 3.4237864017486572, 3.825840473175049, 4.2278947830200195, 4.62994909286499, 5.032003402709961, 5.434057712554932, 5.836112022399902, 6.238165855407715, 6.640220642089844, 7.042274475097656, 7.444328784942627, 7.846383094787598]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 9.0, 6.0, 8.0, 14.0, 10.0, 12.0, 16.0, 18.0, 19.0, 26.0, 26.0, 22.0, 28.0, 29.0, 34.0, 35.0, 32.0, 37.0, 28.0, 38.0, 41.0, 39.0, 28.0, 39.0, 31.0, 26.0, 35.0, 34.0, 20.0, 24.0, 24.0, 32.0, 22.0, 23.0, 20.0, 14.0, 20.0, 14.0, 7.0, 5.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.4001901149749756, -3.2787041664123535, -3.1572182178497314, -3.0357322692871094, -2.914246082305908, -2.792760133743286, -2.671274185180664, -2.549788236618042, -2.42830228805542, -2.306816339492798, -2.185330390930176, -2.0638442039489746, -1.9423582553863525, -1.8208723068237305, -1.6993863582611084, -1.5779004096984863, -1.4564142227172852, -1.334928274154663, -1.2134422063827515, -1.0919562578201294, -0.9704702496528625, -0.8489842414855957, -0.7274982929229736, -0.6060122847557068, -0.48452627658843994, -0.3630402684211731, -0.24155429005622864, -0.12006831169128418, 0.001417696475982666, 0.12290370464324951, 0.24438965320587158, 0.3658756613731384, 0.4873619079589844, 0.6088479161262512, 0.7303339242935181, 0.8518198728561401, 0.973305881023407, 1.0947918891906738, 1.216277837753296, 1.337763786315918, 1.4592498540878296, 1.5807358026504517, 1.7022218704223633, 1.8237078189849854, 1.9451937675476074, 2.0666799545288086, 2.1881656646728516, 2.3096518516540527, 2.431137800216675, 2.552623748779297, 2.674109697341919, 2.795595645904541, 2.917081832885742, 3.0385677814483643, 3.1600537300109863, 3.2815396785736084, 3.4030256271362305, 3.5245115756988525, 3.6459975242614746, 3.767483711242676, 3.888969659805298, 4.01045560836792, 4.131941795349121, 4.253427505493164, 4.374913692474365]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 4.0, 12.0, 19.0, 17.0, 42.0, 46.0, 59.0, 111.0, 160.0, 237.0, 419.0, 680.0, 1180.0, 2105.0, 4493.0, 11510.0, 42890.0, 239968.0, 571687.0, 130760.0, 26437.0, 8082.0, 3373.0, 1699.0, 1022.0, 603.0, 323.0, 178.0, 151.0, 80.0, 68.0, 48.0, 23.0, 15.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.86737060546875, -5.6527099609375, -5.43804931640625, -5.223388671875, -5.00872802734375, -4.7940673828125, -4.57940673828125, -4.36474609375, -4.15008544921875, -3.9354248046875, -3.72076416015625, -3.506103515625, -3.29144287109375, -3.0767822265625, -2.86212158203125, -2.6474609375, -2.43280029296875, -2.2181396484375, -2.00347900390625, -1.788818359375, -1.57415771484375, -1.3594970703125, -1.14483642578125, -0.93017578125, -0.71551513671875, -0.5008544921875, -0.28619384765625, -0.071533203125, 0.14312744140625, 0.3577880859375, 0.57244873046875, 0.787109375, 1.00177001953125, 1.2164306640625, 1.43109130859375, 1.645751953125, 1.86041259765625, 2.0750732421875, 2.28973388671875, 2.50439453125, 2.71905517578125, 2.9337158203125, 3.14837646484375, 3.363037109375, 3.57769775390625, 3.7923583984375, 4.00701904296875, 4.2216796875, 4.43634033203125, 4.6510009765625, 4.86566162109375, 5.080322265625, 5.29498291015625, 5.5096435546875, 5.72430419921875, 5.93896484375, 6.15362548828125, 6.3682861328125, 6.58294677734375, 6.797607421875, 7.01226806640625, 7.2269287109375, 7.44158935546875, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 7.0, 11.0, 14.0, 28.0, 42.0, 75.0, 129.0, 152.0, 188.0, 125.0, 113.0, 53.0, 31.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0396575927734375, -1.001190185546875, -0.9627227783203125, -0.92425537109375, -0.8857879638671875, -0.847320556640625, -0.8088531494140625, -0.7703857421875, -0.7319183349609375, -0.693450927734375, -0.6549835205078125, -0.61651611328125, -0.5780487060546875, -0.539581298828125, -0.5011138916015625, -0.462646484375, -0.4241790771484375, -0.385711669921875, -0.3472442626953125, -0.30877685546875, -0.2703094482421875, -0.231842041015625, -0.1933746337890625, -0.1549072265625, -0.1164398193359375, -0.077972412109375, -0.0395050048828125, -0.00103759765625, 0.0374298095703125, 0.075897216796875, 0.1143646240234375, 0.15283203125, 0.1912994384765625, 0.229766845703125, 0.2682342529296875, 0.30670166015625, 0.3451690673828125, 0.383636474609375, 0.4221038818359375, 0.4605712890625, 0.4990386962890625, 0.537506103515625, 0.5759735107421875, 0.61444091796875, 0.6529083251953125, 0.691375732421875, 0.7298431396484375, 0.768310546875, 0.8067779541015625, 0.845245361328125, 0.8837127685546875, 0.92218017578125, 0.9606475830078125, 0.999114990234375, 1.0375823974609375, 1.0760498046875, 1.1145172119140625, 1.152984619140625, 1.1914520263671875, 1.22991943359375, 1.2683868408203125, 1.306854248046875, 1.3453216552734375, 1.3837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 15.0, 23.0, 38.0, 56.0, 86.0, 141.0, 256.0, 479.0, 903.0, 2403.0, 7191.0, 32804.0, 203136.0, 625222.0, 142090.0, 24083.0, 5758.0, 2002.0, 824.0, 404.0, 232.0, 134.0, 70.0, 65.0, 30.0, 18.0, 13.0, 11.0, 11.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70050048828125, -8.4400634765625, -8.17962646484375, -7.919189453125, -7.65875244140625, -7.3983154296875, -7.13787841796875, -6.87744140625, -6.61700439453125, -6.3565673828125, -6.09613037109375, -5.835693359375, -5.57525634765625, -5.3148193359375, -5.05438232421875, -4.7939453125, -4.53350830078125, -4.2730712890625, -4.01263427734375, -3.752197265625, -3.49176025390625, -3.2313232421875, -2.97088623046875, -2.71044921875, -2.45001220703125, -2.1895751953125, -1.92913818359375, -1.668701171875, -1.40826416015625, -1.1478271484375, -0.88739013671875, -0.626953125, -0.36651611328125, -0.1060791015625, 0.15435791015625, 0.414794921875, 0.67523193359375, 0.9356689453125, 1.19610595703125, 1.45654296875, 1.71697998046875, 1.9774169921875, 2.23785400390625, 2.498291015625, 2.75872802734375, 3.0191650390625, 3.27960205078125, 3.5400390625, 3.80047607421875, 4.0609130859375, 4.32135009765625, 4.581787109375, 4.84222412109375, 5.1026611328125, 5.36309814453125, 5.62353515625, 5.88397216796875, 6.1444091796875, 6.40484619140625, 6.665283203125, 6.92572021484375, 7.1861572265625, 7.44659423828125, 7.70703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 10.0, 7.0, 15.0, 15.0, 33.0, 34.0, 47.0, 40.0, 36.0, 45.0, 48.0, 62.0, 67.0, 67.0, 53.0, 53.0, 45.0, 46.0, 42.0, 31.0, 39.0, 28.0, 23.0, 14.0, 18.0, 14.0, 12.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.33526611328125, -3.2135009765625, -3.09173583984375, -2.969970703125, -2.84820556640625, -2.7264404296875, -2.60467529296875, -2.48291015625, -2.36114501953125, -2.2393798828125, -2.11761474609375, -1.995849609375, -1.87408447265625, -1.7523193359375, -1.63055419921875, -1.5087890625, -1.38702392578125, -1.2652587890625, -1.14349365234375, -1.021728515625, -0.89996337890625, -0.7781982421875, -0.65643310546875, -0.53466796875, -0.41290283203125, -0.2911376953125, -0.16937255859375, -0.047607421875, 0.07415771484375, 0.1959228515625, 0.31768798828125, 0.439453125, 0.56121826171875, 0.6829833984375, 0.80474853515625, 0.926513671875, 1.04827880859375, 1.1700439453125, 1.29180908203125, 1.41357421875, 1.53533935546875, 1.6571044921875, 1.77886962890625, 1.900634765625, 2.02239990234375, 2.1441650390625, 2.26593017578125, 2.3876953125, 2.50946044921875, 2.6312255859375, 2.75299072265625, 2.874755859375, 2.99652099609375, 3.1182861328125, 3.24005126953125, 3.36181640625, 3.48358154296875, 3.6053466796875, 3.72711181640625, 3.848876953125, 3.97064208984375, 4.0924072265625, 4.21417236328125, 4.3359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 11.0, 18.0, 26.0, 31.0, 44.0, 55.0, 80.0, 109.0, 189.0, 301.0, 474.0, 700.0, 1161.0, 2024.0, 3493.0, 6328.0, 11906.0, 25485.0, 59884.0, 169111.0, 423191.0, 211939.0, 72035.0, 29632.0, 13778.0, 7043.0, 3785.0, 2205.0, 1284.0, 780.0, 476.0, 283.0, 226.0, 134.0, 91.0, 77.0, 45.0, 30.0, 20.0, 17.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.00830078125, -2.9130859375, -2.81787109375, -2.72265625, -2.62744140625, -2.5322265625, -2.43701171875, -2.341796875, -2.24658203125, -2.1513671875, -2.05615234375, -1.9609375, -1.86572265625, -1.7705078125, -1.67529296875, -1.580078125, -1.48486328125, -1.3896484375, -1.29443359375, -1.19921875, -1.10400390625, -1.0087890625, -0.91357421875, -0.818359375, -0.72314453125, -0.6279296875, -0.53271484375, -0.4375, -0.34228515625, -0.2470703125, -0.15185546875, -0.056640625, 0.03857421875, 0.1337890625, 0.22900390625, 0.32421875, 0.41943359375, 0.5146484375, 0.60986328125, 0.705078125, 0.80029296875, 0.8955078125, 0.99072265625, 1.0859375, 1.18115234375, 1.2763671875, 1.37158203125, 1.466796875, 1.56201171875, 1.6572265625, 1.75244140625, 1.84765625, 1.94287109375, 2.0380859375, 2.13330078125, 2.228515625, 2.32373046875, 2.4189453125, 2.51416015625, 2.609375, 2.70458984375, 2.7998046875, 2.89501953125, 2.990234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 25.0, 23.0, 27.0, 56.0, 83.0, 98.0, 164.0, 130.0, 88.0, 56.0, 38.0, 31.0, 29.0, 23.0, 14.0, 16.0, 9.0, 11.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006909370422363281, -0.0006668046116828918, -0.0006426721811294556, -0.0006185397505760193, -0.000594407320022583, -0.0005702748894691467, -0.0005461424589157104, -0.0005220100283622742, -0.0004978775978088379, -0.0004737451672554016, -0.00044961273670196533, -0.00042548030614852905, -0.0004013478755950928, -0.0003772154450416565, -0.0003530830144882202, -0.00032895058393478394, -0.00030481815338134766, -0.0002806857228279114, -0.0002565532922744751, -0.00023242086172103882, -0.00020828843116760254, -0.00018415600061416626, -0.00016002357006072998, -0.0001358911395072937, -0.00011175870895385742, -8.762627840042114e-05, -6.349384784698486e-05, -3.9361417293548584e-05, -1.5228986740112305e-05, 8.903443813323975e-06, 3.3035874366760254e-05, 5.716830492019653e-05, 8.130073547363281e-05, 0.00010543316602706909, 0.00012956559658050537, 0.00015369802713394165, 0.00017783045768737793, 0.0002019628882408142, 0.0002260953187942505, 0.00025022774934768677, 0.00027436017990112305, 0.0002984926104545593, 0.0003226250410079956, 0.0003467574715614319, 0.00037088990211486816, 0.00039502233266830444, 0.0004191547632217407, 0.000443287193775177, 0.0004674196243286133, 0.0004915520548820496, 0.0005156844854354858, 0.0005398169159889221, 0.0005639493465423584, 0.0005880817770957947, 0.000612214207649231, 0.0006363466382026672, 0.0006604790687561035, 0.0006846114993095398, 0.0007087439298629761, 0.0007328763604164124, 0.0007570087909698486, 0.0007811412215232849, 0.0008052736520767212, 0.0008294060826301575, 0.0008535385131835938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 16.0, 25.0, 39.0, 41.0, 93.0, 160.0, 327.0, 676.0, 1715.0, 5229.0, 20304.0, 132743.0, 761225.0, 101652.0, 17079.0, 4424.0, 1496.0, 579.0, 292.0, 153.0, 77.0, 48.0, 32.0, 26.0, 18.0, 13.0, 5.0, 3.0, 4.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-9.0625, -8.79150390625, -8.5205078125, -8.24951171875, -7.978515625, -7.70751953125, -7.4365234375, -7.16552734375, -6.89453125, -6.62353515625, -6.3525390625, -6.08154296875, -5.810546875, -5.53955078125, -5.2685546875, -4.99755859375, -4.7265625, -4.45556640625, -4.1845703125, -3.91357421875, -3.642578125, -3.37158203125, -3.1005859375, -2.82958984375, -2.55859375, -2.28759765625, -2.0166015625, -1.74560546875, -1.474609375, -1.20361328125, -0.9326171875, -0.66162109375, -0.390625, -0.11962890625, 0.1513671875, 0.42236328125, 0.693359375, 0.96435546875, 1.2353515625, 1.50634765625, 1.77734375, 2.04833984375, 2.3193359375, 2.59033203125, 2.861328125, 3.13232421875, 3.4033203125, 3.67431640625, 3.9453125, 4.21630859375, 4.4873046875, 4.75830078125, 5.029296875, 5.30029296875, 5.5712890625, 5.84228515625, 6.11328125, 6.38427734375, 6.6552734375, 6.92626953125, 7.197265625, 7.46826171875, 7.7392578125, 8.01025390625, 8.28125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 10.0, 9.0, 19.0, 20.0, 16.0, 24.0, 32.0, 50.0, 82.0, 104.0, 135.0, 128.0, 99.0, 58.0, 42.0, 31.0, 32.0, 14.0, 17.0, 8.0, 8.0, 7.0, 5.0, 7.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.515625, -3.40191650390625, -3.2882080078125, -3.17449951171875, -3.060791015625, -2.94708251953125, -2.8333740234375, -2.71966552734375, -2.60595703125, -2.49224853515625, -2.3785400390625, -2.26483154296875, -2.151123046875, -2.03741455078125, -1.9237060546875, -1.80999755859375, -1.6962890625, -1.58258056640625, -1.4688720703125, -1.35516357421875, -1.241455078125, -1.12774658203125, -1.0140380859375, -0.90032958984375, -0.78662109375, -0.67291259765625, -0.5592041015625, -0.44549560546875, -0.331787109375, -0.21807861328125, -0.1043701171875, 0.00933837890625, 0.123046875, 0.23675537109375, 0.3504638671875, 0.46417236328125, 0.577880859375, 0.69158935546875, 0.8052978515625, 0.91900634765625, 1.03271484375, 1.14642333984375, 1.2601318359375, 1.37384033203125, 1.487548828125, 1.60125732421875, 1.7149658203125, 1.82867431640625, 1.9423828125, 2.05609130859375, 2.1697998046875, 2.28350830078125, 2.397216796875, 2.51092529296875, 2.6246337890625, 2.73834228515625, 2.85205078125, 2.96575927734375, 3.0794677734375, 3.19317626953125, 3.306884765625, 3.42059326171875, 3.5343017578125, 3.64801025390625, 3.76171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 20.0, 49.0, 117.0, 194.0, 278.0, 187.0, 90.0, 29.0, 16.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.77375411987305, -57.32360076904297, -54.87344741821289, -52.42329406738281, -49.97313690185547, -47.522987365722656, -45.07283020019531, -42.622676849365234, -40.172523498535156, -37.72237014770508, -35.272216796875, -32.82206344604492, -30.37190818786621, -27.921754837036133, -25.471599578857422, -23.021446228027344, -20.571292877197266, -18.121139526367188, -15.670985221862793, -13.220830917358398, -10.77067756652832, -8.320524215698242, -5.870369911193848, -3.420215606689453, -0.970062255859375, 1.4800915718078613, 3.9302453994750977, 6.380399227142334, 8.83055305480957, 11.280706405639648, 13.730860710144043, 16.181015014648438, 18.63116455078125, 21.081317901611328, 23.531471252441406, 25.981626510620117, 28.431779861450195, 30.881933212280273, 33.332088470458984, 35.78224182128906, 38.23239517211914, 40.68254852294922, 43.1327018737793, 45.582855224609375, 48.03301239013672, 50.48316192626953, 52.933319091796875, 55.38347244262695, 57.83362579345703, 60.28377914428711, 62.73393249511719, 65.18408966064453, 67.63423919677734, 70.08439636230469, 72.5345458984375, 74.98470306396484, 77.43486022949219, 79.88501739501953, 82.33516693115234, 84.78532409667969, 87.2354736328125, 89.68563079833984, 92.13578033447266, 94.5859375, 97.03608703613281]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 17.0, 18.0, 23.0, 13.0, 29.0, 35.0, 39.0, 35.0, 35.0, 43.0, 60.0, 58.0, 54.0, 45.0, 64.0, 51.0, 50.0, 46.0, 40.0, 37.0, 38.0, 36.0, 14.0, 27.0, 19.0, 12.0, 12.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.994770050048828, -28.134937286376953, -27.275104522705078, -26.415271759033203, -25.555437088012695, -24.69560432434082, -23.835771560668945, -22.97593879699707, -22.116104125976562, -21.256271362304688, -20.396438598632812, -19.536605834960938, -18.67677116394043, -17.816938400268555, -16.95710563659668, -16.097272872924805, -15.23744010925293, -14.377607345581055, -13.517773628234863, -12.657940864562988, -11.798107147216797, -10.938274383544922, -10.078441619873047, -9.218608856201172, -8.35877513885498, -7.498941898345947, -6.639108657836914, -5.779275894165039, -4.919442653656006, -4.059609413146973, -3.1997766494750977, -2.3399434089660645, -1.480112075805664, -0.6202789545059204, 0.23955416679382324, 1.0993871688842773, 1.9592204093933105, 2.8190536499023438, 3.6788864135742188, 4.538719654083252, 5.398552894592285, 6.258386135101318, 7.118219375610352, 7.978052139282227, 8.837884902954102, 9.697718620300293, 10.557551383972168, 11.41738510131836, 12.277217864990234, 13.13705062866211, 13.9968843460083, 14.856717109680176, 15.716550827026367, 16.576383590698242, 17.436216354370117, 18.296049118041992, 19.1558837890625, 20.015716552734375, 20.87554931640625, 21.735382080078125, 22.595216751098633, 23.455049514770508, 24.314882278442383, 25.174715042114258, 26.034547805786133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 16.0, 22.0, 58.0, 58.0, 118.0, 194.0, 324.0, 782.0, 1832.0, 5656.0, 27244.0, 626878.0, 3481757.0, 38190.0, 7131.0, 2134.0, 860.0, 436.0, 213.0, 108.0, 79.0, 49.0, 35.0, 20.0, 12.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.05926513671875, -6.7396240234375, -6.41998291015625, -6.100341796875, -5.78070068359375, -5.4610595703125, -5.14141845703125, -4.82177734375, -4.50213623046875, -4.1824951171875, -3.86285400390625, -3.543212890625, -3.22357177734375, -2.9039306640625, -2.58428955078125, -2.2646484375, -1.94500732421875, -1.6253662109375, -1.30572509765625, -0.986083984375, -0.66644287109375, -0.3468017578125, -0.02716064453125, 0.29248046875, 0.61212158203125, 0.9317626953125, 1.25140380859375, 1.571044921875, 1.89068603515625, 2.2103271484375, 2.52996826171875, 2.849609375, 3.16925048828125, 3.4888916015625, 3.80853271484375, 4.128173828125, 4.44781494140625, 4.7674560546875, 5.08709716796875, 5.40673828125, 5.72637939453125, 6.0460205078125, 6.36566162109375, 6.685302734375, 7.00494384765625, 7.3245849609375, 7.64422607421875, 7.9638671875, 8.28350830078125, 8.6031494140625, 8.92279052734375, 9.242431640625, 9.56207275390625, 9.8817138671875, 10.20135498046875, 10.52099609375, 10.84063720703125, 11.1602783203125, 11.47991943359375, 11.799560546875, 12.11920166015625, 12.4388427734375, 12.75848388671875, 13.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 16.0, 30.0, 46.0, 55.0, 95.0, 98.0, 138.0, 135.0, 111.0, 78.0, 72.0, 50.0, 25.0, 11.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.01593017578125, -0.9752197265625, -0.93450927734375, -0.893798828125, -0.85308837890625, -0.8123779296875, -0.77166748046875, -0.73095703125, -0.69024658203125, -0.6495361328125, -0.60882568359375, -0.568115234375, -0.52740478515625, -0.4866943359375, -0.44598388671875, -0.4052734375, -0.36456298828125, -0.3238525390625, -0.28314208984375, -0.242431640625, -0.20172119140625, -0.1610107421875, -0.12030029296875, -0.07958984375, -0.03887939453125, 0.0018310546875, 0.04254150390625, 0.083251953125, 0.12396240234375, 0.1646728515625, 0.20538330078125, 0.24609375, 0.28680419921875, 0.3275146484375, 0.36822509765625, 0.408935546875, 0.44964599609375, 0.4903564453125, 0.53106689453125, 0.57177734375, 0.61248779296875, 0.6531982421875, 0.69390869140625, 0.734619140625, 0.77532958984375, 0.8160400390625, 0.85675048828125, 0.8974609375, 0.93817138671875, 0.9788818359375, 1.01959228515625, 1.060302734375, 1.10101318359375, 1.1417236328125, 1.18243408203125, 1.22314453125, 1.26385498046875, 1.3045654296875, 1.34527587890625, 1.385986328125, 1.42669677734375, 1.4674072265625, 1.50811767578125, 1.548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 0.0, 7.0, 12.0, 25.0, 29.0, 42.0, 57.0, 98.0, 148.0, 222.0, 372.0, 648.0, 1113.0, 1958.0, 3672.0, 7020.0, 14395.0, 33207.0, 96828.0, 500747.0, 3151702.0, 266699.0, 66730.0, 24830.0, 11204.0, 5696.0, 2902.0, 1566.0, 906.0, 503.0, 319.0, 206.0, 140.0, 82.0, 45.0, 42.0, 34.0, 17.0, 14.0, 12.0, 14.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.18359375, -4.05010986328125, -3.9166259765625, -3.78314208984375, -3.649658203125, -3.51617431640625, -3.3826904296875, -3.24920654296875, -3.11572265625, -2.98223876953125, -2.8487548828125, -2.71527099609375, -2.581787109375, -2.44830322265625, -2.3148193359375, -2.18133544921875, -2.0478515625, -1.91436767578125, -1.7808837890625, -1.64739990234375, -1.513916015625, -1.38043212890625, -1.2469482421875, -1.11346435546875, -0.97998046875, -0.84649658203125, -0.7130126953125, -0.57952880859375, -0.446044921875, -0.31256103515625, -0.1790771484375, -0.04559326171875, 0.087890625, 0.22137451171875, 0.3548583984375, 0.48834228515625, 0.621826171875, 0.75531005859375, 0.8887939453125, 1.02227783203125, 1.15576171875, 1.28924560546875, 1.4227294921875, 1.55621337890625, 1.689697265625, 1.82318115234375, 1.9566650390625, 2.09014892578125, 2.2236328125, 2.35711669921875, 2.4906005859375, 2.62408447265625, 2.757568359375, 2.89105224609375, 3.0245361328125, 3.15802001953125, 3.29150390625, 3.42498779296875, 3.5584716796875, 3.69195556640625, 3.825439453125, 3.95892333984375, 4.0924072265625, 4.22589111328125, 4.359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 10.0, 8.0, 11.0, 16.0, 28.0, 34.0, 50.0, 67.0, 109.0, 158.0, 291.0, 731.0, 1479.0, 377.0, 212.0, 132.0, 80.0, 50.0, 57.0, 25.0, 19.0, 16.0, 14.0, 16.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9782867431640625, -0.940948486328125, -0.9036102294921875, -0.86627197265625, -0.8289337158203125, -0.791595458984375, -0.7542572021484375, -0.7169189453125, -0.6795806884765625, -0.642242431640625, -0.6049041748046875, -0.56756591796875, -0.5302276611328125, -0.492889404296875, -0.4555511474609375, -0.418212890625, -0.3808746337890625, -0.343536376953125, -0.3061981201171875, -0.26885986328125, -0.2315216064453125, -0.194183349609375, -0.1568450927734375, -0.1195068359375, -0.0821685791015625, -0.044830322265625, -0.0074920654296875, 0.02984619140625, 0.0671844482421875, 0.104522705078125, 0.1418609619140625, 0.17919921875, 0.2165374755859375, 0.253875732421875, 0.2912139892578125, 0.32855224609375, 0.3658905029296875, 0.403228759765625, 0.4405670166015625, 0.4779052734375, 0.5152435302734375, 0.552581787109375, 0.5899200439453125, 0.62725830078125, 0.6645965576171875, 0.701934814453125, 0.7392730712890625, 0.776611328125, 0.8139495849609375, 0.851287841796875, 0.8886260986328125, 0.92596435546875, 0.9633026123046875, 1.000640869140625, 1.0379791259765625, 1.0753173828125, 1.1126556396484375, 1.149993896484375, 1.1873321533203125, 1.22467041015625, 1.2620086669921875, 1.299346923828125, 1.3366851806640625, 1.3740234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 21.0, 19.0, 33.0, 67.0, 128.0, 181.0, 198.0, 145.0, 90.0, 53.0, 36.0, 14.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.241500854492188, -19.847503662109375, -19.45350456237793, -19.059507369995117, -18.665508270263672, -18.27151107788086, -17.877513885498047, -17.4835147857666, -17.08951759338379, -16.695520401000977, -16.30152130126953, -15.907524108886719, -15.51352596282959, -15.119527816772461, -14.725530624389648, -14.33153247833252, -13.93753433227539, -13.543536186218262, -13.149538040161133, -12.75554084777832, -12.361542701721191, -11.967544555664062, -11.57354736328125, -11.179549217224121, -10.785551071166992, -10.391552925109863, -9.997554779052734, -9.603557586669922, -9.209559440612793, -8.815561294555664, -8.421564102172852, -8.027565956115723, -7.633566856384277, -7.239568710327148, -6.845571041107178, -6.451573371887207, -6.057575225830078, -5.663577079772949, -5.2695794105529785, -4.875581741333008, -4.481583595275879, -4.08758544921875, -3.6935877799987793, -3.2995898723602295, -2.9055919647216797, -2.51159405708313, -2.11759614944458, -1.7235982418060303, -1.3296003341674805, -0.9356024265289307, -0.5416045188903809, -0.14760661125183105, 0.24639129638671875, 0.6403892040252686, 1.0343871116638184, 1.4283850193023682, 1.822382926940918, 2.2163808345794678, 2.6103787422180176, 3.0043766498565674, 3.398374557495117, 3.792372465133667, 4.186370372772217, 4.5803680419921875, 4.974366188049316]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 7.0, 6.0, 7.0, 7.0, 13.0, 9.0, 9.0, 13.0, 17.0, 25.0, 33.0, 25.0, 30.0, 35.0, 48.0, 49.0, 45.0, 45.0, 54.0, 41.0, 64.0, 50.0, 41.0, 37.0, 48.0, 28.0, 42.0, 25.0, 28.0, 18.0, 23.0, 20.0, 18.0, 7.0, 14.0, 6.0, 10.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.262031316757202, -3.100661277770996, -2.93929123878479, -2.777921199798584, -2.616550922393799, -2.455181121826172, -2.2938108444213867, -2.1324408054351807, -1.9710707664489746, -1.8097007274627686, -1.6483306884765625, -1.486960530281067, -1.3255904912948608, -1.1642204523086548, -1.0028502941131592, -0.8414802551269531, -0.6801102161407471, -0.518740177154541, -0.3573700785636902, -0.19600000977516174, -0.0346299409866333, 0.12674009799957275, 0.2881101965904236, 0.4494802951812744, 0.6108503341674805, 0.7722203731536865, 0.9335904717445374, 1.0949605703353882, 1.2563306093215942, 1.4177006483078003, 1.579070806503296, 1.740440845489502, 1.901810646057129, 2.063180685043335, 2.224550724029541, 2.385920763015747, 2.547290802001953, 2.7086610794067383, 2.8700311183929443, 3.0314011573791504, 3.1927711963653564, 3.3541412353515625, 3.5155112743377686, 3.6768813133239746, 3.8382515907287598, 3.9996213912963867, 4.160991668701172, 4.322361946105957, 4.483731746673584, 4.645102024078369, 4.806471824645996, 4.967842102050781, 5.129211902618408, 5.290582180023193, 5.45195198059082, 5.6133222579956055, 5.774692535400391, 5.936062812805176, 6.097432613372803, 6.258802890777588, 6.420172691345215, 6.58154296875, 6.742912769317627, 6.904283046722412, 7.065652847290039]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 9.0, 4.0, 6.0, 14.0, 21.0, 28.0, 36.0, 59.0, 66.0, 125.0, 157.0, 253.0, 430.0, 605.0, 1049.0, 1742.0, 3388.0, 7162.0, 17812.0, 50655.0, 161836.0, 431787.0, 249894.0, 75936.0, 25553.0, 9890.0, 4519.0, 2169.0, 1207.0, 745.0, 444.0, 291.0, 222.0, 117.0, 95.0, 71.0, 29.0, 29.0, 25.0, 11.0, 14.0, 10.0, 11.0, 4.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.8125, -4.66961669921875, -4.5267333984375, -4.38385009765625, -4.240966796875, -4.09808349609375, -3.9552001953125, -3.81231689453125, -3.66943359375, -3.52655029296875, -3.3836669921875, -3.24078369140625, -3.097900390625, -2.95501708984375, -2.8121337890625, -2.66925048828125, -2.5263671875, -2.38348388671875, -2.2406005859375, -2.09771728515625, -1.954833984375, -1.81195068359375, -1.6690673828125, -1.52618408203125, -1.38330078125, -1.24041748046875, -1.0975341796875, -0.95465087890625, -0.811767578125, -0.66888427734375, -0.5260009765625, -0.38311767578125, -0.240234375, -0.09735107421875, 0.0455322265625, 0.18841552734375, 0.331298828125, 0.47418212890625, 0.6170654296875, 0.75994873046875, 0.90283203125, 1.04571533203125, 1.1885986328125, 1.33148193359375, 1.474365234375, 1.61724853515625, 1.7601318359375, 1.90301513671875, 2.0458984375, 2.18878173828125, 2.3316650390625, 2.47454833984375, 2.617431640625, 2.76031494140625, 2.9031982421875, 3.04608154296875, 3.18896484375, 3.33184814453125, 3.4747314453125, 3.61761474609375, 3.760498046875, 3.90338134765625, 4.0462646484375, 4.18914794921875, 4.33203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 5.0, 10.0, 12.0, 25.0, 30.0, 69.0, 70.0, 91.0, 117.0, 131.0, 112.0, 94.0, 84.0, 55.0, 36.0, 31.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.062347412109375, -1.02215576171875, -0.981964111328125, -0.9417724609375, -0.901580810546875, -0.86138916015625, -0.821197509765625, -0.781005859375, -0.740814208984375, -0.70062255859375, -0.660430908203125, -0.6202392578125, -0.580047607421875, -0.53985595703125, -0.499664306640625, -0.45947265625, -0.419281005859375, -0.37908935546875, -0.338897705078125, -0.2987060546875, -0.258514404296875, -0.21832275390625, -0.178131103515625, -0.137939453125, -0.097747802734375, -0.05755615234375, -0.017364501953125, 0.0228271484375, 0.063018798828125, 0.10321044921875, 0.143402099609375, 0.18359375, 0.223785400390625, 0.26397705078125, 0.304168701171875, 0.3443603515625, 0.384552001953125, 0.42474365234375, 0.464935302734375, 0.505126953125, 0.545318603515625, 0.58551025390625, 0.625701904296875, 0.6658935546875, 0.706085205078125, 0.74627685546875, 0.786468505859375, 0.82666015625, 0.866851806640625, 0.90704345703125, 0.947235107421875, 0.9874267578125, 1.027618408203125, 1.06781005859375, 1.108001708984375, 1.148193359375, 1.188385009765625, 1.22857666015625, 1.268768310546875, 1.3089599609375, 1.349151611328125, 1.38934326171875, 1.429534912109375, 1.4697265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 1.0, 6.0, 4.0, 4.0, 11.0, 15.0, 25.0, 39.0, 40.0, 86.0, 137.0, 210.0, 366.0, 739.0, 1474.0, 3810.0, 12596.0, 52643.0, 259240.0, 532264.0, 142092.0, 29710.0, 7937.0, 2642.0, 1102.0, 556.0, 264.0, 178.0, 102.0, 80.0, 61.0, 30.0, 20.0, 18.0, 13.0, 10.0, 9.0, 1.0, 2.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.6798095703125, -5.492431640625, -5.3050537109375, -5.11767578125, -4.9302978515625, -4.742919921875, -4.5555419921875, -4.3681640625, -4.1807861328125, -3.993408203125, -3.8060302734375, -3.61865234375, -3.4312744140625, -3.243896484375, -3.0565185546875, -2.869140625, -2.6817626953125, -2.494384765625, -2.3070068359375, -2.11962890625, -1.9322509765625, -1.744873046875, -1.5574951171875, -1.3701171875, -1.1827392578125, -0.995361328125, -0.8079833984375, -0.62060546875, -0.4332275390625, -0.245849609375, -0.0584716796875, 0.12890625, 0.3162841796875, 0.503662109375, 0.6910400390625, 0.87841796875, 1.0657958984375, 1.253173828125, 1.4405517578125, 1.6279296875, 1.8153076171875, 2.002685546875, 2.1900634765625, 2.37744140625, 2.5648193359375, 2.752197265625, 2.9395751953125, 3.126953125, 3.3143310546875, 3.501708984375, 3.6890869140625, 3.87646484375, 4.0638427734375, 4.251220703125, 4.4385986328125, 4.6259765625, 4.8133544921875, 5.000732421875, 5.1881103515625, 5.37548828125, 5.5628662109375, 5.750244140625, 5.9376220703125, 6.125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 11.0, 9.0, 10.0, 15.0, 15.0, 29.0, 17.0, 32.0, 40.0, 39.0, 40.0, 50.0, 44.0, 34.0, 43.0, 44.0, 56.0, 48.0, 46.0, 34.0, 46.0, 37.0, 36.0, 36.0, 18.0, 22.0, 27.0, 19.0, 12.0, 19.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.604583740234375, -3.49237060546875, -3.380157470703125, -3.2679443359375, -3.155731201171875, -3.04351806640625, -2.931304931640625, -2.819091796875, -2.706878662109375, -2.59466552734375, -2.482452392578125, -2.3702392578125, -2.258026123046875, -2.14581298828125, -2.033599853515625, -1.92138671875, -1.809173583984375, -1.69696044921875, -1.584747314453125, -1.4725341796875, -1.360321044921875, -1.24810791015625, -1.135894775390625, -1.023681640625, -0.911468505859375, -0.79925537109375, -0.687042236328125, -0.5748291015625, -0.462615966796875, -0.35040283203125, -0.238189697265625, -0.1259765625, -0.013763427734375, 0.09844970703125, 0.210662841796875, 0.3228759765625, 0.435089111328125, 0.54730224609375, 0.659515380859375, 0.771728515625, 0.883941650390625, 0.99615478515625, 1.108367919921875, 1.2205810546875, 1.332794189453125, 1.44500732421875, 1.557220458984375, 1.66943359375, 1.781646728515625, 1.89385986328125, 2.006072998046875, 2.1182861328125, 2.230499267578125, 2.34271240234375, 2.454925537109375, 2.567138671875, 2.679351806640625, 2.79156494140625, 2.903778076171875, 3.0159912109375, 3.128204345703125, 3.24041748046875, 3.352630615234375, 3.46484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 9.0, 19.0, 41.0, 40.0, 68.0, 103.0, 179.0, 287.0, 505.0, 983.0, 1942.0, 3864.0, 9139.0, 21850.0, 61417.0, 198992.0, 431662.0, 211673.0, 64951.0, 23139.0, 9180.0, 4166.0, 1977.0, 974.0, 528.0, 315.0, 183.0, 110.0, 64.0, 55.0, 36.0, 18.0, 23.0, 13.0, 6.0, 10.0, 3.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.33258056640625, -2.2608642578125, -2.18914794921875, -2.117431640625, -2.04571533203125, -1.9739990234375, -1.90228271484375, -1.83056640625, -1.75885009765625, -1.6871337890625, -1.61541748046875, -1.543701171875, -1.47198486328125, -1.4002685546875, -1.32855224609375, -1.2568359375, -1.18511962890625, -1.1134033203125, -1.04168701171875, -0.969970703125, -0.89825439453125, -0.8265380859375, -0.75482177734375, -0.68310546875, -0.61138916015625, -0.5396728515625, -0.46795654296875, -0.396240234375, -0.32452392578125, -0.2528076171875, -0.18109130859375, -0.109375, -0.03765869140625, 0.0340576171875, 0.10577392578125, 0.177490234375, 0.24920654296875, 0.3209228515625, 0.39263916015625, 0.46435546875, 0.53607177734375, 0.6077880859375, 0.67950439453125, 0.751220703125, 0.82293701171875, 0.8946533203125, 0.96636962890625, 1.0380859375, 1.10980224609375, 1.1815185546875, 1.25323486328125, 1.324951171875, 1.39666748046875, 1.4683837890625, 1.54010009765625, 1.61181640625, 1.68353271484375, 1.7552490234375, 1.82696533203125, 1.898681640625, 1.97039794921875, 2.0421142578125, 2.11383056640625, 2.185546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 6.0, 11.0, 18.0, 14.0, 22.0, 18.0, 40.0, 40.0, 62.0, 83.0, 96.0, 142.0, 103.0, 86.0, 62.0, 43.0, 36.0, 20.0, 19.0, 15.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006465911865234375, -0.0006297975778579712, -0.0006130039691925049, -0.0005962103605270386, -0.0005794167518615723, -0.000562623143196106, -0.0005458295345306396, -0.0005290359258651733, -0.000512242317199707, -0.0004954487085342407, -0.0004786550998687744, -0.0004618614912033081, -0.0004450678825378418, -0.0004282742738723755, -0.0004114806652069092, -0.00039468705654144287, -0.00037789344787597656, -0.00036109983921051025, -0.00034430623054504395, -0.00032751262187957764, -0.00031071901321411133, -0.000293925404548645, -0.0002771317958831787, -0.0002603381872177124, -0.0002435445785522461, -0.00022675096988677979, -0.00020995736122131348, -0.00019316375255584717, -0.00017637014389038086, -0.00015957653522491455, -0.00014278292655944824, -0.00012598931789398193, -0.00010919570922851562, -9.240210056304932e-05, -7.560849189758301e-05, -5.88148832321167e-05, -4.202127456665039e-05, -2.5227665901184082e-05, -8.434057235717773e-06, 8.359551429748535e-06, 2.5153160095214844e-05, 4.194676876068115e-05, 5.874037742614746e-05, 7.553398609161377e-05, 9.232759475708008e-05, 0.00010912120342254639, 0.0001259148120880127, 0.000142708420753479, 0.0001595020294189453, 0.00017629563808441162, 0.00019308924674987793, 0.00020988285541534424, 0.00022667646408081055, 0.00024347007274627686, 0.00026026368141174316, 0.00027705729007720947, 0.0002938508987426758, 0.0003106445074081421, 0.0003274381160736084, 0.0003442317247390747, 0.000361025333404541, 0.0003778189420700073, 0.00039461255073547363, 0.00041140615940093994, 0.00042819976806640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 17.0, 26.0, 33.0, 81.0, 136.0, 283.0, 661.0, 1782.0, 6038.0, 29931.0, 266575.0, 653319.0, 72826.0, 12132.0, 2916.0, 952.0, 397.0, 175.0, 104.0, 55.0, 27.0, 20.0, 13.0, 9.0, 5.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4493408203125, -4.297119140625, -4.1448974609375, -3.99267578125, -3.8404541015625, -3.688232421875, -3.5360107421875, -3.3837890625, -3.2315673828125, -3.079345703125, -2.9271240234375, -2.77490234375, -2.6226806640625, -2.470458984375, -2.3182373046875, -2.166015625, -2.0137939453125, -1.861572265625, -1.7093505859375, -1.55712890625, -1.4049072265625, -1.252685546875, -1.1004638671875, -0.9482421875, -0.7960205078125, -0.643798828125, -0.4915771484375, -0.33935546875, -0.1871337890625, -0.034912109375, 0.1173095703125, 0.26953125, 0.4217529296875, 0.573974609375, 0.7261962890625, 0.87841796875, 1.0306396484375, 1.182861328125, 1.3350830078125, 1.4873046875, 1.6395263671875, 1.791748046875, 1.9439697265625, 2.09619140625, 2.2484130859375, 2.400634765625, 2.5528564453125, 2.705078125, 2.8572998046875, 3.009521484375, 3.1617431640625, 3.31396484375, 3.4661865234375, 3.618408203125, 3.7706298828125, 3.9228515625, 4.0750732421875, 4.227294921875, 4.3795166015625, 4.53173828125, 4.6839599609375, 4.836181640625, 4.9884033203125, 5.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 5.0, 8.0, 4.0, 10.0, 8.0, 10.0, 18.0, 20.0, 14.0, 23.0, 36.0, 46.0, 56.0, 59.0, 63.0, 81.0, 86.0, 67.0, 83.0, 55.0, 55.0, 41.0, 32.0, 30.0, 18.0, 14.0, 10.0, 15.0, 7.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6953125, -1.63916015625, -1.5830078125, -1.52685546875, -1.470703125, -1.41455078125, -1.3583984375, -1.30224609375, -1.24609375, -1.18994140625, -1.1337890625, -1.07763671875, -1.021484375, -0.96533203125, -0.9091796875, -0.85302734375, -0.796875, -0.74072265625, -0.6845703125, -0.62841796875, -0.572265625, -0.51611328125, -0.4599609375, -0.40380859375, -0.34765625, -0.29150390625, -0.2353515625, -0.17919921875, -0.123046875, -0.06689453125, -0.0107421875, 0.04541015625, 0.1015625, 0.15771484375, 0.2138671875, 0.27001953125, 0.326171875, 0.38232421875, 0.4384765625, 0.49462890625, 0.55078125, 0.60693359375, 0.6630859375, 0.71923828125, 0.775390625, 0.83154296875, 0.8876953125, 0.94384765625, 1.0, 1.05615234375, 1.1123046875, 1.16845703125, 1.224609375, 1.28076171875, 1.3369140625, 1.39306640625, 1.44921875, 1.50537109375, 1.5615234375, 1.61767578125, 1.673828125, 1.72998046875, 1.7861328125, 1.84228515625, 1.8984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 10.0, 25.0, 46.0, 86.0, 192.0, 213.0, 219.0, 107.0, 70.0, 21.0, 13.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.60674285888672, -48.90692901611328, -47.20711898803711, -45.50730514526367, -43.807491302490234, -42.10768127441406, -40.407867431640625, -38.70805358886719, -37.00823974609375, -35.30842590332031, -33.60861587524414, -31.908802032470703, -30.208988189697266, -28.50917625427246, -26.809364318847656, -25.10955047607422, -23.409740447998047, -21.709928512573242, -20.010114669799805, -18.310302734375, -16.610488891601562, -14.910676956176758, -13.210865020751953, -11.511052131652832, -9.811239242553711, -8.11142635345459, -6.411613941192627, -4.711801528930664, -3.011988639831543, -1.3121757507324219, 0.3876361846923828, 2.087449073791504, 3.7872581481933594, 5.4870710372924805, 7.186883449554443, 8.886695861816406, 10.586508750915527, 12.286321640014648, 13.986133575439453, 15.685946464538574, 17.385759353637695, 19.0855712890625, 20.785385131835938, 22.485197067260742, 24.185009002685547, 25.884822845458984, 27.58463478088379, 29.284446716308594, 30.98426055908203, 32.68407440185547, 34.38388442993164, 36.08369827270508, 37.783512115478516, 39.48332214355469, 41.183135986328125, 42.88294982910156, 44.582763671875, 46.28257751464844, 47.98238754272461, 49.68220138549805, 51.382015228271484, 53.081825256347656, 54.781639099121094, 56.48145294189453, 58.1812629699707]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 16.0, 16.0, 17.0, 28.0, 28.0, 34.0, 31.0, 49.0, 33.0, 40.0, 49.0, 51.0, 39.0, 40.0, 40.0, 35.0, 45.0, 32.0, 35.0, 28.0, 22.0, 30.0, 16.0, 28.0, 23.0, 18.0, 14.0, 15.0, 12.0, 9.0, 10.0, 5.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.762094497680664, -18.190765380859375, -17.61943817138672, -17.04810905456543, -16.47677993774414, -15.905450820922852, -15.334122657775879, -14.762794494628906, -14.191465377807617, -13.620136260986328, -13.048808097839355, -12.477479934692383, -11.906150817871094, -11.334821701049805, -10.763493537902832, -10.19216537475586, -9.62083625793457, -9.049507141113281, -8.478178977966309, -7.906850337982178, -7.335521697998047, -6.764193058013916, -6.192864418029785, -5.621535778045654, -5.050207138061523, -4.478878498077393, -3.9075498580932617, -3.336221218109131, -2.764892578125, -2.193563938140869, -1.6222352981567383, -1.0509066581726074, -0.47957611083984375, 0.09175252914428711, 0.663081169128418, 1.2344098091125488, 1.8057384490966797, 2.3770670890808105, 2.9483957290649414, 3.5197243690490723, 4.091053009033203, 4.662381649017334, 5.233710289001465, 5.805038928985596, 6.376367568969727, 6.947696208953857, 7.519024848937988, 8.090353012084961, 8.66168212890625, 9.233011245727539, 9.804339408874512, 10.375667572021484, 10.946996688842773, 11.518325805664062, 12.089653968811035, 12.660982131958008, 13.232311248779297, 13.803640365600586, 14.374968528747559, 14.946296691894531, 15.51762580871582, 16.08895492553711, 16.660282135009766, 17.231611251831055, 17.802940368652344]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 10.0, 5.0, 16.0, 18.0, 32.0, 58.0, 124.0, 172.0, 375.0, 849.0, 2433.0, 8437.0, 52844.0, 3877006.0, 226523.0, 18629.0, 4189.0, 1348.0, 567.0, 281.0, 147.0, 85.0, 49.0, 26.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.73583984375, -8.4091796875, -8.08251953125, -7.755859375, -7.42919921875, -7.1025390625, -6.77587890625, -6.44921875, -6.12255859375, -5.7958984375, -5.46923828125, -5.142578125, -4.81591796875, -4.4892578125, -4.16259765625, -3.8359375, -3.50927734375, -3.1826171875, -2.85595703125, -2.529296875, -2.20263671875, -1.8759765625, -1.54931640625, -1.22265625, -0.89599609375, -0.5693359375, -0.24267578125, 0.083984375, 0.41064453125, 0.7373046875, 1.06396484375, 1.390625, 1.71728515625, 2.0439453125, 2.37060546875, 2.697265625, 3.02392578125, 3.3505859375, 3.67724609375, 4.00390625, 4.33056640625, 4.6572265625, 4.98388671875, 5.310546875, 5.63720703125, 5.9638671875, 6.29052734375, 6.6171875, 6.94384765625, 7.2705078125, 7.59716796875, 7.923828125, 8.25048828125, 8.5771484375, 8.90380859375, 9.23046875, 9.55712890625, 9.8837890625, 10.21044921875, 10.537109375, 10.86376953125, 11.1904296875, 11.51708984375, 11.84375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 11.0, 12.0, 16.0, 36.0, 45.0, 67.0, 69.0, 85.0, 101.0, 114.0, 95.0, 91.0, 74.0, 57.0, 48.0, 27.0, 15.0, 16.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.2063446044921875, -1.166595458984375, -1.1268463134765625, -1.08709716796875, -1.0473480224609375, -1.007598876953125, -0.9678497314453125, -0.9281005859375, -0.8883514404296875, -0.848602294921875, -0.8088531494140625, -0.76910400390625, -0.7293548583984375, -0.689605712890625, -0.6498565673828125, -0.610107421875, -0.5703582763671875, -0.530609130859375, -0.4908599853515625, -0.45111083984375, -0.4113616943359375, -0.371612548828125, -0.3318634033203125, -0.2921142578125, -0.2523651123046875, -0.212615966796875, -0.1728668212890625, -0.13311767578125, -0.0933685302734375, -0.053619384765625, -0.0138702392578125, 0.02587890625, 0.0656280517578125, 0.105377197265625, 0.1451263427734375, 0.18487548828125, 0.2246246337890625, 0.264373779296875, 0.3041229248046875, 0.3438720703125, 0.3836212158203125, 0.423370361328125, 0.4631195068359375, 0.50286865234375, 0.5426177978515625, 0.582366943359375, 0.6221160888671875, 0.661865234375, 0.7016143798828125, 0.741363525390625, 0.7811126708984375, 0.82086181640625, 0.8606109619140625, 0.900360107421875, 0.9401092529296875, 0.9798583984375, 1.0196075439453125, 1.059356689453125, 1.0991058349609375, 1.13885498046875, 1.1786041259765625, 1.218353271484375, 1.2581024169921875, 1.2978515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 8.0, 11.0, 29.0, 43.0, 83.0, 104.0, 164.0, 272.0, 429.0, 768.0, 1307.0, 2433.0, 5325.0, 12096.0, 31155.0, 106755.0, 858664.0, 2940553.0, 161164.0, 42999.0, 15817.0, 6814.0, 3344.0, 1757.0, 933.0, 496.0, 281.0, 195.0, 98.0, 58.0, 37.0, 23.0, 25.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.29296875, -5.150421142578125, -5.00787353515625, -4.865325927734375, -4.7227783203125, -4.580230712890625, -4.43768310546875, -4.295135498046875, -4.152587890625, -4.010040283203125, -3.86749267578125, -3.724945068359375, -3.5823974609375, -3.439849853515625, -3.29730224609375, -3.154754638671875, -3.01220703125, -2.869659423828125, -2.72711181640625, -2.584564208984375, -2.4420166015625, -2.299468994140625, -2.15692138671875, -2.014373779296875, -1.871826171875, -1.729278564453125, -1.58673095703125, -1.444183349609375, -1.3016357421875, -1.159088134765625, -1.01654052734375, -0.873992919921875, -0.7314453125, -0.588897705078125, -0.44635009765625, -0.303802490234375, -0.1612548828125, -0.018707275390625, 0.12384033203125, 0.266387939453125, 0.408935546875, 0.551483154296875, 0.69403076171875, 0.836578369140625, 0.9791259765625, 1.121673583984375, 1.26422119140625, 1.406768798828125, 1.54931640625, 1.691864013671875, 1.83441162109375, 1.976959228515625, 2.1195068359375, 2.262054443359375, 2.40460205078125, 2.547149658203125, 2.689697265625, 2.832244873046875, 2.97479248046875, 3.117340087890625, 3.2598876953125, 3.402435302734375, 3.54498291015625, 3.687530517578125, 3.830078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 12.0, 12.0, 18.0, 29.0, 24.0, 50.0, 51.0, 90.0, 149.0, 234.0, 600.0, 1646.0, 481.0, 199.0, 146.0, 76.0, 60.0, 38.0, 31.0, 26.0, 16.0, 9.0, 22.0, 10.0, 0.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.3683929443359375, -1.328582763671875, -1.2887725830078125, -1.24896240234375, -1.2091522216796875, -1.169342041015625, -1.1295318603515625, -1.0897216796875, -1.0499114990234375, -1.010101318359375, -0.9702911376953125, -0.93048095703125, -0.8906707763671875, -0.850860595703125, -0.8110504150390625, -0.771240234375, -0.7314300537109375, -0.691619873046875, -0.6518096923828125, -0.61199951171875, -0.5721893310546875, -0.532379150390625, -0.4925689697265625, -0.4527587890625, -0.4129486083984375, -0.373138427734375, -0.3333282470703125, -0.29351806640625, -0.2537078857421875, -0.213897705078125, -0.1740875244140625, -0.13427734375, -0.0944671630859375, -0.054656982421875, -0.0148468017578125, 0.02496337890625, 0.0647735595703125, 0.104583740234375, 0.1443939208984375, 0.1842041015625, 0.2240142822265625, 0.263824462890625, 0.3036346435546875, 0.34344482421875, 0.3832550048828125, 0.423065185546875, 0.4628753662109375, 0.502685546875, 0.5424957275390625, 0.582305908203125, 0.6221160888671875, 0.66192626953125, 0.7017364501953125, 0.741546630859375, 0.7813568115234375, 0.8211669921875, 0.8609771728515625, 0.900787353515625, 0.9405975341796875, 0.98040771484375, 1.0202178955078125, 1.060028076171875, 1.0998382568359375, 1.1396484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 23.0, 39.0, 103.0, 199.0, 244.0, 201.0, 122.0, 43.0, 14.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.255008697509766, -8.690715789794922, -8.126422882080078, -7.562129974365234, -6.997837066650391, -6.433544158935547, -5.869251251220703, -5.304958343505859, -4.740665435791016, -4.176372528076172, -3.612079620361328, -3.0477867126464844, -2.4834938049316406, -1.9192008972167969, -1.3549079895019531, -0.7906150817871094, -0.22632217407226562, 0.3379707336425781, 0.9022636413574219, 1.4665565490722656, 2.0308494567871094, 2.595142364501953, 3.159435272216797, 3.7237281799316406, 4.288021087646484, 4.852313995361328, 5.416606903076172, 5.980899810791016, 6.545192718505859, 7.109485626220703, 7.673778533935547, 8.23807144165039, 8.802366256713867, 9.366659164428711, 9.930952072143555, 10.495244979858398, 11.059537887573242, 11.623830795288086, 12.18812370300293, 12.752416610717773, 13.316709518432617, 13.881002426147461, 14.445295333862305, 15.009588241577148, 15.573881149291992, 16.138174057006836, 16.70246696472168, 17.266759872436523, 17.831052780151367, 18.39534568786621, 18.959638595581055, 19.5239315032959, 20.088224411010742, 20.652517318725586, 21.21681022644043, 21.781103134155273, 22.345396041870117, 22.90968894958496, 23.473981857299805, 24.03827476501465, 24.602567672729492, 25.166860580444336, 25.73115348815918, 26.295446395874023, 26.859739303588867]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 8.0, 7.0, 13.0, 5.0, 13.0, 16.0, 19.0, 19.0, 16.0, 12.0, 25.0, 40.0, 30.0, 34.0, 48.0, 34.0, 49.0, 39.0, 49.0, 55.0, 48.0, 54.0, 43.0, 44.0, 34.0, 33.0, 27.0, 23.0, 31.0, 15.0, 20.0, 19.0, 11.0, 15.0, 9.0, 11.0, 8.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.036235809326172, -4.883856296539307, -4.7314772605896, -4.579097747802734, -4.426718711853027, -4.274339199066162, -4.121959686279297, -3.9695804119110107, -3.8172011375427246, -3.6648218631744385, -3.5124425888061523, -3.360063076019287, -3.207683801651001, -3.055304527282715, -2.9029250144958496, -2.7505457401275635, -2.5981664657592773, -2.445787191390991, -2.293407917022705, -2.14102840423584, -1.9886491298675537, -1.8362698554992676, -1.683890461921692, -1.5315110683441162, -1.37913179397583, -1.226752519607544, -1.0743731260299683, -0.9219937920570374, -0.7696144580841064, -0.6172351241111755, -0.46485579013824463, -0.31247639656066895, -0.1600966453552246, -0.007717311382293701, 0.1446620225906372, 0.2970413565635681, 0.449420690536499, 0.6018000245094299, 0.7541793584823608, 0.9065587520599365, 1.0589380264282227, 1.2113173007965088, 1.3636966943740845, 1.5160760879516602, 1.6684553623199463, 1.8208346366882324, 1.973214030265808, 2.125593423843384, 2.27797269821167, 2.430351972579956, 2.582731246948242, 2.7351107597351074, 2.8874900341033936, 3.0398693084716797, 3.192248821258545, 3.344628095626831, 3.497007369995117, 3.6493866443634033, 3.8017659187316895, 3.9541454315185547, 4.106524467468262, 4.258903980255127, 4.411283493041992, 4.563662528991699, 4.7160420417785645]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 12.0, 20.0, 21.0, 35.0, 56.0, 67.0, 138.0, 224.0, 403.0, 637.0, 1264.0, 2524.0, 5935.0, 16749.0, 58984.0, 249263.0, 507625.0, 147737.0, 36771.0, 11397.0, 4421.0, 1929.0, 949.0, 570.0, 303.0, 177.0, 116.0, 73.0, 44.0, 39.0, 17.0, 9.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.71539306640625, -4.5362548828125, -4.35711669921875, -4.177978515625, -3.99884033203125, -3.8197021484375, -3.64056396484375, -3.46142578125, -3.28228759765625, -3.1031494140625, -2.92401123046875, -2.744873046875, -2.56573486328125, -2.3865966796875, -2.20745849609375, -2.0283203125, -1.84918212890625, -1.6700439453125, -1.49090576171875, -1.311767578125, -1.13262939453125, -0.9534912109375, -0.77435302734375, -0.59521484375, -0.41607666015625, -0.2369384765625, -0.05780029296875, 0.121337890625, 0.30047607421875, 0.4796142578125, 0.65875244140625, 0.837890625, 1.01702880859375, 1.1961669921875, 1.37530517578125, 1.554443359375, 1.73358154296875, 1.9127197265625, 2.09185791015625, 2.27099609375, 2.45013427734375, 2.6292724609375, 2.80841064453125, 2.987548828125, 3.16668701171875, 3.3458251953125, 3.52496337890625, 3.7041015625, 3.88323974609375, 4.0623779296875, 4.24151611328125, 4.420654296875, 4.59979248046875, 4.7789306640625, 4.95806884765625, 5.13720703125, 5.31634521484375, 5.4954833984375, 5.67462158203125, 5.853759765625, 6.03289794921875, 6.2120361328125, 6.39117431640625, 6.5703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 9.0, 14.0, 21.0, 26.0, 60.0, 52.0, 63.0, 68.0, 95.0, 99.0, 99.0, 88.0, 77.0, 61.0, 51.0, 32.0, 25.0, 21.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.0929718017578125, -1.056060791015625, -1.0191497802734375, -0.98223876953125, -0.9453277587890625, -0.908416748046875, -0.8715057373046875, -0.8345947265625, -0.7976837158203125, -0.760772705078125, -0.7238616943359375, -0.68695068359375, -0.6500396728515625, -0.613128662109375, -0.5762176513671875, -0.539306640625, -0.5023956298828125, -0.465484619140625, -0.4285736083984375, -0.39166259765625, -0.3547515869140625, -0.317840576171875, -0.2809295654296875, -0.2440185546875, -0.2071075439453125, -0.170196533203125, -0.1332855224609375, -0.09637451171875, -0.0594635009765625, -0.022552490234375, 0.0143585205078125, 0.05126953125, 0.0881805419921875, 0.125091552734375, 0.1620025634765625, 0.19891357421875, 0.2358245849609375, 0.272735595703125, 0.3096466064453125, 0.3465576171875, 0.3834686279296875, 0.420379638671875, 0.4572906494140625, 0.49420166015625, 0.5311126708984375, 0.568023681640625, 0.6049346923828125, 0.641845703125, 0.6787567138671875, 0.715667724609375, 0.7525787353515625, 0.78948974609375, 0.8264007568359375, 0.863311767578125, 0.9002227783203125, 0.9371337890625, 0.9740447998046875, 1.010955810546875, 1.0478668212890625, 1.08477783203125, 1.1216888427734375, 1.158599853515625, 1.1955108642578125, 1.232421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 7.0, 6.0, 14.0, 12.0, 16.0, 13.0, 32.0, 33.0, 51.0, 77.0, 127.0, 221.0, 357.0, 604.0, 1232.0, 3127.0, 10091.0, 45702.0, 255098.0, 563580.0, 132593.0, 24930.0, 6258.0, 2169.0, 953.0, 485.0, 281.0, 167.0, 92.0, 60.0, 48.0, 25.0, 16.0, 20.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.30078125, -6.11163330078125, -5.9224853515625, -5.73333740234375, -5.544189453125, -5.35504150390625, -5.1658935546875, -4.97674560546875, -4.78759765625, -4.59844970703125, -4.4093017578125, -4.22015380859375, -4.031005859375, -3.84185791015625, -3.6527099609375, -3.46356201171875, -3.2744140625, -3.08526611328125, -2.8961181640625, -2.70697021484375, -2.517822265625, -2.32867431640625, -2.1395263671875, -1.95037841796875, -1.76123046875, -1.57208251953125, -1.3829345703125, -1.19378662109375, -1.004638671875, -0.81549072265625, -0.6263427734375, -0.43719482421875, -0.248046875, -0.05889892578125, 0.1302490234375, 0.31939697265625, 0.508544921875, 0.69769287109375, 0.8868408203125, 1.07598876953125, 1.26513671875, 1.45428466796875, 1.6434326171875, 1.83258056640625, 2.021728515625, 2.21087646484375, 2.4000244140625, 2.58917236328125, 2.7783203125, 2.96746826171875, 3.1566162109375, 3.34576416015625, 3.534912109375, 3.72406005859375, 3.9132080078125, 4.10235595703125, 4.29150390625, 4.48065185546875, 4.6697998046875, 4.85894775390625, 5.048095703125, 5.23724365234375, 5.4263916015625, 5.61553955078125, 5.8046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 2.0, 9.0, 7.0, 13.0, 4.0, 15.0, 13.0, 16.0, 17.0, 33.0, 27.0, 33.0, 23.0, 38.0, 29.0, 32.0, 34.0, 34.0, 35.0, 33.0, 43.0, 41.0, 44.0, 26.0, 39.0, 39.0, 29.0, 34.0, 26.0, 35.0, 34.0, 27.0, 20.0, 26.0, 10.0, 9.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.947265625, -2.85589599609375, -2.7645263671875, -2.67315673828125, -2.581787109375, -2.49041748046875, -2.3990478515625, -2.30767822265625, -2.21630859375, -2.12493896484375, -2.0335693359375, -1.94219970703125, -1.850830078125, -1.75946044921875, -1.6680908203125, -1.57672119140625, -1.4853515625, -1.39398193359375, -1.3026123046875, -1.21124267578125, -1.119873046875, -1.02850341796875, -0.9371337890625, -0.84576416015625, -0.75439453125, -0.66302490234375, -0.5716552734375, -0.48028564453125, -0.388916015625, -0.29754638671875, -0.2061767578125, -0.11480712890625, -0.0234375, 0.06793212890625, 0.1593017578125, 0.25067138671875, 0.342041015625, 0.43341064453125, 0.5247802734375, 0.61614990234375, 0.70751953125, 0.79888916015625, 0.8902587890625, 0.98162841796875, 1.072998046875, 1.16436767578125, 1.2557373046875, 1.34710693359375, 1.4384765625, 1.52984619140625, 1.6212158203125, 1.71258544921875, 1.803955078125, 1.89532470703125, 1.9866943359375, 2.07806396484375, 2.16943359375, 2.26080322265625, 2.3521728515625, 2.44354248046875, 2.534912109375, 2.62628173828125, 2.7176513671875, 2.80902099609375, 2.900390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 12.0, 38.0, 57.0, 106.0, 251.0, 595.0, 1508.0, 4319.0, 20946.0, 250414.0, 706343.0, 51986.0, 7984.0, 2411.0, 861.0, 371.0, 152.0, 71.0, 39.0, 23.0, 15.0, 12.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.647216796875, -5.46630859375, -5.285400390625, -5.1044921875, -4.923583984375, -4.74267578125, -4.561767578125, -4.380859375, -4.199951171875, -4.01904296875, -3.838134765625, -3.6572265625, -3.476318359375, -3.29541015625, -3.114501953125, -2.93359375, -2.752685546875, -2.57177734375, -2.390869140625, -2.2099609375, -2.029052734375, -1.84814453125, -1.667236328125, -1.486328125, -1.305419921875, -1.12451171875, -0.943603515625, -0.7626953125, -0.581787109375, -0.40087890625, -0.219970703125, -0.0390625, 0.141845703125, 0.32275390625, 0.503662109375, 0.6845703125, 0.865478515625, 1.04638671875, 1.227294921875, 1.408203125, 1.589111328125, 1.77001953125, 1.950927734375, 2.1318359375, 2.312744140625, 2.49365234375, 2.674560546875, 2.85546875, 3.036376953125, 3.21728515625, 3.398193359375, 3.5791015625, 3.760009765625, 3.94091796875, 4.121826171875, 4.302734375, 4.483642578125, 4.66455078125, 4.845458984375, 5.0263671875, 5.207275390625, 5.38818359375, 5.569091796875, 5.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 5.0, 14.0, 10.0, 23.0, 37.0, 50.0, 87.0, 138.0, 214.0, 157.0, 86.0, 50.0, 35.0, 33.0, 16.0, 13.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010004043579101562, -0.0009697899222373962, -0.0009391754865646362, -0.0009085610508918762, -0.0008779466152191162, -0.0008473321795463562, -0.0008167177438735962, -0.0007861033082008362, -0.0007554888725280762, -0.0007248744368553162, -0.0006942600011825562, -0.0006636455655097961, -0.0006330311298370361, -0.0006024166941642761, -0.0005718022584915161, -0.0005411878228187561, -0.0005105733871459961, -0.0004799589514732361, -0.0004493445158004761, -0.00041873008012771606, -0.00038811564445495605, -0.00035750120878219604, -0.00032688677310943604, -0.000296272337436676, -0.000265657901763916, -0.000235043466091156, -0.000204429030418396, -0.00017381459474563599, -0.00014320015907287598, -0.00011258572340011597, -8.197128772735596e-05, -5.135685205459595e-05, -2.0742416381835938e-05, 9.872019290924072e-06, 4.048645496368408e-05, 7.110089063644409e-05, 0.0001017153263092041, 0.0001323297619819641, 0.00016294419765472412, 0.00019355863332748413, 0.00022417306900024414, 0.00025478750467300415, 0.00028540194034576416, 0.00031601637601852417, 0.0003466308116912842, 0.0003772452473640442, 0.0004078596830368042, 0.0004384741187095642, 0.0004690885543823242, 0.0004997029900550842, 0.0005303174257278442, 0.0005609318614006042, 0.0005915462970733643, 0.0006221607327461243, 0.0006527751684188843, 0.0006833896040916443, 0.0007140040397644043, 0.0007446184754371643, 0.0007752329111099243, 0.0008058473467826843, 0.0008364617824554443, 0.0008670762181282043, 0.0008976906538009644, 0.0009283050894737244, 0.0009589195251464844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 21.0, 30.0, 46.0, 95.0, 165.0, 430.0, 943.0, 2772.0, 12141.0, 201717.0, 793554.0, 29205.0, 4933.0, 1426.0, 515.0, 259.0, 131.0, 72.0, 19.0, 13.0, 19.0, 4.0, 7.0, 12.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.95574951171875, -7.7161865234375, -7.47662353515625, -7.237060546875, -6.99749755859375, -6.7579345703125, -6.51837158203125, -6.27880859375, -6.03924560546875, -5.7996826171875, -5.56011962890625, -5.320556640625, -5.08099365234375, -4.8414306640625, -4.60186767578125, -4.3623046875, -4.12274169921875, -3.8831787109375, -3.64361572265625, -3.404052734375, -3.16448974609375, -2.9249267578125, -2.68536376953125, -2.44580078125, -2.20623779296875, -1.9666748046875, -1.72711181640625, -1.487548828125, -1.24798583984375, -1.0084228515625, -0.76885986328125, -0.529296875, -0.28973388671875, -0.0501708984375, 0.18939208984375, 0.428955078125, 0.66851806640625, 0.9080810546875, 1.14764404296875, 1.38720703125, 1.62677001953125, 1.8663330078125, 2.10589599609375, 2.345458984375, 2.58502197265625, 2.8245849609375, 3.06414794921875, 3.3037109375, 3.54327392578125, 3.7828369140625, 4.02239990234375, 4.261962890625, 4.50152587890625, 4.7410888671875, 4.98065185546875, 5.22021484375, 5.45977783203125, 5.6993408203125, 5.93890380859375, 6.178466796875, 6.41802978515625, 6.6575927734375, 6.89715576171875, 7.13671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 4.0, 10.0, 8.0, 11.0, 24.0, 30.0, 61.0, 112.0, 140.0, 170.0, 145.0, 108.0, 48.0, 29.0, 19.0, 21.0, 13.0, 9.0, 8.0, 3.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4765625, -3.36602783203125, -3.2554931640625, -3.14495849609375, -3.034423828125, -2.92388916015625, -2.8133544921875, -2.70281982421875, -2.59228515625, -2.48175048828125, -2.3712158203125, -2.26068115234375, -2.150146484375, -2.03961181640625, -1.9290771484375, -1.81854248046875, -1.7080078125, -1.59747314453125, -1.4869384765625, -1.37640380859375, -1.265869140625, -1.15533447265625, -1.0447998046875, -0.93426513671875, -0.82373046875, -0.71319580078125, -0.6026611328125, -0.49212646484375, -0.381591796875, -0.27105712890625, -0.1605224609375, -0.04998779296875, 0.060546875, 0.17108154296875, 0.2816162109375, 0.39215087890625, 0.502685546875, 0.61322021484375, 0.7237548828125, 0.83428955078125, 0.94482421875, 1.05535888671875, 1.1658935546875, 1.27642822265625, 1.386962890625, 1.49749755859375, 1.6080322265625, 1.71856689453125, 1.8291015625, 1.93963623046875, 2.0501708984375, 2.16070556640625, 2.271240234375, 2.38177490234375, 2.4923095703125, 2.60284423828125, 2.71337890625, 2.82391357421875, 2.9344482421875, 3.04498291015625, 3.155517578125, 3.26605224609375, 3.3765869140625, 3.48712158203125, 3.59765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 22.0, 32.0, 56.0, 79.0, 121.0, 123.0, 134.0, 132.0, 101.0, 69.0, 30.0, 24.0, 20.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.876922607421875, -17.836334228515625, -16.795745849609375, -15.755155563354492, -14.714567184448242, -13.673978805541992, -12.633389472961426, -11.59280014038086, -10.55221176147461, -9.51162338256836, -8.471034049987793, -7.430445194244385, -6.389856338500977, -5.349267482757568, -4.30867862701416, -3.268089771270752, -2.2275009155273438, -1.1869120597839355, -0.14632320404052734, 0.8942656517028809, 1.934854507446289, 2.9754433631896973, 4.0160322189331055, 5.056621074676514, 6.097209930419922, 7.13779878616333, 8.178387641906738, 9.218976974487305, 10.259565353393555, 11.300153732299805, 12.340743064880371, 13.381332397460938, 14.421920776367188, 15.462509155273438, 16.503097534179688, 17.54368782043457, 18.58427619934082, 19.62486457824707, 20.665454864501953, 21.706043243408203, 22.746631622314453, 23.787220001220703, 24.827808380126953, 25.868398666381836, 26.908987045288086, 27.949575424194336, 28.99016571044922, 30.03075408935547, 31.07134246826172, 32.11193084716797, 33.15251922607422, 34.19310760498047, 35.23369598388672, 36.274288177490234, 37.314876556396484, 38.355464935302734, 39.396053314208984, 40.436641693115234, 41.477230072021484, 42.517818450927734, 43.55841064453125, 44.5989990234375, 45.63958740234375, 46.68017578125, 47.72076416015625]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 8.0, 3.0, 7.0, 8.0, 12.0, 9.0, 16.0, 11.0, 16.0, 14.0, 21.0, 21.0, 33.0, 35.0, 37.0, 41.0, 44.0, 34.0, 51.0, 51.0, 52.0, 50.0, 53.0, 54.0, 37.0, 37.0, 41.0, 34.0, 31.0, 24.0, 24.0, 22.0, 11.0, 15.0, 7.0, 6.0, 6.0, 5.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.13074493408203, -19.472129821777344, -18.813514709472656, -18.1549015045166, -17.496286392211914, -16.837671279907227, -16.179058074951172, -15.520442962646484, -14.861827850341797, -14.20321273803711, -13.544598579406738, -12.885984420776367, -12.22736930847168, -11.568754196166992, -10.910140037536621, -10.25152587890625, -9.592910766601562, -8.934295654296875, -8.275681495666504, -7.617066860198975, -6.958452224731445, -6.299837589263916, -5.641222953796387, -4.982608318328857, -4.323993682861328, -3.665379047393799, -3.0067644119262695, -2.3481497764587402, -1.689535140991211, -1.0309205055236816, -0.37230587005615234, 0.28630876541137695, 0.9449214935302734, 1.6035361289978027, 2.262150764465332, 2.9207653999328613, 3.5793800354003906, 4.23799467086792, 4.896609306335449, 5.5552239418029785, 6.213838577270508, 6.872453212738037, 7.531067848205566, 8.189682006835938, 8.848297119140625, 9.506912231445312, 10.165526390075684, 10.824140548706055, 11.482755661010742, 12.14137077331543, 12.7999849319458, 13.458599090576172, 14.11721420288086, 14.775829315185547, 15.434443473815918, 16.09305763244629, 16.751672744750977, 17.410287857055664, 18.06890106201172, 18.727516174316406, 19.386131286621094, 20.04474639892578, 20.70336151123047, 21.361974716186523, 22.02058982849121]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 15.0, 14.0, 32.0, 56.0, 89.0, 171.0, 323.0, 782.0, 2145.0, 7431.0, 37323.0, 728180.0, 3346537.0, 56766.0, 9883.0, 2724.0, 974.0, 398.0, 179.0, 93.0, 57.0, 29.0, 30.0, 13.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.25238037109375, -4.9774169921875, -4.70245361328125, -4.427490234375, -4.15252685546875, -3.8775634765625, -3.60260009765625, -3.32763671875, -3.05267333984375, -2.7777099609375, -2.50274658203125, -2.227783203125, -1.95281982421875, -1.6778564453125, -1.40289306640625, -1.1279296875, -0.85296630859375, -0.5780029296875, -0.30303955078125, -0.028076171875, 0.24688720703125, 0.5218505859375, 0.79681396484375, 1.07177734375, 1.34674072265625, 1.6217041015625, 1.89666748046875, 2.171630859375, 2.44659423828125, 2.7215576171875, 2.99652099609375, 3.271484375, 3.54644775390625, 3.8214111328125, 4.09637451171875, 4.371337890625, 4.64630126953125, 4.9212646484375, 5.19622802734375, 5.47119140625, 5.74615478515625, 6.0211181640625, 6.29608154296875, 6.571044921875, 6.84600830078125, 7.1209716796875, 7.39593505859375, 7.6708984375, 7.94586181640625, 8.2208251953125, 8.49578857421875, 8.770751953125, 9.04571533203125, 9.3206787109375, 9.59564208984375, 9.87060546875, 10.14556884765625, 10.4205322265625, 10.69549560546875, 10.970458984375, 11.24542236328125, 11.5203857421875, 11.79534912109375, 12.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 16.0, 20.0, 27.0, 45.0, 54.0, 55.0, 76.0, 69.0, 88.0, 86.0, 98.0, 74.0, 70.0, 53.0, 44.0, 30.0, 30.0, 17.0, 7.0, 3.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1135101318359375, -1.076629638671875, -1.0397491455078125, -1.00286865234375, -0.9659881591796875, -0.929107666015625, -0.8922271728515625, -0.8553466796875, -0.8184661865234375, -0.781585693359375, -0.7447052001953125, -0.70782470703125, -0.6709442138671875, -0.634063720703125, -0.5971832275390625, -0.560302734375, -0.5234222412109375, -0.486541748046875, -0.4496612548828125, -0.41278076171875, -0.3759002685546875, -0.339019775390625, -0.3021392822265625, -0.2652587890625, -0.2283782958984375, -0.191497802734375, -0.1546173095703125, -0.11773681640625, -0.0808563232421875, -0.043975830078125, -0.0070953369140625, 0.02978515625, 0.0666656494140625, 0.103546142578125, 0.1404266357421875, 0.17730712890625, 0.2141876220703125, 0.251068115234375, 0.2879486083984375, 0.3248291015625, 0.3617095947265625, 0.398590087890625, 0.4354705810546875, 0.47235107421875, 0.5092315673828125, 0.546112060546875, 0.5829925537109375, 0.619873046875, 0.6567535400390625, 0.693634033203125, 0.7305145263671875, 0.76739501953125, 0.8042755126953125, 0.841156005859375, 0.8780364990234375, 0.9149169921875, 0.9517974853515625, 0.988677978515625, 1.0255584716796875, 1.06243896484375, 1.0993194580078125, 1.136199951171875, 1.1730804443359375, 1.2099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 17.0, 15.0, 18.0, 34.0, 31.0, 38.0, 71.0, 113.0, 162.0, 246.0, 410.0, 702.0, 1271.0, 2203.0, 4345.0, 9463.0, 22310.0, 63793.0, 228615.0, 2433427.0, 1171587.0, 169443.0, 50498.0, 18662.0, 8103.0, 3994.0, 1928.0, 1060.0, 611.0, 397.0, 224.0, 146.0, 90.0, 72.0, 49.0, 26.0, 27.0, 12.0, 9.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.92578125, -3.809967041015625, -3.69415283203125, -3.578338623046875, -3.4625244140625, -3.346710205078125, -3.23089599609375, -3.115081787109375, -2.999267578125, -2.883453369140625, -2.76763916015625, -2.651824951171875, -2.5360107421875, -2.420196533203125, -2.30438232421875, -2.188568115234375, -2.07275390625, -1.956939697265625, -1.84112548828125, -1.725311279296875, -1.6094970703125, -1.493682861328125, -1.37786865234375, -1.262054443359375, -1.146240234375, -1.030426025390625, -0.91461181640625, -0.798797607421875, -0.6829833984375, -0.567169189453125, -0.45135498046875, -0.335540771484375, -0.2197265625, -0.103912353515625, 0.01190185546875, 0.127716064453125, 0.2435302734375, 0.359344482421875, 0.47515869140625, 0.590972900390625, 0.706787109375, 0.822601318359375, 0.93841552734375, 1.054229736328125, 1.1700439453125, 1.285858154296875, 1.40167236328125, 1.517486572265625, 1.63330078125, 1.749114990234375, 1.86492919921875, 1.980743408203125, 2.0965576171875, 2.212371826171875, 2.32818603515625, 2.444000244140625, 2.559814453125, 2.675628662109375, 2.79144287109375, 2.907257080078125, 3.0230712890625, 3.138885498046875, 3.25469970703125, 3.370513916015625, 3.486328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 21.0, 18.0, 21.0, 36.0, 48.0, 58.0, 71.0, 112.0, 198.0, 298.0, 687.0, 1234.0, 471.0, 231.0, 166.0, 91.0, 72.0, 59.0, 39.0, 29.0, 18.0, 22.0, 10.0, 6.0, 10.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.625244140625, -1.56982421875, -1.514404296875, -1.458984375, -1.403564453125, -1.34814453125, -1.292724609375, -1.2373046875, -1.181884765625, -1.12646484375, -1.071044921875, -1.015625, -0.960205078125, -0.90478515625, -0.849365234375, -0.7939453125, -0.738525390625, -0.68310546875, -0.627685546875, -0.572265625, -0.516845703125, -0.46142578125, -0.406005859375, -0.3505859375, -0.295166015625, -0.23974609375, -0.184326171875, -0.12890625, -0.073486328125, -0.01806640625, 0.037353515625, 0.0927734375, 0.148193359375, 0.20361328125, 0.259033203125, 0.314453125, 0.369873046875, 0.42529296875, 0.480712890625, 0.5361328125, 0.591552734375, 0.64697265625, 0.702392578125, 0.7578125, 0.813232421875, 0.86865234375, 0.924072265625, 0.9794921875, 1.034912109375, 1.09033203125, 1.145751953125, 1.201171875, 1.256591796875, 1.31201171875, 1.367431640625, 1.4228515625, 1.478271484375, 1.53369140625, 1.589111328125, 1.64453125, 1.699951171875, 1.75537109375, 1.810791015625, 1.8662109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 13.0, 10.0, 17.0, 12.0, 27.0, 45.0, 70.0, 63.0, 72.0, 97.0, 91.0, 87.0, 73.0, 72.0, 65.0, 61.0, 31.0, 23.0, 19.0, 11.0, 1.0, 7.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.557207107543945, -12.254907608032227, -11.952608108520508, -11.650307655334473, -11.348008155822754, -11.045708656311035, -10.743408203125, -10.441108703613281, -10.138809204101562, -9.836509704589844, -9.534210205078125, -9.23190975189209, -8.929610252380371, -8.627310752868652, -8.325010299682617, -8.022710800170898, -7.72041130065918, -7.418111801147461, -7.115811824798584, -6.813511848449707, -6.511212348937988, -6.2089128494262695, -5.906612873077393, -5.604312896728516, -5.302013397216797, -4.999713897705078, -4.697413921356201, -4.395113945007324, -4.0928144454956055, -3.7905147075653076, -3.4882149696350098, -3.185915231704712, -2.8836164474487305, -2.5813167095184326, -2.2790169715881348, -1.976717233657837, -1.674417495727539, -1.3721177577972412, -1.0698180198669434, -0.7675182819366455, -0.46521854400634766, -0.1629188060760498, 0.13938093185424805, 0.4416806697845459, 0.7439804077148438, 1.0462801456451416, 1.3485798835754395, 1.6508796215057373, 1.9531793594360352, 2.255479097366333, 2.557778835296631, 2.8600785732269287, 3.1623783111572266, 3.4646780490875244, 3.7669777870178223, 4.069277763366699, 4.371577262878418, 4.673876762390137, 4.976176738739014, 5.278476715087891, 5.580776214599609, 5.883075714111328, 6.185375690460205, 6.487675666809082, 6.789975166320801]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 13.0, 10.0, 13.0, 19.0, 20.0, 23.0, 24.0, 21.0, 39.0, 28.0, 36.0, 38.0, 42.0, 43.0, 42.0, 52.0, 35.0, 20.0, 40.0, 31.0, 37.0, 34.0, 43.0, 39.0, 22.0, 27.0, 21.0, 26.0, 26.0, 23.0, 13.0, 14.0, 8.0, 10.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.001309394836426, -5.808198928833008, -5.61508846282959, -5.421977996826172, -5.228867530822754, -5.035757064819336, -4.842646598815918, -4.649536609649658, -4.45642614364624, -4.263315677642822, -4.070205211639404, -3.8770947456359863, -3.6839845180511475, -3.4908740520477295, -3.2977635860443115, -3.1046533584594727, -2.9115426540374756, -2.7184321880340576, -2.5253217220306396, -2.332211494445801, -2.139101028442383, -1.9459905624389648, -1.7528800964355469, -1.5597697496414185, -1.3666592836380005, -1.1735488176345825, -0.9804384708404541, -0.7873280048370361, -0.5942175984382629, -0.40110719203948975, -0.20799672603607178, -0.01488637924194336, 0.1782240867614746, 0.3713344931602478, 0.564444899559021, 0.757555365562439, 0.9506657719612122, 1.1437761783599854, 1.3368866443634033, 1.5299969911575317, 1.7231074571609497, 1.9162179231643677, 2.109328269958496, 2.302438735961914, 2.495549201965332, 2.68865966796875, 2.881770133972168, 3.074880361557007, 3.267990827560425, 3.4611012935638428, 3.6542117595672607, 3.8473219871520996, 4.040432453155518, 4.2335429191589355, 4.4266533851623535, 4.6197638511657715, 4.8128743171691895, 5.005984783172607, 5.199095249176025, 5.392205715179443, 5.585316181182861, 5.778426170349121, 5.971536636352539, 6.164647102355957, 6.357757568359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 18.0, 23.0, 37.0, 61.0, 66.0, 116.0, 205.0, 350.0, 529.0, 931.0, 1829.0, 3563.0, 7608.0, 17744.0, 46329.0, 143289.0, 461900.0, 245233.0, 72031.0, 26134.0, 10571.0, 4680.0, 2273.0, 1190.0, 691.0, 418.0, 230.0, 149.0, 108.0, 62.0, 41.0, 33.0, 18.0, 14.0, 9.0, 15.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.6484375, -5.498626708984375, -5.34881591796875, -5.199005126953125, -5.0491943359375, -4.899383544921875, -4.74957275390625, -4.599761962890625, -4.449951171875, -4.300140380859375, -4.15032958984375, -4.000518798828125, -3.8507080078125, -3.700897216796875, -3.55108642578125, -3.401275634765625, -3.25146484375, -3.101654052734375, -2.95184326171875, -2.802032470703125, -2.6522216796875, -2.502410888671875, -2.35260009765625, -2.202789306640625, -2.052978515625, -1.903167724609375, -1.75335693359375, -1.603546142578125, -1.4537353515625, -1.303924560546875, -1.15411376953125, -1.004302978515625, -0.8544921875, -0.704681396484375, -0.55487060546875, -0.405059814453125, -0.2552490234375, -0.105438232421875, 0.04437255859375, 0.194183349609375, 0.343994140625, 0.493804931640625, 0.64361572265625, 0.793426513671875, 0.9432373046875, 1.093048095703125, 1.24285888671875, 1.392669677734375, 1.54248046875, 1.692291259765625, 1.84210205078125, 1.991912841796875, 2.1417236328125, 2.291534423828125, 2.44134521484375, 2.591156005859375, 2.740966796875, 2.890777587890625, 3.04058837890625, 3.190399169921875, 3.3402099609375, 3.490020751953125, 3.63983154296875, 3.789642333984375, 3.939453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 13.0, 13.0, 21.0, 29.0, 39.0, 45.0, 44.0, 64.0, 74.0, 77.0, 92.0, 83.0, 70.0, 80.0, 65.0, 49.0, 43.0, 25.0, 24.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.09783935546875, -1.0609130859375, -1.02398681640625, -0.987060546875, -0.95013427734375, -0.9132080078125, -0.87628173828125, -0.83935546875, -0.80242919921875, -0.7655029296875, -0.72857666015625, -0.691650390625, -0.65472412109375, -0.6177978515625, -0.58087158203125, -0.5439453125, -0.50701904296875, -0.4700927734375, -0.43316650390625, -0.396240234375, -0.35931396484375, -0.3223876953125, -0.28546142578125, -0.24853515625, -0.21160888671875, -0.1746826171875, -0.13775634765625, -0.100830078125, -0.06390380859375, -0.0269775390625, 0.00994873046875, 0.046875, 0.08380126953125, 0.1207275390625, 0.15765380859375, 0.194580078125, 0.23150634765625, 0.2684326171875, 0.30535888671875, 0.34228515625, 0.37921142578125, 0.4161376953125, 0.45306396484375, 0.489990234375, 0.52691650390625, 0.5638427734375, 0.60076904296875, 0.6376953125, 0.67462158203125, 0.7115478515625, 0.74847412109375, 0.785400390625, 0.82232666015625, 0.8592529296875, 0.89617919921875, 0.93310546875, 0.97003173828125, 1.0069580078125, 1.04388427734375, 1.080810546875, 1.11773681640625, 1.1546630859375, 1.19158935546875, 1.228515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 11.0, 13.0, 18.0, 32.0, 40.0, 55.0, 81.0, 149.0, 232.0, 409.0, 810.0, 1687.0, 4137.0, 13064.0, 47918.0, 224149.0, 578638.0, 131655.0, 30762.0, 8697.0, 3118.0, 1271.0, 637.0, 343.0, 199.0, 114.0, 85.0, 50.0, 46.0, 29.0, 27.0, 15.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.890625, -4.71173095703125, -4.5328369140625, -4.35394287109375, -4.175048828125, -3.99615478515625, -3.8172607421875, -3.63836669921875, -3.45947265625, -3.28057861328125, -3.1016845703125, -2.92279052734375, -2.743896484375, -2.56500244140625, -2.3861083984375, -2.20721435546875, -2.0283203125, -1.84942626953125, -1.6705322265625, -1.49163818359375, -1.312744140625, -1.13385009765625, -0.9549560546875, -0.77606201171875, -0.59716796875, -0.41827392578125, -0.2393798828125, -0.06048583984375, 0.118408203125, 0.29730224609375, 0.4761962890625, 0.65509033203125, 0.833984375, 1.01287841796875, 1.1917724609375, 1.37066650390625, 1.549560546875, 1.72845458984375, 1.9073486328125, 2.08624267578125, 2.26513671875, 2.44403076171875, 2.6229248046875, 2.80181884765625, 2.980712890625, 3.15960693359375, 3.3385009765625, 3.51739501953125, 3.6962890625, 3.87518310546875, 4.0540771484375, 4.23297119140625, 4.411865234375, 4.59075927734375, 4.7696533203125, 4.94854736328125, 5.12744140625, 5.30633544921875, 5.4852294921875, 5.66412353515625, 5.843017578125, 6.02191162109375, 6.2008056640625, 6.37969970703125, 6.55859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 8.0, 15.0, 19.0, 14.0, 16.0, 25.0, 23.0, 38.0, 36.0, 40.0, 49.0, 52.0, 43.0, 50.0, 56.0, 53.0, 45.0, 48.0, 50.0, 53.0, 35.0, 40.0, 24.0, 25.0, 23.0, 19.0, 25.0, 11.0, 8.0, 6.0, 9.0, 11.0, 1.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.977783203125, -3.84619140625, -3.714599609375, -3.5830078125, -3.451416015625, -3.31982421875, -3.188232421875, -3.056640625, -2.925048828125, -2.79345703125, -2.661865234375, -2.5302734375, -2.398681640625, -2.26708984375, -2.135498046875, -2.00390625, -1.872314453125, -1.74072265625, -1.609130859375, -1.4775390625, -1.345947265625, -1.21435546875, -1.082763671875, -0.951171875, -0.819580078125, -0.68798828125, -0.556396484375, -0.4248046875, -0.293212890625, -0.16162109375, -0.030029296875, 0.1015625, 0.233154296875, 0.36474609375, 0.496337890625, 0.6279296875, 0.759521484375, 0.89111328125, 1.022705078125, 1.154296875, 1.285888671875, 1.41748046875, 1.549072265625, 1.6806640625, 1.812255859375, 1.94384765625, 2.075439453125, 2.20703125, 2.338623046875, 2.47021484375, 2.601806640625, 2.7333984375, 2.864990234375, 2.99658203125, 3.128173828125, 3.259765625, 3.391357421875, 3.52294921875, 3.654541015625, 3.7861328125, 3.917724609375, 4.04931640625, 4.180908203125, 4.3125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 14.0, 18.0, 28.0, 52.0, 80.0, 167.0, 340.0, 733.0, 1689.0, 5140.0, 22475.0, 180985.0, 720277.0, 95582.0, 14499.0, 3878.0, 1386.0, 609.0, 251.0, 140.0, 79.0, 36.0, 26.0, 15.0, 10.0, 9.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.85247802734375, -5.6658935546875, -5.47930908203125, -5.292724609375, -5.10614013671875, -4.9195556640625, -4.73297119140625, -4.54638671875, -4.35980224609375, -4.1732177734375, -3.98663330078125, -3.800048828125, -3.61346435546875, -3.4268798828125, -3.24029541015625, -3.0537109375, -2.86712646484375, -2.6805419921875, -2.49395751953125, -2.307373046875, -2.12078857421875, -1.9342041015625, -1.74761962890625, -1.56103515625, -1.37445068359375, -1.1878662109375, -1.00128173828125, -0.814697265625, -0.62811279296875, -0.4415283203125, -0.25494384765625, -0.068359375, 0.11822509765625, 0.3048095703125, 0.49139404296875, 0.677978515625, 0.86456298828125, 1.0511474609375, 1.23773193359375, 1.42431640625, 1.61090087890625, 1.7974853515625, 1.98406982421875, 2.170654296875, 2.35723876953125, 2.5438232421875, 2.73040771484375, 2.9169921875, 3.10357666015625, 3.2901611328125, 3.47674560546875, 3.663330078125, 3.84991455078125, 4.0364990234375, 4.22308349609375, 4.40966796875, 4.59625244140625, 4.7828369140625, 4.96942138671875, 5.156005859375, 5.34259033203125, 5.5291748046875, 5.71575927734375, 5.90234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 19.0, 21.0, 22.0, 36.0, 84.0, 180.0, 257.0, 126.0, 83.0, 48.0, 29.0, 16.0, 14.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.0009905099868774414, -0.0009529590606689453, -0.0009154081344604492, -0.0008778572082519531, -0.000840306282043457, -0.0008027553558349609, -0.0007652044296264648, -0.0007276535034179688, -0.0006901025772094727, -0.0006525516510009766, -0.0006150007247924805, -0.0005774497985839844, -0.0005398988723754883, -0.0005023479461669922, -0.0004647970199584961, -0.00042724609375, -0.0003896951675415039, -0.0003521442413330078, -0.0003145933151245117, -0.0002770423889160156, -0.00023949146270751953, -0.00020194053649902344, -0.00016438961029052734, -0.00012683868408203125, -8.928775787353516e-05, -5.173683166503906e-05, -1.4185905456542969e-05, 2.3365020751953125e-05, 6.091594696044922e-05, 9.846687316894531e-05, 0.0001360177993774414, 0.0001735687255859375, 0.0002111196517944336, 0.0002486705780029297, 0.0002862215042114258, 0.0003237724304199219, 0.00036132335662841797, 0.00039887428283691406, 0.00043642520904541016, 0.00047397613525390625, 0.0005115270614624023, 0.0005490779876708984, 0.0005866289138793945, 0.0006241798400878906, 0.0006617307662963867, 0.0006992816925048828, 0.0007368326187133789, 0.000774383544921875, 0.0008119344711303711, 0.0008494853973388672, 0.0008870363235473633, 0.0009245872497558594, 0.0009621381759643555, 0.0009996891021728516, 0.0010372400283813477, 0.0010747909545898438, 0.0011123418807983398, 0.001149892807006836, 0.001187443733215332, 0.0012249946594238281, 0.0012625455856323242, 0.0013000965118408203, 0.0013376474380493164, 0.0013751983642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 6.0, 8.0, 10.0, 12.0, 23.0, 41.0, 33.0, 48.0, 112.0, 211.0, 509.0, 1216.0, 3551.0, 13769.0, 88331.0, 731933.0, 178599.0, 22049.0, 5269.0, 1581.0, 605.0, 292.0, 129.0, 88.0, 44.0, 30.0, 18.0, 17.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.9296875, -6.7503662109375, -6.571044921875, -6.3917236328125, -6.21240234375, -6.0330810546875, -5.853759765625, -5.6744384765625, -5.4951171875, -5.3157958984375, -5.136474609375, -4.9571533203125, -4.77783203125, -4.5985107421875, -4.419189453125, -4.2398681640625, -4.060546875, -3.8812255859375, -3.701904296875, -3.5225830078125, -3.34326171875, -3.1639404296875, -2.984619140625, -2.8052978515625, -2.6259765625, -2.4466552734375, -2.267333984375, -2.0880126953125, -1.90869140625, -1.7293701171875, -1.550048828125, -1.3707275390625, -1.19140625, -1.0120849609375, -0.832763671875, -0.6534423828125, -0.47412109375, -0.2947998046875, -0.115478515625, 0.0638427734375, 0.2431640625, 0.4224853515625, 0.601806640625, 0.7811279296875, 0.96044921875, 1.1397705078125, 1.319091796875, 1.4984130859375, 1.677734375, 1.8570556640625, 2.036376953125, 2.2156982421875, 2.39501953125, 2.5743408203125, 2.753662109375, 2.9329833984375, 3.1123046875, 3.2916259765625, 3.470947265625, 3.6502685546875, 3.82958984375, 4.0089111328125, 4.188232421875, 4.3675537109375, 4.546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 6.0, 14.0, 23.0, 30.0, 52.0, 60.0, 81.0, 132.0, 153.0, 121.0, 77.0, 54.0, 39.0, 33.0, 22.0, 19.0, 14.0, 14.0, 6.0, 5.0, 2.0, 1.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.91156005859375, -3.8074951171875, -3.70343017578125, -3.599365234375, -3.49530029296875, -3.3912353515625, -3.28717041015625, -3.18310546875, -3.07904052734375, -2.9749755859375, -2.87091064453125, -2.766845703125, -2.66278076171875, -2.5587158203125, -2.45465087890625, -2.3505859375, -2.24652099609375, -2.1424560546875, -2.03839111328125, -1.934326171875, -1.83026123046875, -1.7261962890625, -1.62213134765625, -1.51806640625, -1.41400146484375, -1.3099365234375, -1.20587158203125, -1.101806640625, -0.99774169921875, -0.8936767578125, -0.78961181640625, -0.685546875, -0.58148193359375, -0.4774169921875, -0.37335205078125, -0.269287109375, -0.16522216796875, -0.0611572265625, 0.04290771484375, 0.14697265625, 0.25103759765625, 0.3551025390625, 0.45916748046875, 0.563232421875, 0.66729736328125, 0.7713623046875, 0.87542724609375, 0.9794921875, 1.08355712890625, 1.1876220703125, 1.29168701171875, 1.395751953125, 1.49981689453125, 1.6038818359375, 1.70794677734375, 1.81201171875, 1.91607666015625, 2.0201416015625, 2.12420654296875, 2.228271484375, 2.33233642578125, 2.4364013671875, 2.54046630859375, 2.64453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 16.0, 30.0, 33.0, 46.0, 97.0, 138.0, 122.0, 125.0, 96.0, 101.0, 68.0, 46.0, 32.0, 17.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.55727767944336, -18.358530044555664, -17.15978240966797, -15.961034774780273, -14.762287139892578, -13.563539505004883, -12.364792823791504, -11.166045188903809, -9.967297554016113, -8.768549919128418, -7.569802284240723, -6.3710551261901855, -5.17230749130249, -3.973559856414795, -2.774812698364258, -1.5760650634765625, -0.3773174285888672, 0.8214300870895386, 2.0201776027679443, 3.2189249992370605, 4.417672634124756, 5.616420269012451, 6.815167427062988, 8.013915061950684, 9.212662696838379, 10.411410331726074, 11.61015796661377, 12.808904647827148, 14.007652282714844, 15.206399917602539, 16.405147552490234, 17.60389518737793, 18.802642822265625, 20.00139045715332, 21.200138092041016, 22.39888572692871, 23.597633361816406, 24.7963809967041, 25.995128631591797, 27.19387435913086, 28.392623901367188, 29.591371536254883, 30.790119171142578, 31.988866806030273, 33.18761444091797, 34.38636016845703, 35.58510971069336, 36.78385543823242, 37.98260498046875, 39.18135070800781, 40.38010025024414, 41.5788459777832, 42.77759552001953, 43.976341247558594, 45.17509078979492, 46.373836517333984, 47.57258224487305, 48.77132797241211, 49.97007751464844, 51.1688232421875, 52.36757278442383, 53.56631851196289, 54.76506805419922, 55.96381378173828, 57.16256332397461]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 4.0, 6.0, 7.0, 15.0, 7.0, 13.0, 18.0, 21.0, 17.0, 21.0, 26.0, 40.0, 31.0, 35.0, 51.0, 41.0, 46.0, 57.0, 55.0, 53.0, 42.0, 44.0, 45.0, 43.0, 42.0, 28.0, 34.0, 28.0, 17.0, 21.0, 15.0, 10.0, 9.0, 9.0, 13.0, 7.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.261754989624023, -22.515945434570312, -21.770137786865234, -21.024328231811523, -20.278520584106445, -19.532711029052734, -18.786903381347656, -18.041093826293945, -17.295284271240234, -16.549474716186523, -15.803667068481445, -15.057857513427734, -14.312049865722656, -13.566240310668945, -12.82043170928955, -12.074623107910156, -11.328815460205078, -10.583006858825684, -9.837198257446289, -9.091388702392578, -8.3455810546875, -7.599771976470947, -6.8539628982543945, -6.108154296875, -5.3623456954956055, -4.616537094116211, -3.8707282543182373, -3.1249194145202637, -2.379110813140869, -1.6333022117614746, -0.8874931335449219, -0.14168453216552734, 0.6041259765625, 1.349934697151184, 2.095743417739868, 2.841552257537842, 3.5873608589172363, 4.333169460296631, 5.078978538513184, 5.824787139892578, 6.570595741271973, 7.316404342651367, 8.062212944030762, 8.808021545410156, 9.553831100463867, 10.299638748168945, 11.045448303222656, 11.79125690460205, 12.537065505981445, 13.28287410736084, 14.028682708740234, 14.774492263793945, 15.520299911499023, 16.266109466552734, 17.011917114257812, 17.757726669311523, 18.503536224365234, 19.249345779418945, 19.995153427124023, 20.740962982177734, 21.486770629882812, 22.232580184936523, 22.978389739990234, 23.724197387695312, 24.47000503540039]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 13.0, 37.0, 44.0, 70.0, 129.0, 190.0, 315.0, 656.0, 1445.0, 3117.0, 8351.0, 28304.0, 147610.0, 3687280.0, 259215.0, 39554.0, 10922.0, 3875.0, 1561.0, 712.0, 360.0, 200.0, 96.0, 51.0, 44.0, 34.0, 25.0, 10.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.3046875, -6.0987548828125, -5.892822265625, -5.6868896484375, -5.48095703125, -5.2750244140625, -5.069091796875, -4.8631591796875, -4.6572265625, -4.4512939453125, -4.245361328125, -4.0394287109375, -3.83349609375, -3.6275634765625, -3.421630859375, -3.2156982421875, -3.009765625, -2.8038330078125, -2.597900390625, -2.3919677734375, -2.18603515625, -1.9801025390625, -1.774169921875, -1.5682373046875, -1.3623046875, -1.1563720703125, -0.950439453125, -0.7445068359375, -0.53857421875, -0.3326416015625, -0.126708984375, 0.0792236328125, 0.28515625, 0.4910888671875, 0.697021484375, 0.9029541015625, 1.10888671875, 1.3148193359375, 1.520751953125, 1.7266845703125, 1.9326171875, 2.1385498046875, 2.344482421875, 2.5504150390625, 2.75634765625, 2.9622802734375, 3.168212890625, 3.3741455078125, 3.580078125, 3.7860107421875, 3.991943359375, 4.1978759765625, 4.40380859375, 4.6097412109375, 4.815673828125, 5.0216064453125, 5.2275390625, 5.4334716796875, 5.639404296875, 5.8453369140625, 6.05126953125, 6.2572021484375, 6.463134765625, 6.6690673828125, 6.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 14.0, 24.0, 30.0, 21.0, 28.0, 49.0, 51.0, 72.0, 72.0, 75.0, 71.0, 68.0, 59.0, 68.0, 59.0, 44.0, 36.0, 35.0, 29.0, 22.0, 13.0, 7.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.090240478515625, -1.05352783203125, -1.016815185546875, -0.9801025390625, -0.943389892578125, -0.90667724609375, -0.869964599609375, -0.833251953125, -0.796539306640625, -0.75982666015625, -0.723114013671875, -0.6864013671875, -0.649688720703125, -0.61297607421875, -0.576263427734375, -0.53955078125, -0.502838134765625, -0.46612548828125, -0.429412841796875, -0.3927001953125, -0.355987548828125, -0.31927490234375, -0.282562255859375, -0.245849609375, -0.209136962890625, -0.17242431640625, -0.135711669921875, -0.0989990234375, -0.062286376953125, -0.02557373046875, 0.011138916015625, 0.0478515625, 0.084564208984375, 0.12127685546875, 0.157989501953125, 0.1947021484375, 0.231414794921875, 0.26812744140625, 0.304840087890625, 0.341552734375, 0.378265380859375, 0.41497802734375, 0.451690673828125, 0.4884033203125, 0.525115966796875, 0.56182861328125, 0.598541259765625, 0.63525390625, 0.671966552734375, 0.70867919921875, 0.745391845703125, 0.7821044921875, 0.818817138671875, 0.85552978515625, 0.892242431640625, 0.928955078125, 0.965667724609375, 1.00238037109375, 1.039093017578125, 1.0758056640625, 1.112518310546875, 1.14923095703125, 1.185943603515625, 1.22265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 17.0, 22.0, 19.0, 29.0, 61.0, 90.0, 127.0, 165.0, 298.0, 445.0, 760.0, 1339.0, 2495.0, 4737.0, 10565.0, 26543.0, 79723.0, 372464.0, 3268576.0, 309986.0, 71362.0, 24352.0, 9928.0, 4515.0, 2311.0, 1270.0, 776.0, 433.0, 266.0, 183.0, 118.0, 81.0, 65.0, 43.0, 18.0, 18.0, 19.0, 11.0, 6.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0234375, -4.86865234375, -4.7138671875, -4.55908203125, -4.404296875, -4.24951171875, -4.0947265625, -3.93994140625, -3.78515625, -3.63037109375, -3.4755859375, -3.32080078125, -3.166015625, -3.01123046875, -2.8564453125, -2.70166015625, -2.546875, -2.39208984375, -2.2373046875, -2.08251953125, -1.927734375, -1.77294921875, -1.6181640625, -1.46337890625, -1.30859375, -1.15380859375, -0.9990234375, -0.84423828125, -0.689453125, -0.53466796875, -0.3798828125, -0.22509765625, -0.0703125, 0.08447265625, 0.2392578125, 0.39404296875, 0.548828125, 0.70361328125, 0.8583984375, 1.01318359375, 1.16796875, 1.32275390625, 1.4775390625, 1.63232421875, 1.787109375, 1.94189453125, 2.0966796875, 2.25146484375, 2.40625, 2.56103515625, 2.7158203125, 2.87060546875, 3.025390625, 3.18017578125, 3.3349609375, 3.48974609375, 3.64453125, 3.79931640625, 3.9541015625, 4.10888671875, 4.263671875, 4.41845703125, 4.5732421875, 4.72802734375, 4.8828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 15.0, 25.0, 39.0, 51.0, 72.0, 109.0, 174.0, 403.0, 1709.0, 755.0, 273.0, 155.0, 83.0, 46.0, 35.0, 37.0, 17.0, 13.0, 4.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.705322265625, -2.62744140625, -2.549560546875, -2.4716796875, -2.393798828125, -2.31591796875, -2.238037109375, -2.16015625, -2.082275390625, -2.00439453125, -1.926513671875, -1.8486328125, -1.770751953125, -1.69287109375, -1.614990234375, -1.537109375, -1.459228515625, -1.38134765625, -1.303466796875, -1.2255859375, -1.147705078125, -1.06982421875, -0.991943359375, -0.9140625, -0.836181640625, -0.75830078125, -0.680419921875, -0.6025390625, -0.524658203125, -0.44677734375, -0.368896484375, -0.291015625, -0.213134765625, -0.13525390625, -0.057373046875, 0.0205078125, 0.098388671875, 0.17626953125, 0.254150390625, 0.33203125, 0.409912109375, 0.48779296875, 0.565673828125, 0.6435546875, 0.721435546875, 0.79931640625, 0.877197265625, 0.955078125, 1.032958984375, 1.11083984375, 1.188720703125, 1.2666015625, 1.344482421875, 1.42236328125, 1.500244140625, 1.578125, 1.656005859375, 1.73388671875, 1.811767578125, 1.8896484375, 1.967529296875, 2.04541015625, 2.123291015625, 2.201171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 30.0, 80.0, 171.0, 237.0, 230.0, 137.0, 60.0, 18.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.856782913208008, -29.00043296813965, -28.14408302307129, -27.28773307800293, -26.431381225585938, -25.575031280517578, -24.71868133544922, -23.86233139038086, -23.0059814453125, -22.14963150024414, -21.29328155517578, -20.436931610107422, -19.580581665039062, -18.724231719970703, -17.86787986755371, -17.01152992248535, -16.155179977416992, -15.298830032348633, -14.442480087280273, -13.586129188537598, -12.729779243469238, -11.873429298400879, -11.017078399658203, -10.160728454589844, -9.304378509521484, -8.448028564453125, -7.591678142547607, -6.73532772064209, -5.8789777755737305, -5.022627830505371, -4.1662774085998535, -3.309926986694336, -2.4535751342773438, -1.5972249507904053, -0.7408747673034668, 0.11547541618347168, 0.9718255996704102, 1.8281755447387695, 2.684525966644287, 3.5408763885498047, 4.397226333618164, 5.253576278686523, 6.109926700592041, 6.966277122497559, 7.822627067565918, 8.678977012634277, 9.535327911376953, 10.391677856445312, 11.248027801513672, 12.104377746582031, 12.96072769165039, 13.817078590393066, 14.673428535461426, 15.529778480529785, 16.38612937927246, 17.24247932434082, 18.09882926940918, 18.95517921447754, 19.8115291595459, 20.667879104614258, 21.52423095703125, 22.38058090209961, 23.23693084716797, 24.093280792236328, 24.949630737304688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 2.0, 11.0, 19.0, 17.0, 24.0, 22.0, 32.0, 29.0, 43.0, 35.0, 47.0, 38.0, 63.0, 52.0, 47.0, 48.0, 48.0, 56.0, 35.0, 41.0, 45.0, 33.0, 32.0, 33.0, 26.0, 20.0, 19.0, 17.0, 11.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.195155143737793, -7.932441234588623, -7.669727325439453, -7.407013893127441, -7.1442999839782715, -6.881586074829102, -6.61887264251709, -6.35615873336792, -6.09344482421875, -5.83073091506958, -5.56801700592041, -5.305303573608398, -5.0425896644592285, -4.779875755310059, -4.517162322998047, -4.254448413848877, -3.991734504699707, -3.729020595550537, -3.4663069248199463, -3.2035932540893555, -2.9408793449401855, -2.6781654357910156, -2.415451765060425, -2.152738094329834, -1.890024185180664, -1.6273103952407837, -1.3645966053009033, -1.101882815361023, -0.8391690254211426, -0.5764552354812622, -0.31374144554138184, -0.051027655601501465, 0.2116870880126953, 0.4744008779525757, 0.737114667892456, 0.9998284578323364, 1.2625422477722168, 1.5252560377120972, 1.7879698276519775, 2.0506834983825684, 2.3133974075317383, 2.576111316680908, 2.838824987411499, 3.10153865814209, 3.3642525672912598, 3.6269664764404297, 3.8896801471710205, 4.152393817901611, 4.415107727050781, 4.677821636199951, 4.940535545349121, 5.203248977661133, 5.465962886810303, 5.728676795959473, 5.991390228271484, 6.254104137420654, 6.516818046569824, 6.779531955718994, 7.042245864868164, 7.304959297180176, 7.567673206329346, 7.830387115478516, 8.093100547790527, 8.355814933776855, 8.618528366088867]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 8.0, 19.0, 18.0, 20.0, 35.0, 51.0, 88.0, 122.0, 223.0, 342.0, 608.0, 1307.0, 2633.0, 5583.0, 13045.0, 32509.0, 88298.0, 278579.0, 413352.0, 132316.0, 46381.0, 18195.0, 7632.0, 3457.0, 1757.0, 847.0, 435.0, 250.0, 135.0, 98.0, 68.0, 49.0, 25.0, 21.0, 9.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.87591552734375, -4.7088623046875, -4.54180908203125, -4.374755859375, -4.20770263671875, -4.0406494140625, -3.87359619140625, -3.70654296875, -3.53948974609375, -3.3724365234375, -3.20538330078125, -3.038330078125, -2.87127685546875, -2.7042236328125, -2.53717041015625, -2.3701171875, -2.20306396484375, -2.0360107421875, -1.86895751953125, -1.701904296875, -1.53485107421875, -1.3677978515625, -1.20074462890625, -1.03369140625, -0.86663818359375, -0.6995849609375, -0.53253173828125, -0.365478515625, -0.19842529296875, -0.0313720703125, 0.13568115234375, 0.302734375, 0.46978759765625, 0.6368408203125, 0.80389404296875, 0.970947265625, 1.13800048828125, 1.3050537109375, 1.47210693359375, 1.63916015625, 1.80621337890625, 1.9732666015625, 2.14031982421875, 2.307373046875, 2.47442626953125, 2.6414794921875, 2.80853271484375, 2.9755859375, 3.14263916015625, 3.3096923828125, 3.47674560546875, 3.643798828125, 3.81085205078125, 3.9779052734375, 4.14495849609375, 4.31201171875, 4.47906494140625, 4.6461181640625, 4.81317138671875, 4.980224609375, 5.14727783203125, 5.3143310546875, 5.48138427734375, 5.6484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 6.0, 10.0, 13.0, 16.0, 11.0, 21.0, 21.0, 23.0, 31.0, 33.0, 44.0, 52.0, 61.0, 76.0, 56.0, 62.0, 57.0, 61.0, 55.0, 44.0, 41.0, 39.0, 40.0, 35.0, 19.0, 20.0, 8.0, 13.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.898040771484375, -0.86541748046875, -0.832794189453125, -0.8001708984375, -0.767547607421875, -0.73492431640625, -0.702301025390625, -0.669677734375, -0.637054443359375, -0.60443115234375, -0.571807861328125, -0.5391845703125, -0.506561279296875, -0.47393798828125, -0.441314697265625, -0.40869140625, -0.376068115234375, -0.34344482421875, -0.310821533203125, -0.2781982421875, -0.245574951171875, -0.21295166015625, -0.180328369140625, -0.147705078125, -0.115081787109375, -0.08245849609375, -0.049835205078125, -0.0172119140625, 0.015411376953125, 0.04803466796875, 0.080657958984375, 0.11328125, 0.145904541015625, 0.17852783203125, 0.211151123046875, 0.2437744140625, 0.276397705078125, 0.30902099609375, 0.341644287109375, 0.374267578125, 0.406890869140625, 0.43951416015625, 0.472137451171875, 0.5047607421875, 0.537384033203125, 0.57000732421875, 0.602630615234375, 0.63525390625, 0.667877197265625, 0.70050048828125, 0.733123779296875, 0.7657470703125, 0.798370361328125, 0.83099365234375, 0.863616943359375, 0.896240234375, 0.928863525390625, 0.96148681640625, 0.994110107421875, 1.0267333984375, 1.059356689453125, 1.09197998046875, 1.124603271484375, 1.1572265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 13.0, 10.0, 11.0, 15.0, 34.0, 33.0, 54.0, 75.0, 111.0, 196.0, 346.0, 583.0, 1245.0, 3311.0, 13385.0, 79009.0, 573452.0, 319610.0, 43967.0, 8559.0, 2387.0, 963.0, 434.0, 240.0, 161.0, 109.0, 81.0, 32.0, 30.0, 18.0, 15.0, 14.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.89306640625, -6.6455078125, -6.39794921875, -6.150390625, -5.90283203125, -5.6552734375, -5.40771484375, -5.16015625, -4.91259765625, -4.6650390625, -4.41748046875, -4.169921875, -3.92236328125, -3.6748046875, -3.42724609375, -3.1796875, -2.93212890625, -2.6845703125, -2.43701171875, -2.189453125, -1.94189453125, -1.6943359375, -1.44677734375, -1.19921875, -0.95166015625, -0.7041015625, -0.45654296875, -0.208984375, 0.03857421875, 0.2861328125, 0.53369140625, 0.78125, 1.02880859375, 1.2763671875, 1.52392578125, 1.771484375, 2.01904296875, 2.2666015625, 2.51416015625, 2.76171875, 3.00927734375, 3.2568359375, 3.50439453125, 3.751953125, 3.99951171875, 4.2470703125, 4.49462890625, 4.7421875, 4.98974609375, 5.2373046875, 5.48486328125, 5.732421875, 5.97998046875, 6.2275390625, 6.47509765625, 6.72265625, 6.97021484375, 7.2177734375, 7.46533203125, 7.712890625, 7.96044921875, 8.2080078125, 8.45556640625, 8.703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 5.0, 10.0, 7.0, 12.0, 11.0, 15.0, 16.0, 21.0, 35.0, 32.0, 30.0, 30.0, 53.0, 44.0, 49.0, 61.0, 54.0, 45.0, 57.0, 42.0, 60.0, 33.0, 41.0, 48.0, 34.0, 29.0, 16.0, 28.0, 11.0, 16.0, 17.0, 11.0, 4.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.222412109375, -4.07763671875, -3.932861328125, -3.7880859375, -3.643310546875, -3.49853515625, -3.353759765625, -3.208984375, -3.064208984375, -2.91943359375, -2.774658203125, -2.6298828125, -2.485107421875, -2.34033203125, -2.195556640625, -2.05078125, -1.906005859375, -1.76123046875, -1.616455078125, -1.4716796875, -1.326904296875, -1.18212890625, -1.037353515625, -0.892578125, -0.747802734375, -0.60302734375, -0.458251953125, -0.3134765625, -0.168701171875, -0.02392578125, 0.120849609375, 0.265625, 0.410400390625, 0.55517578125, 0.699951171875, 0.8447265625, 0.989501953125, 1.13427734375, 1.279052734375, 1.423828125, 1.568603515625, 1.71337890625, 1.858154296875, 2.0029296875, 2.147705078125, 2.29248046875, 2.437255859375, 2.58203125, 2.726806640625, 2.87158203125, 3.016357421875, 3.1611328125, 3.305908203125, 3.45068359375, 3.595458984375, 3.740234375, 3.885009765625, 4.02978515625, 4.174560546875, 4.3193359375, 4.464111328125, 4.60888671875, 4.753662109375, 4.8984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 5.0, 17.0, 15.0, 34.0, 40.0, 60.0, 99.0, 130.0, 219.0, 448.0, 1001.0, 2514.0, 9453.0, 84466.0, 836295.0, 98544.0, 10387.0, 2634.0, 1051.0, 480.0, 241.0, 141.0, 93.0, 44.0, 42.0, 30.0, 19.0, 13.0, 6.0, 6.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58203125, -7.29620361328125, -7.0103759765625, -6.72454833984375, -6.438720703125, -6.15289306640625, -5.8670654296875, -5.58123779296875, -5.29541015625, -5.00958251953125, -4.7237548828125, -4.43792724609375, -4.152099609375, -3.86627197265625, -3.5804443359375, -3.29461669921875, -3.0087890625, -2.72296142578125, -2.4371337890625, -2.15130615234375, -1.865478515625, -1.57965087890625, -1.2938232421875, -1.00799560546875, -0.72216796875, -0.43634033203125, -0.1505126953125, 0.13531494140625, 0.421142578125, 0.70697021484375, 0.9927978515625, 1.27862548828125, 1.564453125, 1.85028076171875, 2.1361083984375, 2.42193603515625, 2.707763671875, 2.99359130859375, 3.2794189453125, 3.56524658203125, 3.85107421875, 4.13690185546875, 4.4227294921875, 4.70855712890625, 4.994384765625, 5.28021240234375, 5.5660400390625, 5.85186767578125, 6.1376953125, 6.42352294921875, 6.7093505859375, 6.99517822265625, 7.281005859375, 7.56683349609375, 7.8526611328125, 8.13848876953125, 8.42431640625, 8.71014404296875, 8.9959716796875, 9.28179931640625, 9.567626953125, 9.85345458984375, 10.1392822265625, 10.42510986328125, 10.7109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 13.0, 12.0, 17.0, 24.0, 43.0, 41.0, 61.0, 134.0, 141.0, 142.0, 91.0, 43.0, 45.0, 29.0, 19.0, 19.0, 21.0, 10.0, 6.0, 10.0, 3.0, 8.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008206367492675781, -0.0007954463362693787, -0.0007702559232711792, -0.0007450655102729797, -0.0007198750972747803, -0.0006946846842765808, -0.0006694942712783813, -0.0006443038582801819, -0.0006191134452819824, -0.000593923032283783, -0.0005687326192855835, -0.000543542206287384, -0.0005183517932891846, -0.0004931613802909851, -0.00046797096729278564, -0.0004427805542945862, -0.0004175901412963867, -0.00039239972829818726, -0.0003672093152999878, -0.00034201890230178833, -0.00031682848930358887, -0.0002916380763053894, -0.00026644766330718994, -0.00024125725030899048, -0.00021606683731079102, -0.00019087642431259155, -0.0001656860113143921, -0.00014049559831619263, -0.00011530518531799316, -9.01147723197937e-05, -6.492435932159424e-05, -3.9733946323394775e-05, -1.4543533325195312e-05, 1.064687967300415e-05, 3.583729267120361e-05, 6.1027705669403076e-05, 8.621811866760254e-05, 0.000111408531665802, 0.00013659894466400146, 0.00016178935766220093, 0.0001869797706604004, 0.00021217018365859985, 0.00023736059665679932, 0.0002625510096549988, 0.00028774142265319824, 0.0003129318356513977, 0.00033812224864959717, 0.00036331266164779663, 0.0003885030746459961, 0.00041369348764419556, 0.000438883900642395, 0.0004640743136405945, 0.0004892647266387939, 0.0005144551396369934, 0.0005396455526351929, 0.0005648359656333923, 0.0005900263786315918, 0.0006152167916297913, 0.0006404072046279907, 0.0006655976176261902, 0.0006907880306243896, 0.0007159784436225891, 0.0007411688566207886, 0.000766359269618988, 0.0007915496826171875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 27.0, 32.0, 74.0, 124.0, 284.0, 772.0, 2704.0, 15629.0, 792614.0, 225289.0, 8176.0, 1681.0, 621.0, 235.0, 121.0, 56.0, 26.0, 18.0, 16.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.015625, -15.592529296875, -15.16943359375, -14.746337890625, -14.3232421875, -13.900146484375, -13.47705078125, -13.053955078125, -12.630859375, -12.207763671875, -11.78466796875, -11.361572265625, -10.9384765625, -10.515380859375, -10.09228515625, -9.669189453125, -9.24609375, -8.822998046875, -8.39990234375, -7.976806640625, -7.5537109375, -7.130615234375, -6.70751953125, -6.284423828125, -5.861328125, -5.438232421875, -5.01513671875, -4.592041015625, -4.1689453125, -3.745849609375, -3.32275390625, -2.899658203125, -2.4765625, -2.053466796875, -1.63037109375, -1.207275390625, -0.7841796875, -0.361083984375, 0.06201171875, 0.485107421875, 0.908203125, 1.331298828125, 1.75439453125, 2.177490234375, 2.6005859375, 3.023681640625, 3.44677734375, 3.869873046875, 4.29296875, 4.716064453125, 5.13916015625, 5.562255859375, 5.9853515625, 6.408447265625, 6.83154296875, 7.254638671875, 7.677734375, 8.100830078125, 8.52392578125, 8.947021484375, 9.3701171875, 9.793212890625, 10.21630859375, 10.639404296875, 11.0625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 7.0, 18.0, 21.0, 32.0, 71.0, 96.0, 130.0, 168.0, 135.0, 95.0, 69.0, 51.0, 29.0, 9.0, 14.0, 5.0, 10.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.33721923828125, -4.1744384765625, -4.01165771484375, -3.848876953125, -3.68609619140625, -3.5233154296875, -3.36053466796875, -3.19775390625, -3.03497314453125, -2.8721923828125, -2.70941162109375, -2.546630859375, -2.38385009765625, -2.2210693359375, -2.05828857421875, -1.8955078125, -1.73272705078125, -1.5699462890625, -1.40716552734375, -1.244384765625, -1.08160400390625, -0.9188232421875, -0.75604248046875, -0.59326171875, -0.43048095703125, -0.2677001953125, -0.10491943359375, 0.057861328125, 0.22064208984375, 0.3834228515625, 0.54620361328125, 0.708984375, 0.87176513671875, 1.0345458984375, 1.19732666015625, 1.360107421875, 1.52288818359375, 1.6856689453125, 1.84844970703125, 2.01123046875, 2.17401123046875, 2.3367919921875, 2.49957275390625, 2.662353515625, 2.82513427734375, 2.9879150390625, 3.15069580078125, 3.3134765625, 3.47625732421875, 3.6390380859375, 3.80181884765625, 3.964599609375, 4.12738037109375, 4.2901611328125, 4.45294189453125, 4.61572265625, 4.77850341796875, 4.9412841796875, 5.10406494140625, 5.266845703125, 5.42962646484375, 5.5924072265625, 5.75518798828125, 5.91796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 13.0, 37.0, 150.0, 317.0, 277.0, 149.0, 39.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.17984008789062, -138.70510864257812, -135.23037719726562, -131.7556610107422, -128.2809295654297, -124.80619812011719, -121.33146667480469, -117.85674285888672, -114.38201141357422, -110.90727996826172, -107.43255615234375, -103.95782470703125, -100.48310089111328, -97.00836944580078, -93.53364562988281, -90.05891418457031, -86.58418273925781, -83.10945129394531, -79.63472747802734, -76.15999603271484, -72.68527221679688, -69.21054077148438, -65.73580932617188, -62.261085510253906, -58.78636169433594, -55.3116340637207, -51.83690643310547, -48.36217498779297, -44.887447357177734, -41.4127197265625, -37.937992095947266, -34.46326446533203, -30.98853302001953, -27.513805389404297, -24.03907585144043, -20.564348220825195, -17.089618682861328, -13.614891052246094, -10.14016342163086, -6.665433883666992, -3.190706253051758, 0.28402209281921387, 3.7587504386901855, 7.233478546142578, 10.708207130432129, 14.18293571472168, 17.657663345336914, 21.13239288330078, 24.607120513916016, 28.08184814453125, 31.556577682495117, 35.03130340576172, 38.50603485107422, 41.98076248168945, 45.45549011230469, 48.93022155761719, 52.404945373535156, 55.87967300415039, 59.354400634765625, 62.829132080078125, 66.3038558959961, 69.7785873413086, 73.25331115722656, 76.72804260253906, 80.20277404785156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 13.0, 10.0, 14.0, 8.0, 25.0, 23.0, 18.0, 24.0, 22.0, 34.0, 24.0, 35.0, 30.0, 54.0, 40.0, 42.0, 43.0, 45.0, 39.0, 45.0, 45.0, 33.0, 45.0, 31.0, 23.0, 32.0, 28.0, 15.0, 16.0, 18.0, 11.0, 12.0, 16.0, 20.0, 7.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.59099769592285, -21.890220642089844, -21.189443588256836, -20.488666534423828, -19.78788948059082, -19.087112426757812, -18.386335372924805, -17.685558319091797, -16.98478126525879, -16.28400421142578, -15.583227157592773, -14.882450103759766, -14.181673049926758, -13.48089599609375, -12.780118942260742, -12.079341888427734, -11.378564834594727, -10.677787780761719, -9.977010726928711, -9.276233673095703, -8.575456619262695, -7.8746795654296875, -7.17390251159668, -6.473125457763672, -5.772348403930664, -5.071571350097656, -4.370794296264648, -3.6700172424316406, -2.969240188598633, -2.268463134765625, -1.5676860809326172, -0.8669090270996094, -0.16613388061523438, 0.5346431732177734, 1.2354202270507812, 1.936197280883789, 2.636974334716797, 3.3377513885498047, 4.0385284423828125, 4.73930549621582, 5.440082550048828, 6.140859603881836, 6.841636657714844, 7.542413711547852, 8.24319076538086, 8.943967819213867, 9.644744873046875, 10.345521926879883, 11.04629898071289, 11.747076034545898, 12.447853088378906, 13.148630142211914, 13.849407196044922, 14.55018424987793, 15.250961303710938, 15.951738357543945, 16.652515411376953, 17.35329246520996, 18.05406951904297, 18.754846572875977, 19.455623626708984, 20.156400680541992, 20.857177734375, 21.557954788208008, 22.258731842041016]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 20.0, 24.0, 24.0, 50.0, 67.0, 135.0, 213.0, 387.0, 696.0, 1410.0, 3332.0, 8569.0, 26686.0, 118018.0, 3131608.0, 794106.0, 77981.0, 19704.0, 6503.0, 2466.0, 1111.0, 503.0, 283.0, 144.0, 85.0, 46.0, 30.0, 27.0, 14.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -3.97454833984375, -3.7928466796875, -3.61114501953125, -3.429443359375, -3.24774169921875, -3.0660400390625, -2.88433837890625, -2.70263671875, -2.52093505859375, -2.3392333984375, -2.15753173828125, -1.975830078125, -1.79412841796875, -1.6124267578125, -1.43072509765625, -1.2490234375, -1.06732177734375, -0.8856201171875, -0.70391845703125, -0.522216796875, -0.34051513671875, -0.1588134765625, 0.02288818359375, 0.20458984375, 0.38629150390625, 0.5679931640625, 0.74969482421875, 0.931396484375, 1.11309814453125, 1.2947998046875, 1.47650146484375, 1.658203125, 1.83990478515625, 2.0216064453125, 2.20330810546875, 2.385009765625, 2.56671142578125, 2.7484130859375, 2.93011474609375, 3.11181640625, 3.29351806640625, 3.4752197265625, 3.65692138671875, 3.838623046875, 4.02032470703125, 4.2020263671875, 4.38372802734375, 4.5654296875, 4.74713134765625, 4.9288330078125, 5.11053466796875, 5.292236328125, 5.47393798828125, 5.6556396484375, 5.83734130859375, 6.01904296875, 6.20074462890625, 6.3824462890625, 6.56414794921875, 6.745849609375, 6.92755126953125, 7.1092529296875, 7.29095458984375, 7.47265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 5.0, 8.0, 12.0, 5.0, 18.0, 27.0, 15.0, 31.0, 42.0, 46.0, 62.0, 52.0, 56.0, 55.0, 62.0, 67.0, 51.0, 56.0, 59.0, 50.0, 49.0, 38.0, 25.0, 35.0, 13.0, 12.0, 10.0, 4.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -1.0113372802734375, -0.974822998046875, -0.9383087158203125, -0.90179443359375, -0.8652801513671875, -0.828765869140625, -0.7922515869140625, -0.7557373046875, -0.7192230224609375, -0.682708740234375, -0.6461944580078125, -0.60968017578125, -0.5731658935546875, -0.536651611328125, -0.5001373291015625, -0.463623046875, -0.4271087646484375, -0.390594482421875, -0.3540802001953125, -0.31756591796875, -0.2810516357421875, -0.244537353515625, -0.2080230712890625, -0.1715087890625, -0.1349945068359375, -0.098480224609375, -0.0619659423828125, -0.02545166015625, 0.0110626220703125, 0.047576904296875, 0.0840911865234375, 0.12060546875, 0.1571197509765625, 0.193634033203125, 0.2301483154296875, 0.26666259765625, 0.3031768798828125, 0.339691162109375, 0.3762054443359375, 0.4127197265625, 0.4492340087890625, 0.485748291015625, 0.5222625732421875, 0.55877685546875, 0.5952911376953125, 0.631805419921875, 0.6683197021484375, 0.704833984375, 0.7413482666015625, 0.777862548828125, 0.8143768310546875, 0.85089111328125, 0.8874053955078125, 0.923919677734375, 0.9604339599609375, 0.9969482421875, 1.0334625244140625, 1.069976806640625, 1.1064910888671875, 1.14300537109375, 1.1795196533203125, 1.216033935546875, 1.2525482177734375, 1.2890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 9.0, 16.0, 24.0, 30.0, 48.0, 72.0, 124.0, 211.0, 333.0, 607.0, 1049.0, 1938.0, 3647.0, 7759.0, 17973.0, 49154.0, 177594.0, 2260314.0, 1437548.0, 158003.0, 45190.0, 17102.0, 7528.0, 3657.0, 1790.0, 1022.0, 559.0, 317.0, 208.0, 151.0, 103.0, 62.0, 50.0, 19.0, 27.0, 5.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.05859375, -4.91387939453125, -4.7691650390625, -4.62445068359375, -4.479736328125, -4.33502197265625, -4.1903076171875, -4.04559326171875, -3.90087890625, -3.75616455078125, -3.6114501953125, -3.46673583984375, -3.322021484375, -3.17730712890625, -3.0325927734375, -2.88787841796875, -2.7431640625, -2.59844970703125, -2.4537353515625, -2.30902099609375, -2.164306640625, -2.01959228515625, -1.8748779296875, -1.73016357421875, -1.58544921875, -1.44073486328125, -1.2960205078125, -1.15130615234375, -1.006591796875, -0.86187744140625, -0.7171630859375, -0.57244873046875, -0.427734375, -0.28302001953125, -0.1383056640625, 0.00640869140625, 0.151123046875, 0.29583740234375, 0.4405517578125, 0.58526611328125, 0.72998046875, 0.87469482421875, 1.0194091796875, 1.16412353515625, 1.308837890625, 1.45355224609375, 1.5982666015625, 1.74298095703125, 1.8876953125, 2.03240966796875, 2.1771240234375, 2.32183837890625, 2.466552734375, 2.61126708984375, 2.7559814453125, 2.90069580078125, 3.04541015625, 3.19012451171875, 3.3348388671875, 3.47955322265625, 3.624267578125, 3.76898193359375, 3.9136962890625, 4.05841064453125, 4.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 21.0, 19.0, 25.0, 40.0, 42.0, 84.0, 129.0, 192.0, 345.0, 1015.0, 1057.0, 395.0, 193.0, 140.0, 95.0, 57.0, 33.0, 32.0, 22.0, 18.0, 12.0, 16.0, 12.0, 10.0, 3.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.060546875, -1.991973876953125, -1.92340087890625, -1.854827880859375, -1.7862548828125, -1.717681884765625, -1.64910888671875, -1.580535888671875, -1.511962890625, -1.443389892578125, -1.37481689453125, -1.306243896484375, -1.2376708984375, -1.169097900390625, -1.10052490234375, -1.031951904296875, -0.96337890625, -0.894805908203125, -0.82623291015625, -0.757659912109375, -0.6890869140625, -0.620513916015625, -0.55194091796875, -0.483367919921875, -0.414794921875, -0.346221923828125, -0.27764892578125, -0.209075927734375, -0.1405029296875, -0.071929931640625, -0.00335693359375, 0.065216064453125, 0.1337890625, 0.202362060546875, 0.27093505859375, 0.339508056640625, 0.4080810546875, 0.476654052734375, 0.54522705078125, 0.613800048828125, 0.682373046875, 0.750946044921875, 0.81951904296875, 0.888092041015625, 0.9566650390625, 1.025238037109375, 1.09381103515625, 1.162384033203125, 1.23095703125, 1.299530029296875, 1.36810302734375, 1.436676025390625, 1.5052490234375, 1.573822021484375, 1.64239501953125, 1.710968017578125, 1.779541015625, 1.848114013671875, 1.91668701171875, 1.985260009765625, 2.0538330078125, 2.122406005859375, 2.19097900390625, 2.259552001953125, 2.328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 17.0, 50.0, 87.0, 164.0, 207.0, 212.0, 127.0, 62.0, 31.0, 20.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.24348258972168, -21.3341121673584, -20.424741744995117, -19.515371322631836, -18.606000900268555, -17.696630477905273, -16.787261962890625, -15.877890586853027, -14.968520164489746, -14.059149742126465, -13.149779319763184, -12.240409851074219, -11.331039428710938, -10.421669006347656, -9.512298583984375, -8.602928161621094, -7.6935577392578125, -6.784187316894531, -5.87481689453125, -4.965446949005127, -4.056076526641846, -3.1467061042785645, -2.2373361587524414, -1.3279657363891602, -0.4185953140258789, 0.4907749891281128, 1.4001452922821045, 2.3095154762268066, 3.218885898590088, 4.128256320953369, 5.037626266479492, 5.946996688842773, 6.856365203857422, 7.765735626220703, 8.675106048583984, 9.584476470947266, 10.493846893310547, 11.403217315673828, 12.312586784362793, 13.221957206726074, 14.131327629089355, 15.040698051452637, 15.950068473815918, 16.859437942504883, 17.768808364868164, 18.678178787231445, 19.587549209594727, 20.496919631958008, 21.40629005432129, 22.31566047668457, 23.22503089904785, 24.134401321411133, 25.043771743774414, 25.953142166137695, 26.862510681152344, 27.771881103515625, 28.681251525878906, 29.590621948242188, 30.49999237060547, 31.40936279296875, 32.31873321533203, 33.22810363769531, 34.137474060058594, 35.046844482421875, 35.956214904785156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 4.0, 8.0, 15.0, 11.0, 16.0, 19.0, 25.0, 29.0, 34.0, 30.0, 36.0, 44.0, 37.0, 46.0, 45.0, 51.0, 53.0, 36.0, 39.0, 44.0, 39.0, 46.0, 35.0, 31.0, 36.0, 31.0, 26.0, 22.0, 16.0, 28.0, 14.0, 7.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203773498535156, -8.894710540771484, -8.585647583007812, -8.27658462524414, -7.967521667480469, -7.658458709716797, -7.349395751953125, -7.040332794189453, -6.731269836425781, -6.422206878662109, -6.1131439208984375, -5.804080963134766, -5.495018005371094, -5.185955047607422, -4.87689208984375, -4.567829132080078, -4.258766174316406, -3.9497032165527344, -3.6406402587890625, -3.3315773010253906, -3.0225143432617188, -2.713451385498047, -2.404388427734375, -2.095325469970703, -1.7862625122070312, -1.4771995544433594, -1.1681365966796875, -0.8590736389160156, -0.5500106811523438, -0.24094772338867188, 0.068115234375, 0.3771781921386719, 0.6862411499023438, 0.9953041076660156, 1.3043670654296875, 1.6134300231933594, 1.9224929809570312, 2.231555938720703, 2.540618896484375, 2.849681854248047, 3.1587448120117188, 3.4678077697753906, 3.7768707275390625, 4.085933685302734, 4.394996643066406, 4.704059600830078, 5.01312255859375, 5.322185516357422, 5.631248474121094, 5.940311431884766, 6.2493743896484375, 6.558437347412109, 6.867500305175781, 7.176563262939453, 7.485626220703125, 7.794689178466797, 8.103752136230469, 8.41281509399414, 8.721878051757812, 9.030941009521484, 9.340003967285156, 9.649066925048828, 9.9581298828125, 10.267192840576172, 10.576255798339844]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 19.0, 15.0, 22.0, 28.0, 44.0, 95.0, 127.0, 274.0, 420.0, 778.0, 1505.0, 3078.0, 6518.0, 15613.0, 39708.0, 118723.0, 645624.0, 139889.0, 44807.0, 17224.0, 7245.0, 3201.0, 1594.0, 850.0, 515.0, 257.0, 129.0, 92.0, 57.0, 35.0, 21.0, 21.0, 5.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.41998291015625, -6.2227783203125, -6.02557373046875, -5.828369140625, -5.63116455078125, -5.4339599609375, -5.23675537109375, -5.03955078125, -4.84234619140625, -4.6451416015625, -4.44793701171875, -4.250732421875, -4.05352783203125, -3.8563232421875, -3.65911865234375, -3.4619140625, -3.26470947265625, -3.0675048828125, -2.87030029296875, -2.673095703125, -2.47589111328125, -2.2786865234375, -2.08148193359375, -1.88427734375, -1.68707275390625, -1.4898681640625, -1.29266357421875, -1.095458984375, -0.89825439453125, -0.7010498046875, -0.50384521484375, -0.306640625, -0.10943603515625, 0.0877685546875, 0.28497314453125, 0.482177734375, 0.67938232421875, 0.8765869140625, 1.07379150390625, 1.27099609375, 1.46820068359375, 1.6654052734375, 1.86260986328125, 2.059814453125, 2.25701904296875, 2.4542236328125, 2.65142822265625, 2.8486328125, 3.04583740234375, 3.2430419921875, 3.44024658203125, 3.637451171875, 3.83465576171875, 4.0318603515625, 4.22906494140625, 4.42626953125, 4.62347412109375, 4.8206787109375, 5.01788330078125, 5.215087890625, 5.41229248046875, 5.6094970703125, 5.80670166015625, 6.00390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 8.0, 10.0, 18.0, 19.0, 19.0, 18.0, 35.0, 30.0, 39.0, 46.0, 54.0, 58.0, 52.0, 46.0, 64.0, 61.0, 50.0, 63.0, 48.0, 40.0, 32.0, 28.0, 25.0, 23.0, 19.0, 20.0, 11.0, 7.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.861358642578125, -0.82720947265625, -0.793060302734375, -0.7589111328125, -0.724761962890625, -0.69061279296875, -0.656463623046875, -0.622314453125, -0.588165283203125, -0.55401611328125, -0.519866943359375, -0.4857177734375, -0.451568603515625, -0.41741943359375, -0.383270263671875, -0.34912109375, -0.314971923828125, -0.28082275390625, -0.246673583984375, -0.2125244140625, -0.178375244140625, -0.14422607421875, -0.110076904296875, -0.075927734375, -0.041778564453125, -0.00762939453125, 0.026519775390625, 0.0606689453125, 0.094818115234375, 0.12896728515625, 0.163116455078125, 0.197265625, 0.231414794921875, 0.26556396484375, 0.299713134765625, 0.3338623046875, 0.368011474609375, 0.40216064453125, 0.436309814453125, 0.470458984375, 0.504608154296875, 0.53875732421875, 0.572906494140625, 0.6070556640625, 0.641204833984375, 0.67535400390625, 0.709503173828125, 0.74365234375, 0.777801513671875, 0.81195068359375, 0.846099853515625, 0.8802490234375, 0.914398193359375, 0.94854736328125, 0.982696533203125, 1.016845703125, 1.050994873046875, 1.08514404296875, 1.119293212890625, 1.1534423828125, 1.187591552734375, 1.22174072265625, 1.255889892578125, 1.2900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 13.0, 14.0, 18.0, 22.0, 29.0, 44.0, 57.0, 96.0, 138.0, 237.0, 409.0, 737.0, 1600.0, 4537.0, 17995.0, 91339.0, 768581.0, 128274.0, 24610.0, 5853.0, 1879.0, 798.0, 454.0, 279.0, 158.0, 99.0, 73.0, 51.0, 38.0, 31.0, 20.0, 9.0, 6.0, 10.0, 7.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1875, -7.910888671875, -7.63427734375, -7.357666015625, -7.0810546875, -6.804443359375, -6.52783203125, -6.251220703125, -5.974609375, -5.697998046875, -5.42138671875, -5.144775390625, -4.8681640625, -4.591552734375, -4.31494140625, -4.038330078125, -3.76171875, -3.485107421875, -3.20849609375, -2.931884765625, -2.6552734375, -2.378662109375, -2.10205078125, -1.825439453125, -1.548828125, -1.272216796875, -0.99560546875, -0.718994140625, -0.4423828125, -0.165771484375, 0.11083984375, 0.387451171875, 0.6640625, 0.940673828125, 1.21728515625, 1.493896484375, 1.7705078125, 2.047119140625, 2.32373046875, 2.600341796875, 2.876953125, 3.153564453125, 3.43017578125, 3.706787109375, 3.9833984375, 4.260009765625, 4.53662109375, 4.813232421875, 5.08984375, 5.366455078125, 5.64306640625, 5.919677734375, 6.1962890625, 6.472900390625, 6.74951171875, 7.026123046875, 7.302734375, 7.579345703125, 7.85595703125, 8.132568359375, 8.4091796875, 8.685791015625, 8.96240234375, 9.239013671875, 9.515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 7.0, 12.0, 10.0, 27.0, 36.0, 36.0, 51.0, 43.0, 43.0, 61.0, 61.0, 64.0, 43.0, 68.0, 48.0, 53.0, 52.0, 49.0, 41.0, 39.0, 28.0, 32.0, 17.0, 13.0, 10.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.9375, -5.767333984375, -5.59716796875, -5.427001953125, -5.2568359375, -5.086669921875, -4.91650390625, -4.746337890625, -4.576171875, -4.406005859375, -4.23583984375, -4.065673828125, -3.8955078125, -3.725341796875, -3.55517578125, -3.385009765625, -3.21484375, -3.044677734375, -2.87451171875, -2.704345703125, -2.5341796875, -2.364013671875, -2.19384765625, -2.023681640625, -1.853515625, -1.683349609375, -1.51318359375, -1.343017578125, -1.1728515625, -1.002685546875, -0.83251953125, -0.662353515625, -0.4921875, -0.322021484375, -0.15185546875, 0.018310546875, 0.1884765625, 0.358642578125, 0.52880859375, 0.698974609375, 0.869140625, 1.039306640625, 1.20947265625, 1.379638671875, 1.5498046875, 1.719970703125, 1.89013671875, 2.060302734375, 2.23046875, 2.400634765625, 2.57080078125, 2.740966796875, 2.9111328125, 3.081298828125, 3.25146484375, 3.421630859375, 3.591796875, 3.761962890625, 3.93212890625, 4.102294921875, 4.2724609375, 4.442626953125, 4.61279296875, 4.782958984375, 4.953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 20.0, 29.0, 43.0, 58.0, 112.0, 172.0, 302.0, 540.0, 1160.0, 2275.0, 5742.0, 15629.0, 46922.0, 203773.0, 631187.0, 93405.0, 29439.0, 10284.0, 3848.0, 1717.0, 853.0, 411.0, 228.0, 121.0, 71.0, 68.0, 42.0, 28.0, 16.0, 9.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.3428955078125, -3.228759765625, -3.1146240234375, -3.00048828125, -2.8863525390625, -2.772216796875, -2.6580810546875, -2.5439453125, -2.4298095703125, -2.315673828125, -2.2015380859375, -2.08740234375, -1.9732666015625, -1.859130859375, -1.7449951171875, -1.630859375, -1.5167236328125, -1.402587890625, -1.2884521484375, -1.17431640625, -1.0601806640625, -0.946044921875, -0.8319091796875, -0.7177734375, -0.6036376953125, -0.489501953125, -0.3753662109375, -0.26123046875, -0.1470947265625, -0.032958984375, 0.0811767578125, 0.1953125, 0.3094482421875, 0.423583984375, 0.5377197265625, 0.65185546875, 0.7659912109375, 0.880126953125, 0.9942626953125, 1.1083984375, 1.2225341796875, 1.336669921875, 1.4508056640625, 1.56494140625, 1.6790771484375, 1.793212890625, 1.9073486328125, 2.021484375, 2.1356201171875, 2.249755859375, 2.3638916015625, 2.47802734375, 2.5921630859375, 2.706298828125, 2.8204345703125, 2.9345703125, 3.0487060546875, 3.162841796875, 3.2769775390625, 3.39111328125, 3.5052490234375, 3.619384765625, 3.7335205078125, 3.84765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 9.0, 3.0, 5.0, 13.0, 4.0, 10.0, 8.0, 14.0, 22.0, 22.0, 32.0, 51.0, 122.0, 326.0, 148.0, 55.0, 28.0, 36.0, 17.0, 10.0, 8.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010080337524414062, -0.0009760856628417969, -0.0009441375732421875, -0.0009121894836425781, -0.0008802413940429688, -0.0008482933044433594, -0.00081634521484375, -0.0007843971252441406, -0.0007524490356445312, -0.0007205009460449219, -0.0006885528564453125, -0.0006566047668457031, -0.0006246566772460938, -0.0005927085876464844, -0.000560760498046875, -0.0005288124084472656, -0.0004968643188476562, -0.0004649162292480469, -0.0004329681396484375, -0.0004010200500488281, -0.00036907196044921875, -0.0003371238708496094, -0.00030517578125, -0.0002732276916503906, -0.00024127960205078125, -0.00020933151245117188, -0.0001773834228515625, -0.00014543533325195312, -0.00011348724365234375, -8.153915405273438e-05, -4.9591064453125e-05, -1.7642974853515625e-05, 1.430511474609375e-05, 4.6253204345703125e-05, 7.82012939453125e-05, 0.00011014938354492188, 0.00014209747314453125, 0.00017404556274414062, 0.00020599365234375, 0.00023794174194335938, 0.00026988983154296875, 0.0003018379211425781, 0.0003337860107421875, 0.0003657341003417969, 0.00039768218994140625, 0.0004296302795410156, 0.000461578369140625, 0.0004935264587402344, 0.0005254745483398438, 0.0005574226379394531, 0.0005893707275390625, 0.0006213188171386719, 0.0006532669067382812, 0.0006852149963378906, 0.0007171630859375, 0.0007491111755371094, 0.0007810592651367188, 0.0008130073547363281, 0.0008449554443359375, 0.0008769035339355469, 0.0009088516235351562, 0.0009407997131347656, 0.000972747802734375, 0.0010046958923339844, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 9.0, 7.0, 19.0, 23.0, 34.0, 62.0, 105.0, 117.0, 264.0, 560.0, 1469.0, 5220.0, 31444.0, 350213.0, 606255.0, 43164.0, 6534.0, 1666.0, 649.0, 306.0, 163.0, 89.0, 56.0, 30.0, 21.0, 16.0, 10.0, 10.0, 5.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.34246826171875, -4.1693115234375, -3.99615478515625, -3.822998046875, -3.64984130859375, -3.4766845703125, -3.30352783203125, -3.13037109375, -2.95721435546875, -2.7840576171875, -2.61090087890625, -2.437744140625, -2.26458740234375, -2.0914306640625, -1.91827392578125, -1.7451171875, -1.57196044921875, -1.3988037109375, -1.22564697265625, -1.052490234375, -0.87933349609375, -0.7061767578125, -0.53302001953125, -0.35986328125, -0.18670654296875, -0.0135498046875, 0.15960693359375, 0.332763671875, 0.50592041015625, 0.6790771484375, 0.85223388671875, 1.025390625, 1.19854736328125, 1.3717041015625, 1.54486083984375, 1.718017578125, 1.89117431640625, 2.0643310546875, 2.23748779296875, 2.41064453125, 2.58380126953125, 2.7569580078125, 2.93011474609375, 3.103271484375, 3.27642822265625, 3.4495849609375, 3.62274169921875, 3.7958984375, 3.96905517578125, 4.1422119140625, 4.31536865234375, 4.488525390625, 4.66168212890625, 4.8348388671875, 5.00799560546875, 5.18115234375, 5.35430908203125, 5.5274658203125, 5.70062255859375, 5.873779296875, 6.04693603515625, 6.2200927734375, 6.39324951171875, 6.56640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 16.0, 3.0, 7.0, 8.0, 9.0, 20.0, 14.0, 28.0, 19.0, 26.0, 41.0, 65.0, 117.0, 134.0, 108.0, 102.0, 69.0, 29.0, 26.0, 22.0, 16.0, 13.0, 21.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.509735107421875, -2.43939208984375, -2.369049072265625, -2.2987060546875, -2.228363037109375, -2.15802001953125, -2.087677001953125, -2.017333984375, -1.946990966796875, -1.87664794921875, -1.806304931640625, -1.7359619140625, -1.665618896484375, -1.59527587890625, -1.524932861328125, -1.45458984375, -1.384246826171875, -1.31390380859375, -1.243560791015625, -1.1732177734375, -1.102874755859375, -1.03253173828125, -0.962188720703125, -0.891845703125, -0.821502685546875, -0.75115966796875, -0.680816650390625, -0.6104736328125, -0.540130615234375, -0.46978759765625, -0.399444580078125, -0.3291015625, -0.258758544921875, -0.18841552734375, -0.118072509765625, -0.0477294921875, 0.022613525390625, 0.09295654296875, 0.163299560546875, 0.233642578125, 0.303985595703125, 0.37432861328125, 0.444671630859375, 0.5150146484375, 0.585357666015625, 0.65570068359375, 0.726043701171875, 0.79638671875, 0.866729736328125, 0.93707275390625, 1.007415771484375, 1.0777587890625, 1.148101806640625, 1.21844482421875, 1.288787841796875, 1.359130859375, 1.429473876953125, 1.49981689453125, 1.570159912109375, 1.6405029296875, 1.710845947265625, 1.78118896484375, 1.851531982421875, 1.921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 13.0, 32.0, 78.0, 180.0, 246.0, 265.0, 107.0, 59.0, 13.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.47672653198242, -35.871986389160156, -33.26724624633789, -30.662508010864258, -28.057769775390625, -25.45302963256836, -22.848289489746094, -20.24355125427246, -17.638811111450195, -15.034071922302246, -12.429332733154297, -9.824592590332031, -7.219853401184082, -4.615114212036133, -2.010374069213867, 0.5943641662597656, 3.1991043090820312, 5.8038434982299805, 8.40858268737793, 11.013322830200195, 13.618062019348145, 16.222801208496094, 18.82754135131836, 21.432279586791992, 24.037019729614258, 26.641759872436523, 29.246498107910156, 31.851238250732422, 34.45597839355469, 37.06071472167969, 39.66545867919922, 42.27019500732422, 44.87493133544922, 47.479671478271484, 50.08441162109375, 52.68914794921875, 55.293888092041016, 57.89862823486328, 60.50336837768555, 63.10810852050781, 65.71284484863281, 68.31758117675781, 70.92232513427734, 73.52706146240234, 76.13180541992188, 78.73654174804688, 81.34127807617188, 83.9460220336914, 86.55076599121094, 89.15550231933594, 91.76024627685547, 94.36498260498047, 96.9697265625, 99.574462890625, 102.17919921875, 104.78394317626953, 107.38867950439453, 109.99341583251953, 112.59815979003906, 115.20289611816406, 117.8076400756836, 120.4123764038086, 123.01712036132812, 125.62185668945312, 128.22659301757812]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 10.0, 16.0, 11.0, 15.0, 13.0, 19.0, 34.0, 24.0, 28.0, 35.0, 34.0, 49.0, 39.0, 49.0, 49.0, 48.0, 46.0, 45.0, 45.0, 37.0, 41.0, 40.0, 34.0, 31.0, 36.0, 24.0, 18.0, 23.0, 20.0, 13.0, 9.0, 12.0, 9.0, 3.0, 7.0, 2.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.024023056030273, -23.28664779663086, -22.549270629882812, -21.8118953704834, -21.074520111083984, -20.337142944335938, -19.599767684936523, -18.86239242553711, -18.125015258789062, -17.38763999938965, -16.6502628326416, -15.912887573242188, -15.175512313842773, -14.438136100769043, -13.700759887695312, -12.963384628295898, -12.226009368896484, -11.488633155822754, -10.75125789642334, -10.01388168334961, -9.276506423950195, -8.539130210876465, -7.801753997802734, -7.064378261566162, -6.32700252532959, -5.589626789093018, -4.852251052856445, -4.114874839782715, -3.3774991035461426, -2.6401233673095703, -1.9027471542358398, -1.1653714179992676, -0.4279975891113281, 0.3093782663345337, 1.0467541217803955, 1.7841300964355469, 2.521505832672119, 3.2588815689086914, 3.996257781982422, 4.733633518218994, 5.471009254455566, 6.208384990692139, 6.945760726928711, 7.683136940002441, 8.420513153076172, 9.157888412475586, 9.895264625549316, 10.632640838623047, 11.370016098022461, 12.107392311096191, 12.844767570495605, 13.582143783569336, 14.31951904296875, 15.05689525604248, 15.794271469116211, 16.531646728515625, 17.269023895263672, 18.006399154663086, 18.743776321411133, 19.481151580810547, 20.21852684020996, 20.955902099609375, 21.693279266357422, 22.430654525756836, 23.16802978515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 11.0, 19.0, 24.0, 29.0, 48.0, 83.0, 153.0, 297.0, 553.0, 1172.0, 2470.0, 6197.0, 17621.0, 65191.0, 641809.0, 3320005.0, 100923.0, 24117.0, 7829.0, 3075.0, 1322.0, 621.0, 327.0, 131.0, 96.0, 59.0, 26.0, 20.0, 13.0, 5.0, 7.0, 9.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.78594970703125, -6.5679931640625, -6.35003662109375, -6.132080078125, -5.91412353515625, -5.6961669921875, -5.47821044921875, -5.26025390625, -5.04229736328125, -4.8243408203125, -4.60638427734375, -4.388427734375, -4.17047119140625, -3.9525146484375, -3.73455810546875, -3.5166015625, -3.29864501953125, -3.0806884765625, -2.86273193359375, -2.644775390625, -2.42681884765625, -2.2088623046875, -1.99090576171875, -1.77294921875, -1.55499267578125, -1.3370361328125, -1.11907958984375, -0.901123046875, -0.68316650390625, -0.4652099609375, -0.24725341796875, -0.029296875, 0.18865966796875, 0.4066162109375, 0.62457275390625, 0.842529296875, 1.06048583984375, 1.2784423828125, 1.49639892578125, 1.71435546875, 1.93231201171875, 2.1502685546875, 2.36822509765625, 2.586181640625, 2.80413818359375, 3.0220947265625, 3.24005126953125, 3.4580078125, 3.67596435546875, 3.8939208984375, 4.11187744140625, 4.329833984375, 4.54779052734375, 4.7657470703125, 4.98370361328125, 5.20166015625, 5.41961669921875, 5.6375732421875, 5.85552978515625, 6.073486328125, 6.29144287109375, 6.5093994140625, 6.72735595703125, 6.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 11.0, 10.0, 15.0, 15.0, 16.0, 24.0, 29.0, 38.0, 50.0, 44.0, 55.0, 52.0, 59.0, 57.0, 73.0, 66.0, 54.0, 58.0, 44.0, 40.0, 49.0, 28.0, 30.0, 15.0, 14.0, 12.0, 11.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2109375, -1.1689910888671875, -1.127044677734375, -1.0850982666015625, -1.04315185546875, -1.0012054443359375, -0.959259033203125, -0.9173126220703125, -0.8753662109375, -0.8334197998046875, -0.791473388671875, -0.7495269775390625, -0.70758056640625, -0.6656341552734375, -0.623687744140625, -0.5817413330078125, -0.539794921875, -0.4978485107421875, -0.455902099609375, -0.4139556884765625, -0.37200927734375, -0.3300628662109375, -0.288116455078125, -0.2461700439453125, -0.2042236328125, -0.1622772216796875, -0.120330810546875, -0.0783843994140625, -0.03643798828125, 0.0055084228515625, 0.047454833984375, 0.0894012451171875, 0.13134765625, 0.1732940673828125, 0.215240478515625, 0.2571868896484375, 0.29913330078125, 0.3410797119140625, 0.383026123046875, 0.4249725341796875, 0.4669189453125, 0.5088653564453125, 0.550811767578125, 0.5927581787109375, 0.63470458984375, 0.6766510009765625, 0.718597412109375, 0.7605438232421875, 0.802490234375, 0.8444366455078125, 0.886383056640625, 0.9283294677734375, 0.97027587890625, 1.0122222900390625, 1.054168701171875, 1.0961151123046875, 1.1380615234375, 1.1800079345703125, 1.221954345703125, 1.2639007568359375, 1.30584716796875, 1.3477935791015625, 1.389739990234375, 1.4316864013671875, 1.4736328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 9.0, 8.0, 12.0, 17.0, 30.0, 62.0, 102.0, 133.0, 229.0, 414.0, 706.0, 1221.0, 2433.0, 4868.0, 11026.0, 29162.0, 97115.0, 640439.0, 3141840.0, 186708.0, 47249.0, 16565.0, 6772.0, 3305.0, 1683.0, 883.0, 523.0, 311.0, 165.0, 119.0, 68.0, 39.0, 22.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69952392578125, -5.5279541015625, -5.35638427734375, -5.184814453125, -5.01324462890625, -4.8416748046875, -4.67010498046875, -4.49853515625, -4.32696533203125, -4.1553955078125, -3.98382568359375, -3.812255859375, -3.64068603515625, -3.4691162109375, -3.29754638671875, -3.1259765625, -2.95440673828125, -2.7828369140625, -2.61126708984375, -2.439697265625, -2.26812744140625, -2.0965576171875, -1.92498779296875, -1.75341796875, -1.58184814453125, -1.4102783203125, -1.23870849609375, -1.067138671875, -0.89556884765625, -0.7239990234375, -0.55242919921875, -0.380859375, -0.20928955078125, -0.0377197265625, 0.13385009765625, 0.305419921875, 0.47698974609375, 0.6485595703125, 0.82012939453125, 0.99169921875, 1.16326904296875, 1.3348388671875, 1.50640869140625, 1.677978515625, 1.84954833984375, 2.0211181640625, 2.19268798828125, 2.3642578125, 2.53582763671875, 2.7073974609375, 2.87896728515625, 3.050537109375, 3.22210693359375, 3.3936767578125, 3.56524658203125, 3.73681640625, 3.90838623046875, 4.0799560546875, 4.25152587890625, 4.423095703125, 4.59466552734375, 4.7662353515625, 4.93780517578125, 5.109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 18.0, 13.0, 23.0, 30.0, 50.0, 74.0, 108.0, 190.0, 395.0, 1640.0, 818.0, 277.0, 129.0, 66.0, 52.0, 44.0, 30.0, 24.0, 16.0, 11.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.554412841796875, -2.47406005859375, -2.393707275390625, -2.3133544921875, -2.233001708984375, -2.15264892578125, -2.072296142578125, -1.991943359375, -1.911590576171875, -1.83123779296875, -1.750885009765625, -1.6705322265625, -1.590179443359375, -1.50982666015625, -1.429473876953125, -1.34912109375, -1.268768310546875, -1.18841552734375, -1.108062744140625, -1.0277099609375, -0.947357177734375, -0.86700439453125, -0.786651611328125, -0.706298828125, -0.625946044921875, -0.54559326171875, -0.465240478515625, -0.3848876953125, -0.304534912109375, -0.22418212890625, -0.143829345703125, -0.0634765625, 0.016876220703125, 0.09722900390625, 0.177581787109375, 0.2579345703125, 0.338287353515625, 0.41864013671875, 0.498992919921875, 0.579345703125, 0.659698486328125, 0.74005126953125, 0.820404052734375, 0.9007568359375, 0.981109619140625, 1.06146240234375, 1.141815185546875, 1.22216796875, 1.302520751953125, 1.38287353515625, 1.463226318359375, 1.5435791015625, 1.623931884765625, 1.70428466796875, 1.784637451171875, 1.864990234375, 1.945343017578125, 2.02569580078125, 2.106048583984375, 2.1864013671875, 2.266754150390625, 2.34710693359375, 2.427459716796875, 2.5078125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 21.0, 37.0, 77.0, 168.0, 224.0, 190.0, 147.0, 79.0, 27.0, 12.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.649436950683594, -27.853559494018555, -27.057682037353516, -26.261804580688477, -25.465927124023438, -24.6700496673584, -23.87417221069336, -23.078292846679688, -22.28241729736328, -21.486539840698242, -20.690662384033203, -19.894784927368164, -19.098907470703125, -18.303030014038086, -17.507152557373047, -16.711273193359375, -15.915395736694336, -15.119518280029297, -14.323640823364258, -13.527763366699219, -12.73188591003418, -11.93600845336914, -11.140130043029785, -10.344252586364746, -9.548375129699707, -8.752497673034668, -7.956620216369629, -7.160742282867432, -6.364864826202393, -5.5689873695373535, -4.773109436035156, -3.977231979370117, -3.181354522705078, -2.385477066040039, -1.589599370956421, -0.7937216758728027, 0.002155780792236328, 0.7980332374572754, 1.5939111709594727, 2.3897886276245117, 3.185666084289551, 3.98154354095459, 4.777420997619629, 5.573298931121826, 6.369176387786865, 7.165053844451904, 7.960931777954102, 8.75680923461914, 9.55268669128418, 10.348564147949219, 11.144441604614258, 11.940319061279297, 12.736196517944336, 13.532073974609375, 14.32795238494873, 15.12382984161377, 15.919707298278809, 16.715585708618164, 17.511463165283203, 18.307340621948242, 19.10321807861328, 19.89909553527832, 20.69497299194336, 21.4908504486084, 22.286727905273438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 9.0, 7.0, 9.0, 19.0, 17.0, 27.0, 17.0, 19.0, 37.0, 38.0, 38.0, 40.0, 42.0, 42.0, 52.0, 47.0, 47.0, 48.0, 50.0, 42.0, 44.0, 50.0, 23.0, 36.0, 28.0, 32.0, 23.0, 22.0, 11.0, 14.0, 19.0, 10.0, 6.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.208544731140137, -7.939805507659912, -7.6710662841796875, -7.402327060699463, -7.133587837219238, -6.864849090576172, -6.596109867095947, -6.327370643615723, -6.058631420135498, -5.789892196655273, -5.521152973175049, -5.252413749694824, -4.983675003051758, -4.714935302734375, -4.446196556091309, -4.177457332611084, -3.9087181091308594, -3.6399788856506348, -3.37123966217041, -3.1025006771087646, -2.83376145362854, -2.5650222301483154, -2.29628324508667, -2.0275440216064453, -1.7588047981262207, -1.490065574645996, -1.221326470375061, -0.9525873064994812, -0.6838481426239014, -0.41510891914367676, -0.1463698148727417, 0.12236928939819336, 0.39110851287841797, 0.6598476767539978, 0.9285868406295776, 1.1973259449005127, 1.4660651683807373, 1.734804391860962, 2.0035433769226074, 2.272282600402832, 2.5410218238830566, 2.8097610473632812, 3.078500270843506, 3.3472392559051514, 3.615978479385376, 3.8847177028656006, 4.153456687927246, 4.422195911407471, 4.690935134887695, 4.95967435836792, 5.2284135818481445, 5.497152805328369, 5.765892028808594, 6.03463077545166, 6.303369998931885, 6.572109222412109, 6.840848445892334, 7.109587669372559, 7.378326892852783, 7.647066116333008, 7.915804862976074, 8.184544563293457, 8.453283309936523, 8.722023010253906, 8.990761756896973]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 12.0, 19.0, 24.0, 30.0, 43.0, 74.0, 110.0, 164.0, 253.0, 486.0, 920.0, 1778.0, 3610.0, 7745.0, 16602.0, 35793.0, 104619.0, 578180.0, 206443.0, 49669.0, 22057.0, 10158.0, 4779.0, 2368.0, 1118.0, 608.0, 338.0, 193.0, 115.0, 89.0, 49.0, 28.0, 20.0, 15.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.468475341796875, -3.33343505859375, -3.198394775390625, -3.0633544921875, -2.928314208984375, -2.79327392578125, -2.658233642578125, -2.523193359375, -2.388153076171875, -2.25311279296875, -2.118072509765625, -1.9830322265625, -1.847991943359375, -1.71295166015625, -1.577911376953125, -1.44287109375, -1.307830810546875, -1.17279052734375, -1.037750244140625, -0.9027099609375, -0.767669677734375, -0.63262939453125, -0.497589111328125, -0.362548828125, -0.227508544921875, -0.09246826171875, 0.042572021484375, 0.1776123046875, 0.312652587890625, 0.44769287109375, 0.582733154296875, 0.7177734375, 0.852813720703125, 0.98785400390625, 1.122894287109375, 1.2579345703125, 1.392974853515625, 1.52801513671875, 1.663055419921875, 1.798095703125, 1.933135986328125, 2.06817626953125, 2.203216552734375, 2.3382568359375, 2.473297119140625, 2.60833740234375, 2.743377685546875, 2.87841796875, 3.013458251953125, 3.14849853515625, 3.283538818359375, 3.4185791015625, 3.553619384765625, 3.68865966796875, 3.823699951171875, 3.958740234375, 4.093780517578125, 4.22882080078125, 4.363861083984375, 4.4989013671875, 4.633941650390625, 4.76898193359375, 4.904022216796875, 5.0390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 8.0, 13.0, 14.0, 17.0, 15.0, 25.0, 24.0, 36.0, 40.0, 36.0, 39.0, 55.0, 43.0, 51.0, 66.0, 70.0, 53.0, 49.0, 43.0, 53.0, 45.0, 41.0, 39.0, 16.0, 28.0, 13.0, 21.0, 12.0, 1.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1874542236328125, -1.147369384765625, -1.1072845458984375, -1.06719970703125, -1.0271148681640625, -0.987030029296875, -0.9469451904296875, -0.9068603515625, -0.8667755126953125, -0.826690673828125, -0.7866058349609375, -0.74652099609375, -0.7064361572265625, -0.666351318359375, -0.6262664794921875, -0.586181640625, -0.5460968017578125, -0.506011962890625, -0.4659271240234375, -0.42584228515625, -0.3857574462890625, -0.345672607421875, -0.3055877685546875, -0.2655029296875, -0.2254180908203125, -0.185333251953125, -0.1452484130859375, -0.10516357421875, -0.0650787353515625, -0.024993896484375, 0.0150909423828125, 0.05517578125, 0.0952606201171875, 0.135345458984375, 0.1754302978515625, 0.21551513671875, 0.2555999755859375, 0.295684814453125, 0.3357696533203125, 0.3758544921875, 0.4159393310546875, 0.456024169921875, 0.4961090087890625, 0.53619384765625, 0.5762786865234375, 0.616363525390625, 0.6564483642578125, 0.696533203125, 0.7366180419921875, 0.776702880859375, 0.8167877197265625, 0.85687255859375, 0.8969573974609375, 0.937042236328125, 0.9771270751953125, 1.0172119140625, 1.0572967529296875, 1.097381591796875, 1.1374664306640625, 1.17755126953125, 1.2176361083984375, 1.257720947265625, 1.2978057861328125, 1.337890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 7.0, 14.0, 20.0, 14.0, 23.0, 40.0, 43.0, 88.0, 107.0, 209.0, 371.0, 791.0, 1934.0, 5495.0, 17180.0, 57144.0, 687099.0, 222431.0, 37457.0, 11539.0, 3769.0, 1426.0, 612.0, 287.0, 162.0, 94.0, 56.0, 44.0, 29.0, 11.0, 18.0, 13.0, 7.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.98828125, -7.7713623046875, -7.554443359375, -7.3375244140625, -7.12060546875, -6.9036865234375, -6.686767578125, -6.4698486328125, -6.2529296875, -6.0360107421875, -5.819091796875, -5.6021728515625, -5.38525390625, -5.1683349609375, -4.951416015625, -4.7344970703125, -4.517578125, -4.3006591796875, -4.083740234375, -3.8668212890625, -3.64990234375, -3.4329833984375, -3.216064453125, -2.9991455078125, -2.7822265625, -2.5653076171875, -2.348388671875, -2.1314697265625, -1.91455078125, -1.6976318359375, -1.480712890625, -1.2637939453125, -1.046875, -0.8299560546875, -0.613037109375, -0.3961181640625, -0.17919921875, 0.0377197265625, 0.254638671875, 0.4715576171875, 0.6884765625, 0.9053955078125, 1.122314453125, 1.3392333984375, 1.55615234375, 1.7730712890625, 1.989990234375, 2.2069091796875, 2.423828125, 2.6407470703125, 2.857666015625, 3.0745849609375, 3.29150390625, 3.5084228515625, 3.725341796875, 3.9422607421875, 4.1591796875, 4.3760986328125, 4.593017578125, 4.8099365234375, 5.02685546875, 5.2437744140625, 5.460693359375, 5.6776123046875, 5.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 11.0, 8.0, 14.0, 17.0, 22.0, 35.0, 36.0, 59.0, 66.0, 79.0, 84.0, 79.0, 82.0, 66.0, 62.0, 62.0, 38.0, 41.0, 42.0, 21.0, 13.0, 9.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3671875, -9.12725830078125, -8.8873291015625, -8.64739990234375, -8.407470703125, -8.16754150390625, -7.9276123046875, -7.68768310546875, -7.44775390625, -7.20782470703125, -6.9678955078125, -6.72796630859375, -6.488037109375, -6.24810791015625, -6.0081787109375, -5.76824951171875, -5.5283203125, -5.28839111328125, -5.0484619140625, -4.80853271484375, -4.568603515625, -4.32867431640625, -4.0887451171875, -3.84881591796875, -3.60888671875, -3.36895751953125, -3.1290283203125, -2.88909912109375, -2.649169921875, -2.40924072265625, -2.1693115234375, -1.92938232421875, -1.689453125, -1.44952392578125, -1.2095947265625, -0.96966552734375, -0.729736328125, -0.48980712890625, -0.2498779296875, -0.00994873046875, 0.22998046875, 0.46990966796875, 0.7098388671875, 0.94976806640625, 1.189697265625, 1.42962646484375, 1.6695556640625, 1.90948486328125, 2.1494140625, 2.38934326171875, 2.6292724609375, 2.86920166015625, 3.109130859375, 3.34906005859375, 3.5889892578125, 3.82891845703125, 4.06884765625, 4.30877685546875, 4.5487060546875, 4.78863525390625, 5.028564453125, 5.26849365234375, 5.5084228515625, 5.74835205078125, 5.98828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 8.0, 26.0, 20.0, 29.0, 45.0, 81.0, 101.0, 176.0, 255.0, 446.0, 741.0, 1320.0, 2444.0, 4942.0, 10548.0, 24764.0, 65081.0, 410216.0, 415830.0, 65408.0, 24772.0, 10598.0, 4838.0, 2552.0, 1311.0, 794.0, 415.0, 293.0, 157.0, 124.0, 66.0, 41.0, 34.0, 18.0, 20.0, 12.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.583984375, -2.510162353515625, -2.43634033203125, -2.362518310546875, -2.2886962890625, -2.214874267578125, -2.14105224609375, -2.067230224609375, -1.993408203125, -1.919586181640625, -1.84576416015625, -1.771942138671875, -1.6981201171875, -1.624298095703125, -1.55047607421875, -1.476654052734375, -1.40283203125, -1.329010009765625, -1.25518798828125, -1.181365966796875, -1.1075439453125, -1.033721923828125, -0.95989990234375, -0.886077880859375, -0.812255859375, -0.738433837890625, -0.66461181640625, -0.590789794921875, -0.5169677734375, -0.443145751953125, -0.36932373046875, -0.295501708984375, -0.2216796875, -0.147857666015625, -0.07403564453125, -0.000213623046875, 0.0736083984375, 0.147430419921875, 0.22125244140625, 0.295074462890625, 0.368896484375, 0.442718505859375, 0.51654052734375, 0.590362548828125, 0.6641845703125, 0.738006591796875, 0.81182861328125, 0.885650634765625, 0.95947265625, 1.033294677734375, 1.10711669921875, 1.180938720703125, 1.2547607421875, 1.328582763671875, 1.40240478515625, 1.476226806640625, 1.550048828125, 1.623870849609375, 1.69769287109375, 1.771514892578125, 1.8453369140625, 1.919158935546875, 1.99298095703125, 2.066802978515625, 2.140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 7.0, 6.0, 13.0, 18.0, 14.0, 23.0, 46.0, 178.0, 383.0, 132.0, 39.0, 29.0, 23.0, 16.0, 19.0, 8.0, 5.0, 7.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008817464113235474, -0.000852733850479126, -0.0008237212896347046, -0.0007947087287902832, -0.0007656961679458618, -0.0007366836071014404, -0.000707671046257019, -0.0006786584854125977, -0.0006496459245681763, -0.0006206333637237549, -0.0005916208028793335, -0.0005626082420349121, -0.0005335956811904907, -0.0005045831203460693, -0.00047557055950164795, -0.00044655799865722656, -0.0004175454378128052, -0.0003885328769683838, -0.0003595203161239624, -0.000330507755279541, -0.00030149519443511963, -0.00027248263359069824, -0.00024347007274627686, -0.00021445751190185547, -0.00018544495105743408, -0.0001564323902130127, -0.0001274198293685913, -9.840726852416992e-05, -6.939470767974854e-05, -4.038214683532715e-05, -1.1369585990905762e-05, 1.7642974853515625e-05, 4.665553569793701e-05, 7.56680965423584e-05, 0.00010468065738677979, 0.00013369321823120117, 0.00016270577907562256, 0.00019171833992004395, 0.00022073090076446533, 0.0002497434616088867, 0.0002787560224533081, 0.0003077685832977295, 0.0003367811441421509, 0.00036579370498657227, 0.00039480626583099365, 0.00042381882667541504, 0.0004528313875198364, 0.0004818439483642578, 0.0005108565092086792, 0.0005398690700531006, 0.000568881630897522, 0.0005978941917419434, 0.0006269067525863647, 0.0006559193134307861, 0.0006849318742752075, 0.0007139444351196289, 0.0007429569959640503, 0.0007719695568084717, 0.0008009821176528931, 0.0008299946784973145, 0.0008590072393417358, 0.0008880198001861572, 0.0009170323610305786, 0.000946044921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 13.0, 16.0, 33.0, 39.0, 67.0, 101.0, 174.0, 269.0, 550.0, 1517.0, 4774.0, 20925.0, 121947.0, 794208.0, 81838.0, 15820.0, 3859.0, 1226.0, 505.0, 248.0, 146.0, 105.0, 53.0, 35.0, 20.0, 24.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.56640625, -4.43743896484375, -4.3084716796875, -4.17950439453125, -4.050537109375, -3.92156982421875, -3.7926025390625, -3.66363525390625, -3.53466796875, -3.40570068359375, -3.2767333984375, -3.14776611328125, -3.018798828125, -2.88983154296875, -2.7608642578125, -2.63189697265625, -2.5029296875, -2.37396240234375, -2.2449951171875, -2.11602783203125, -1.987060546875, -1.85809326171875, -1.7291259765625, -1.60015869140625, -1.47119140625, -1.34222412109375, -1.2132568359375, -1.08428955078125, -0.955322265625, -0.82635498046875, -0.6973876953125, -0.56842041015625, -0.439453125, -0.31048583984375, -0.1815185546875, -0.05255126953125, 0.076416015625, 0.20538330078125, 0.3343505859375, 0.46331787109375, 0.59228515625, 0.72125244140625, 0.8502197265625, 0.97918701171875, 1.108154296875, 1.23712158203125, 1.3660888671875, 1.49505615234375, 1.6240234375, 1.75299072265625, 1.8819580078125, 2.01092529296875, 2.139892578125, 2.26885986328125, 2.3978271484375, 2.52679443359375, 2.65576171875, 2.78472900390625, 2.9136962890625, 3.04266357421875, 3.171630859375, 3.30059814453125, 3.4295654296875, 3.55853271484375, 3.6875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 4.0, 10.0, 14.0, 13.0, 20.0, 12.0, 24.0, 33.0, 57.0, 118.0, 145.0, 165.0, 125.0, 51.0, 32.0, 33.0, 23.0, 20.0, 15.0, 14.0, 7.0, 12.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09375, -2.019378662109375, -1.94500732421875, -1.870635986328125, -1.7962646484375, -1.721893310546875, -1.64752197265625, -1.573150634765625, -1.498779296875, -1.424407958984375, -1.35003662109375, -1.275665283203125, -1.2012939453125, -1.126922607421875, -1.05255126953125, -0.978179931640625, -0.90380859375, -0.829437255859375, -0.75506591796875, -0.680694580078125, -0.6063232421875, -0.531951904296875, -0.45758056640625, -0.383209228515625, -0.308837890625, -0.234466552734375, -0.16009521484375, -0.085723876953125, -0.0113525390625, 0.063018798828125, 0.13739013671875, 0.211761474609375, 0.2861328125, 0.360504150390625, 0.43487548828125, 0.509246826171875, 0.5836181640625, 0.657989501953125, 0.73236083984375, 0.806732177734375, 0.881103515625, 0.955474853515625, 1.02984619140625, 1.104217529296875, 1.1785888671875, 1.252960205078125, 1.32733154296875, 1.401702880859375, 1.47607421875, 1.550445556640625, 1.62481689453125, 1.699188232421875, 1.7735595703125, 1.847930908203125, 1.92230224609375, 1.996673583984375, 2.071044921875, 2.145416259765625, 2.21978759765625, 2.294158935546875, 2.3685302734375, 2.442901611328125, 2.51727294921875, 2.591644287109375, 2.666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 28.0, 25.0, 53.0, 62.0, 82.0, 88.0, 115.0, 102.0, 101.0, 82.0, 69.0, 42.0, 36.0, 22.0, 23.0, 16.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.986961364746094, -31.047964096069336, -30.108964920043945, -29.169967651367188, -28.23097038269043, -27.291973114013672, -26.35297393798828, -25.413976669311523, -24.474979400634766, -23.535982131958008, -22.596982955932617, -21.65798568725586, -20.7189884185791, -19.779991149902344, -18.840991973876953, -17.901994705200195, -16.962995529174805, -16.023998260498047, -15.085000038146973, -14.146001815795898, -13.20700454711914, -12.268006324768066, -11.329008102416992, -10.390010833740234, -9.45101261138916, -8.512014389038086, -7.573017120361328, -6.634018898010254, -5.695021152496338, -4.756023406982422, -3.8170251846313477, -2.8780274391174316, -1.9390277862548828, -1.0000299215316772, -0.06103205680847168, 0.8779659271240234, 1.8169636726379395, 2.7559614181518555, 3.6949596405029297, 4.633957386016846, 5.572955131530762, 6.511952877044678, 7.450950622558594, 8.389948844909668, 9.328947067260742, 10.2679443359375, 11.206942558288574, 12.145940780639648, 13.084938049316406, 14.02393627166748, 14.962933540344238, 15.901931762695312, 16.84092903137207, 17.779926300048828, 18.71892547607422, 19.657922744750977, 20.596920013427734, 21.535917282104492, 22.474916458129883, 23.41391372680664, 24.3529109954834, 25.291908264160156, 26.230907440185547, 27.169904708862305, 28.108903884887695]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 5.0, 10.0, 4.0, 13.0, 14.0, 15.0, 22.0, 15.0, 17.0, 28.0, 28.0, 31.0, 34.0, 35.0, 37.0, 44.0, 54.0, 50.0, 48.0, 42.0, 39.0, 40.0, 45.0, 40.0, 32.0, 42.0, 25.0, 31.0, 21.0, 19.0, 15.0, 19.0, 16.0, 12.0, 7.0, 14.0, 3.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-24.45825958251953, -23.762027740478516, -23.0657958984375, -22.369564056396484, -21.67333221435547, -20.977100372314453, -20.280868530273438, -19.584636688232422, -18.888404846191406, -18.19217300415039, -17.495941162109375, -16.79970932006836, -16.103477478027344, -15.407245635986328, -14.711012840270996, -14.01478099822998, -13.318548202514648, -12.622316360473633, -11.926084518432617, -11.229852676391602, -10.533620834350586, -9.83738899230957, -9.141156196594238, -8.444924354553223, -7.748692512512207, -7.052460670471191, -6.356228828430176, -5.659996509552002, -4.963764667510986, -4.267532825469971, -3.571300506591797, -2.8750686645507812, -2.178834915161133, -1.4826029539108276, -0.7863709926605225, -0.09013891220092773, 0.6060929298400879, 1.3023247718811035, 1.9985570907592773, 2.694788932800293, 3.3910207748413086, 4.087252616882324, 4.78348445892334, 5.479716777801514, 6.175948619842529, 6.872180461883545, 7.568412780761719, 8.264644622802734, 8.96087646484375, 9.657108306884766, 10.353340148925781, 11.049571990966797, 11.745803833007812, 12.442035675048828, 13.13826847076416, 13.834500312805176, 14.530732154846191, 15.226963996887207, 15.923195838928223, 16.619428634643555, 17.31566047668457, 18.011892318725586, 18.7081241607666, 19.404356002807617, 20.100587844848633]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 17.0, 35.0, 38.0, 68.0, 108.0, 216.0, 456.0, 991.0, 2372.0, 6111.0, 17300.0, 68537.0, 1583259.0, 2416290.0, 70520.0, 17752.0, 6003.0, 2298.0, 978.0, 440.0, 216.0, 109.0, 59.0, 28.0, 18.0, 7.0, 15.0, 8.0, 4.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75, -7.4732666015625, -7.196533203125, -6.9197998046875, -6.64306640625, -6.3663330078125, -6.089599609375, -5.8128662109375, -5.5361328125, -5.2593994140625, -4.982666015625, -4.7059326171875, -4.42919921875, -4.1524658203125, -3.875732421875, -3.5989990234375, -3.322265625, -3.0455322265625, -2.768798828125, -2.4920654296875, -2.21533203125, -1.9385986328125, -1.661865234375, -1.3851318359375, -1.1083984375, -0.8316650390625, -0.554931640625, -0.2781982421875, -0.00146484375, 0.2752685546875, 0.552001953125, 0.8287353515625, 1.10546875, 1.3822021484375, 1.658935546875, 1.9356689453125, 2.21240234375, 2.4891357421875, 2.765869140625, 3.0426025390625, 3.3193359375, 3.5960693359375, 3.872802734375, 4.1495361328125, 4.42626953125, 4.7030029296875, 4.979736328125, 5.2564697265625, 5.533203125, 5.8099365234375, 6.086669921875, 6.3634033203125, 6.64013671875, 6.9168701171875, 7.193603515625, 7.4703369140625, 7.7470703125, 8.0238037109375, 8.300537109375, 8.5772705078125, 8.85400390625, 9.1307373046875, 9.407470703125, 9.6842041015625, 9.9609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 12.0, 11.0, 14.0, 16.0, 14.0, 15.0, 28.0, 18.0, 32.0, 36.0, 47.0, 30.0, 35.0, 62.0, 59.0, 54.0, 59.0, 67.0, 46.0, 48.0, 47.0, 40.0, 33.0, 38.0, 33.0, 36.0, 10.0, 18.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2179718017578125, -1.177154541015625, -1.1363372802734375, -1.09552001953125, -1.0547027587890625, -1.013885498046875, -0.9730682373046875, -0.9322509765625, -0.8914337158203125, -0.850616455078125, -0.8097991943359375, -0.76898193359375, -0.7281646728515625, -0.687347412109375, -0.6465301513671875, -0.605712890625, -0.5648956298828125, -0.524078369140625, -0.4832611083984375, -0.44244384765625, -0.4016265869140625, -0.360809326171875, -0.3199920654296875, -0.2791748046875, -0.2383575439453125, -0.197540283203125, -0.1567230224609375, -0.11590576171875, -0.0750885009765625, -0.034271240234375, 0.0065460205078125, 0.04736328125, 0.0881805419921875, 0.128997802734375, 0.1698150634765625, 0.21063232421875, 0.2514495849609375, 0.292266845703125, 0.3330841064453125, 0.3739013671875, 0.4147186279296875, 0.455535888671875, 0.4963531494140625, 0.53717041015625, 0.5779876708984375, 0.618804931640625, 0.6596221923828125, 0.700439453125, 0.7412567138671875, 0.782073974609375, 0.8228912353515625, 0.86370849609375, 0.9045257568359375, 0.945343017578125, 0.9861602783203125, 1.0269775390625, 1.0677947998046875, 1.108612060546875, 1.1494293212890625, 1.19024658203125, 1.2310638427734375, 1.271881103515625, 1.3126983642578125, 1.353515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 13.0, 11.0, 20.0, 33.0, 50.0, 80.0, 70.0, 127.0, 171.0, 222.0, 297.0, 497.0, 815.0, 1381.0, 2636.0, 5352.0, 12195.0, 30264.0, 97024.0, 718487.0, 3109359.0, 144639.0, 40798.0, 15409.0, 6567.0, 3247.0, 1675.0, 936.0, 565.0, 388.0, 274.0, 173.0, 132.0, 93.0, 63.0, 56.0, 39.0, 35.0, 23.0, 16.0, 14.0, 13.0, 9.0, 7.0, 1.0, 3.0], "bins": [-8.140625, -7.92718505859375, -7.7137451171875, -7.50030517578125, -7.286865234375, -7.07342529296875, -6.8599853515625, -6.64654541015625, -6.43310546875, -6.21966552734375, -6.0062255859375, -5.79278564453125, -5.579345703125, -5.36590576171875, -5.1524658203125, -4.93902587890625, -4.7255859375, -4.51214599609375, -4.2987060546875, -4.08526611328125, -3.871826171875, -3.65838623046875, -3.4449462890625, -3.23150634765625, -3.01806640625, -2.80462646484375, -2.5911865234375, -2.37774658203125, -2.164306640625, -1.95086669921875, -1.7374267578125, -1.52398681640625, -1.310546875, -1.09710693359375, -0.8836669921875, -0.67022705078125, -0.456787109375, -0.24334716796875, -0.0299072265625, 0.18353271484375, 0.39697265625, 0.61041259765625, 0.8238525390625, 1.03729248046875, 1.250732421875, 1.46417236328125, 1.6776123046875, 1.89105224609375, 2.1044921875, 2.31793212890625, 2.5313720703125, 2.74481201171875, 2.958251953125, 3.17169189453125, 3.3851318359375, 3.59857177734375, 3.81201171875, 4.02545166015625, 4.2388916015625, 4.45233154296875, 4.665771484375, 4.87921142578125, 5.0926513671875, 5.30609130859375, 5.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 12.0, 12.0, 16.0, 24.0, 30.0, 46.0, 65.0, 148.0, 290.0, 1484.0, 1301.0, 275.0, 109.0, 78.0, 41.0, 47.0, 17.0, 13.0, 14.0, 11.0, 4.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57421875, -2.4622802734375, -2.350341796875, -2.2384033203125, -2.12646484375, -2.0145263671875, -1.902587890625, -1.7906494140625, -1.6787109375, -1.5667724609375, -1.454833984375, -1.3428955078125, -1.23095703125, -1.1190185546875, -1.007080078125, -0.8951416015625, -0.783203125, -0.6712646484375, -0.559326171875, -0.4473876953125, -0.33544921875, -0.2235107421875, -0.111572265625, 0.0003662109375, 0.1123046875, 0.2242431640625, 0.336181640625, 0.4481201171875, 0.56005859375, 0.6719970703125, 0.783935546875, 0.8958740234375, 1.0078125, 1.1197509765625, 1.231689453125, 1.3436279296875, 1.45556640625, 1.5675048828125, 1.679443359375, 1.7913818359375, 1.9033203125, 2.0152587890625, 2.127197265625, 2.2391357421875, 2.35107421875, 2.4630126953125, 2.574951171875, 2.6868896484375, 2.798828125, 2.9107666015625, 3.022705078125, 3.1346435546875, 3.24658203125, 3.3585205078125, 3.470458984375, 3.5823974609375, 3.6943359375, 3.8062744140625, 3.918212890625, 4.0301513671875, 4.14208984375, 4.2540283203125, 4.365966796875, 4.4779052734375, 4.58984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 33.0, 53.0, 72.0, 132.0, 157.0, 151.0, 128.0, 91.0, 52.0, 36.0, 23.0, 10.0, 11.0, 10.0, 1.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.313812255859375, -15.635957717895508, -14.958102226257324, -14.280247688293457, -13.602392196655273, -12.924537658691406, -12.246683120727539, -11.568827629089355, -10.890972137451172, -10.213117599487305, -9.535262107849121, -8.857407569885254, -8.17955207824707, -7.501697540283203, -6.823842525482178, -6.145987510681152, -5.468132972717285, -4.79027795791626, -4.112422943115234, -3.434568166732788, -2.7567131519317627, -2.0788581371307373, -1.401003360748291, -0.7231483459472656, -0.045293331146240234, 0.6325616240501404, 1.310416579246521, 1.9882714748382568, 2.6661264896392822, 3.3439815044403076, 4.021836280822754, 4.699691295623779, 5.377546310424805, 6.05540132522583, 6.7332563400268555, 7.411110877990723, 8.088966369628906, 8.766820907592773, 9.44467544555664, 10.122530937194824, 10.800386428833008, 11.478240966796875, 12.156096458435059, 12.833950996398926, 13.51180648803711, 14.189661026000977, 14.867515563964844, 15.545371055603027, 16.223224639892578, 16.901079177856445, 17.578933715820312, 18.256790161132812, 18.93464469909668, 19.612499237060547, 20.290353775024414, 20.96820831298828, 21.64606475830078, 22.32391929626465, 23.001773834228516, 23.679630279541016, 24.357484817504883, 25.03533935546875, 25.713193893432617, 26.391048431396484, 27.068904876708984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 9.0, 8.0, 9.0, 10.0, 11.0, 17.0, 20.0, 27.0, 22.0, 23.0, 40.0, 43.0, 48.0, 41.0, 46.0, 57.0, 42.0, 44.0, 70.0, 55.0, 47.0, 48.0, 49.0, 34.0, 30.0, 35.0, 21.0, 23.0, 18.0, 14.0, 12.0, 7.0, 4.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.803576469421387, -10.422284126281738, -10.04099178314209, -9.659699440002441, -9.278407096862793, -8.897113800048828, -8.51582145690918, -8.134529113769531, -7.753236770629883, -7.371944427490234, -6.990652084350586, -6.6093597412109375, -6.228066921234131, -5.846774578094482, -5.465482234954834, -5.084189414978027, -4.702897548675537, -4.321605205535889, -3.940312623977661, -3.5590202808380127, -3.177727699279785, -2.7964353561401367, -2.4151430130004883, -2.0338504314422607, -1.6525580883026123, -1.2712656259536743, -0.8899732232093811, -0.5086808204650879, -0.1273883581161499, 0.2539041042327881, 0.6351964473724365, 1.016489028930664, 1.3977813720703125, 1.7790738344192505, 2.1603662967681885, 2.541658639907837, 2.9229512214660645, 3.304243564605713, 3.6855359077453613, 4.066828727722168, 4.448121070861816, 4.829413414001465, 5.210705757141113, 5.591998100280762, 5.973290920257568, 6.354583263397217, 6.735875606536865, 7.117168426513672, 7.498460292816162, 7.8797526359558105, 8.261045455932617, 8.642337799072266, 9.023630142211914, 9.404922485351562, 9.786214828491211, 10.16750717163086, 10.548799514770508, 10.930091857910156, 11.311384201049805, 11.692676544189453, 12.073968887329102, 12.45526123046875, 12.836553573608398, 13.217846870422363, 13.599139213562012]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 17.0, 19.0, 34.0, 40.0, 72.0, 85.0, 136.0, 185.0, 334.0, 527.0, 922.0, 1864.0, 3714.0, 8368.0, 19525.0, 46241.0, 116123.0, 355675.0, 316337.0, 103347.0, 42112.0, 17620.0, 7794.0, 3513.0, 1657.0, 875.0, 507.0, 281.0, 197.0, 112.0, 66.0, 70.0, 50.0, 33.0, 28.0, 19.0, 12.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-5.08203125, -4.93231201171875, -4.7825927734375, -4.63287353515625, -4.483154296875, -4.33343505859375, -4.1837158203125, -4.03399658203125, -3.88427734375, -3.73455810546875, -3.5848388671875, -3.43511962890625, -3.285400390625, -3.13568115234375, -2.9859619140625, -2.83624267578125, -2.6865234375, -2.53680419921875, -2.3870849609375, -2.23736572265625, -2.087646484375, -1.93792724609375, -1.7882080078125, -1.63848876953125, -1.48876953125, -1.33905029296875, -1.1893310546875, -1.03961181640625, -0.889892578125, -0.74017333984375, -0.5904541015625, -0.44073486328125, -0.291015625, -0.14129638671875, 0.0084228515625, 0.15814208984375, 0.307861328125, 0.45758056640625, 0.6072998046875, 0.75701904296875, 0.90673828125, 1.05645751953125, 1.2061767578125, 1.35589599609375, 1.505615234375, 1.65533447265625, 1.8050537109375, 1.95477294921875, 2.1044921875, 2.25421142578125, 2.4039306640625, 2.55364990234375, 2.703369140625, 2.85308837890625, 3.0028076171875, 3.15252685546875, 3.30224609375, 3.45196533203125, 3.6016845703125, 3.75140380859375, 3.901123046875, 4.05084228515625, 4.2005615234375, 4.35028076171875, 4.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 18.0, 14.0, 17.0, 17.0, 17.0, 28.0, 34.0, 36.0, 35.0, 40.0, 51.0, 45.0, 60.0, 64.0, 55.0, 50.0, 63.0, 41.0, 40.0, 37.0, 39.0, 32.0, 29.0, 27.0, 20.0, 17.0, 24.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3803253173828125, -1.335845947265625, -1.2913665771484375, -1.24688720703125, -1.2024078369140625, -1.157928466796875, -1.1134490966796875, -1.0689697265625, -1.0244903564453125, -0.980010986328125, -0.9355316162109375, -0.89105224609375, -0.8465728759765625, -0.802093505859375, -0.7576141357421875, -0.713134765625, -0.6686553955078125, -0.624176025390625, -0.5796966552734375, -0.53521728515625, -0.4907379150390625, -0.446258544921875, -0.4017791748046875, -0.3572998046875, -0.3128204345703125, -0.268341064453125, -0.2238616943359375, -0.17938232421875, -0.1349029541015625, -0.090423583984375, -0.0459442138671875, -0.00146484375, 0.0430145263671875, 0.087493896484375, 0.1319732666015625, 0.17645263671875, 0.2209320068359375, 0.265411376953125, 0.3098907470703125, 0.3543701171875, 0.3988494873046875, 0.443328857421875, 0.4878082275390625, 0.53228759765625, 0.5767669677734375, 0.621246337890625, 0.6657257080078125, 0.710205078125, 0.7546844482421875, 0.799163818359375, 0.8436431884765625, 0.88812255859375, 0.9326019287109375, 0.977081298828125, 1.0215606689453125, 1.0660400390625, 1.1105194091796875, 1.154998779296875, 1.1994781494140625, 1.24395751953125, 1.2884368896484375, 1.332916259765625, 1.3773956298828125, 1.421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 14.0, 25.0, 51.0, 57.0, 77.0, 170.0, 256.0, 412.0, 764.0, 1855.0, 6301.0, 38539.0, 387533.0, 551943.0, 48835.0, 7647.0, 2010.0, 893.0, 426.0, 263.0, 159.0, 104.0, 61.0, 34.0, 28.0, 22.0, 16.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.11712646484375, -6.8084716796875, -6.49981689453125, -6.191162109375, -5.88250732421875, -5.5738525390625, -5.26519775390625, -4.95654296875, -4.64788818359375, -4.3392333984375, -4.03057861328125, -3.721923828125, -3.41326904296875, -3.1046142578125, -2.79595947265625, -2.4873046875, -2.17864990234375, -1.8699951171875, -1.56134033203125, -1.252685546875, -0.94403076171875, -0.6353759765625, -0.32672119140625, -0.01806640625, 0.29058837890625, 0.5992431640625, 0.90789794921875, 1.216552734375, 1.52520751953125, 1.8338623046875, 2.14251708984375, 2.451171875, 2.75982666015625, 3.0684814453125, 3.37713623046875, 3.685791015625, 3.99444580078125, 4.3031005859375, 4.61175537109375, 4.92041015625, 5.22906494140625, 5.5377197265625, 5.84637451171875, 6.155029296875, 6.46368408203125, 6.7723388671875, 7.08099365234375, 7.3896484375, 7.69830322265625, 8.0069580078125, 8.31561279296875, 8.624267578125, 8.93292236328125, 9.2415771484375, 9.55023193359375, 9.85888671875, 10.16754150390625, 10.4761962890625, 10.78485107421875, 11.093505859375, 11.40216064453125, 11.7108154296875, 12.01947021484375, 12.328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 7.0, 8.0, 10.0, 9.0, 15.0, 19.0, 19.0, 20.0, 25.0, 41.0, 34.0, 40.0, 38.0, 41.0, 49.0, 44.0, 39.0, 55.0, 57.0, 50.0, 46.0, 40.0, 30.0, 38.0, 27.0, 29.0, 33.0, 23.0, 28.0, 14.0, 14.0, 8.0, 3.0, 6.0, 8.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7984619140625, -5.612548828125, -5.4266357421875, -5.24072265625, -5.0548095703125, -4.868896484375, -4.6829833984375, -4.4970703125, -4.3111572265625, -4.125244140625, -3.9393310546875, -3.75341796875, -3.5675048828125, -3.381591796875, -3.1956787109375, -3.009765625, -2.8238525390625, -2.637939453125, -2.4520263671875, -2.26611328125, -2.0802001953125, -1.894287109375, -1.7083740234375, -1.5224609375, -1.3365478515625, -1.150634765625, -0.9647216796875, -0.77880859375, -0.5928955078125, -0.406982421875, -0.2210693359375, -0.03515625, 0.1507568359375, 0.336669921875, 0.5225830078125, 0.70849609375, 0.8944091796875, 1.080322265625, 1.2662353515625, 1.4521484375, 1.6380615234375, 1.823974609375, 2.0098876953125, 2.19580078125, 2.3817138671875, 2.567626953125, 2.7535400390625, 2.939453125, 3.1253662109375, 3.311279296875, 3.4971923828125, 3.68310546875, 3.8690185546875, 4.054931640625, 4.2408447265625, 4.4267578125, 4.6126708984375, 4.798583984375, 4.9844970703125, 5.17041015625, 5.3563232421875, 5.542236328125, 5.7281494140625, 5.9140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 13.0, 23.0, 22.0, 34.0, 58.0, 93.0, 175.0, 298.0, 622.0, 1246.0, 3039.0, 8145.0, 23854.0, 75957.0, 330608.0, 462081.0, 96846.0, 28849.0, 9854.0, 3695.0, 1498.0, 693.0, 337.0, 204.0, 101.0, 59.0, 43.0, 30.0, 21.0, 14.0, 8.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.015625, -3.91546630859375, -3.8153076171875, -3.71514892578125, -3.614990234375, -3.51483154296875, -3.4146728515625, -3.31451416015625, -3.21435546875, -3.11419677734375, -3.0140380859375, -2.91387939453125, -2.813720703125, -2.71356201171875, -2.6134033203125, -2.51324462890625, -2.4130859375, -2.31292724609375, -2.2127685546875, -2.11260986328125, -2.012451171875, -1.91229248046875, -1.8121337890625, -1.71197509765625, -1.61181640625, -1.51165771484375, -1.4114990234375, -1.31134033203125, -1.211181640625, -1.11102294921875, -1.0108642578125, -0.91070556640625, -0.810546875, -0.71038818359375, -0.6102294921875, -0.51007080078125, -0.409912109375, -0.30975341796875, -0.2095947265625, -0.10943603515625, -0.00927734375, 0.09088134765625, 0.1910400390625, 0.29119873046875, 0.391357421875, 0.49151611328125, 0.5916748046875, 0.69183349609375, 0.7919921875, 0.89215087890625, 0.9923095703125, 1.09246826171875, 1.192626953125, 1.29278564453125, 1.3929443359375, 1.49310302734375, 1.59326171875, 1.69342041015625, 1.7935791015625, 1.89373779296875, 1.993896484375, 2.09405517578125, 2.1942138671875, 2.29437255859375, 2.39453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 19.0, 10.0, 17.0, 27.0, 26.0, 38.0, 45.0, 55.0, 99.0, 207.0, 140.0, 62.0, 41.0, 29.0, 30.0, 25.0, 21.0, 17.0, 16.0, 11.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000835418701171875, -0.0008098036050796509, -0.0007841885089874268, -0.0007585734128952026, -0.0007329583168029785, -0.0007073432207107544, -0.0006817281246185303, -0.0006561130285263062, -0.000630497932434082, -0.0006048828363418579, -0.0005792677402496338, -0.0005536526441574097, -0.0005280375480651855, -0.0005024224519729614, -0.0004768073558807373, -0.0004511922597885132, -0.00042557716369628906, -0.00039996206760406494, -0.0003743469715118408, -0.0003487318754196167, -0.0003231167793273926, -0.00029750168323516846, -0.00027188658714294434, -0.0002462714910507202, -0.0002206563949584961, -0.00019504129886627197, -0.00016942620277404785, -0.00014381110668182373, -0.00011819601058959961, -9.258091449737549e-05, -6.696581840515137e-05, -4.1350722312927246e-05, -1.5735626220703125e-05, 9.879469871520996e-06, 3.549456596374512e-05, 6.110966205596924e-05, 8.672475814819336e-05, 0.00011233985424041748, 0.0001379549503326416, 0.00016357004642486572, 0.00018918514251708984, 0.00021480023860931396, 0.00024041533470153809, 0.0002660304307937622, 0.00029164552688598633, 0.00031726062297821045, 0.00034287571907043457, 0.0003684908151626587, 0.0003941059112548828, 0.00041972100734710693, 0.00044533610343933105, 0.0004709511995315552, 0.0004965662956237793, 0.0005221813917160034, 0.0005477964878082275, 0.0005734115839004517, 0.0005990266799926758, 0.0006246417760848999, 0.000650256872177124, 0.0006758719682693481, 0.0007014870643615723, 0.0007271021604537964, 0.0007527172565460205, 0.0007783323526382446, 0.0008039474487304688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 10.0, 18.0, 19.0, 20.0, 43.0, 51.0, 85.0, 163.0, 314.0, 560.0, 1420.0, 4589.0, 22625.0, 173400.0, 709442.0, 113809.0, 16021.0, 3655.0, 1154.0, 509.0, 241.0, 127.0, 85.0, 48.0, 34.0, 17.0, 22.0, 21.0, 10.0, 11.0, 8.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.1875, -6.0220947265625, -5.856689453125, -5.6912841796875, -5.52587890625, -5.3604736328125, -5.195068359375, -5.0296630859375, -4.8642578125, -4.6988525390625, -4.533447265625, -4.3680419921875, -4.20263671875, -4.0372314453125, -3.871826171875, -3.7064208984375, -3.541015625, -3.3756103515625, -3.210205078125, -3.0447998046875, -2.87939453125, -2.7139892578125, -2.548583984375, -2.3831787109375, -2.2177734375, -2.0523681640625, -1.886962890625, -1.7215576171875, -1.55615234375, -1.3907470703125, -1.225341796875, -1.0599365234375, -0.89453125, -0.7291259765625, -0.563720703125, -0.3983154296875, -0.23291015625, -0.0675048828125, 0.097900390625, 0.2633056640625, 0.4287109375, 0.5941162109375, 0.759521484375, 0.9249267578125, 1.09033203125, 1.2557373046875, 1.421142578125, 1.5865478515625, 1.751953125, 1.9173583984375, 2.082763671875, 2.2481689453125, 2.41357421875, 2.5789794921875, 2.744384765625, 2.9097900390625, 3.0751953125, 3.2406005859375, 3.406005859375, 3.5714111328125, 3.73681640625, 3.9022216796875, 4.067626953125, 4.2330322265625, 4.3984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 12.0, 19.0, 15.0, 31.0, 42.0, 69.0, 89.0, 118.0, 145.0, 126.0, 93.0, 70.0, 44.0, 33.0, 24.0, 10.0, 13.0, 11.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.26953125, -6.1324462890625, -5.995361328125, -5.8582763671875, -5.72119140625, -5.5841064453125, -5.447021484375, -5.3099365234375, -5.1728515625, -5.0357666015625, -4.898681640625, -4.7615966796875, -4.62451171875, -4.4874267578125, -4.350341796875, -4.2132568359375, -4.076171875, -3.9390869140625, -3.802001953125, -3.6649169921875, -3.52783203125, -3.3907470703125, -3.253662109375, -3.1165771484375, -2.9794921875, -2.8424072265625, -2.705322265625, -2.5682373046875, -2.43115234375, -2.2940673828125, -2.156982421875, -2.0198974609375, -1.8828125, -1.7457275390625, -1.608642578125, -1.4715576171875, -1.33447265625, -1.1973876953125, -1.060302734375, -0.9232177734375, -0.7861328125, -0.6490478515625, -0.511962890625, -0.3748779296875, -0.23779296875, -0.1007080078125, 0.036376953125, 0.1734619140625, 0.310546875, 0.4476318359375, 0.584716796875, 0.7218017578125, 0.85888671875, 0.9959716796875, 1.133056640625, 1.2701416015625, 1.4072265625, 1.5443115234375, 1.681396484375, 1.8184814453125, 1.95556640625, 2.0926513671875, 2.229736328125, 2.3668212890625, 2.50390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 21.0, 65.0, 181.0, 338.0, 251.0, 103.0, 24.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.445945739746094, -42.7911262512207, -39.13630676269531, -35.48148727416992, -31.82666778564453, -28.17184829711914, -24.51702880859375, -20.86220932006836, -17.20738983154297, -13.552570343017578, -9.897750854492188, -6.242931365966797, -2.5881118774414062, 1.0667076110839844, 4.721527099609375, 8.376346588134766, 12.031166076660156, 15.685985565185547, 19.340805053710938, 22.995624542236328, 26.65044403076172, 30.30526351928711, 33.9600830078125, 37.61490249633789, 41.26972198486328, 44.92454147338867, 48.57936096191406, 52.23418045043945, 55.888999938964844, 59.543819427490234, 63.198638916015625, 66.85345458984375, 70.50827026367188, 74.1630859375, 77.81790924072266, 81.47273254394531, 85.12754821777344, 88.78236389160156, 92.43718719482422, 96.09201049804688, 99.746826171875, 103.40164184570312, 107.05646514892578, 110.71128845214844, 114.36610412597656, 118.02091979980469, 121.67574310302734, 125.33056640625, 128.98538208007812, 132.64019775390625, 136.29501342773438, 139.94984436035156, 143.6046600341797, 147.2594757080078, 150.914306640625, 154.56912231445312, 158.22393798828125, 161.87875366210938, 165.5335693359375, 169.1884002685547, 172.8432159423828, 176.49803161621094, 180.15286254882812, 183.80767822265625, 187.46249389648438]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 8.0, 13.0, 13.0, 15.0, 15.0, 23.0, 20.0, 22.0, 17.0, 25.0, 36.0, 44.0, 33.0, 52.0, 35.0, 41.0, 45.0, 50.0, 43.0, 35.0, 45.0, 39.0, 44.0, 27.0, 29.0, 28.0, 27.0, 20.0, 22.0, 17.0, 18.0, 16.0, 11.0, 11.0, 6.0, 6.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.444995880126953, -28.50366973876953, -27.56234359741211, -26.621017456054688, -25.679691314697266, -24.738365173339844, -23.797039031982422, -22.855712890625, -21.914386749267578, -20.973060607910156, -20.031734466552734, -19.090408325195312, -18.14908218383789, -17.20775604248047, -16.266429901123047, -15.325104713439941, -14.383779525756836, -13.442453384399414, -12.501127243041992, -11.55980110168457, -10.618474960327148, -9.677148818969727, -8.735823631286621, -7.794497489929199, -6.853171348571777, -5.9118452072143555, -4.970519065856934, -4.02919340133667, -3.087867259979248, -2.146541118621826, -1.2052154541015625, -0.2638893127441406, 0.6774368286132812, 1.6187628507614136, 2.560088872909546, 3.5014147758483887, 4.4427409172058105, 5.384067058563232, 6.325392723083496, 7.266718864440918, 8.20804500579834, 9.149371147155762, 10.090697288513184, 11.032022476196289, 11.973348617553711, 12.914674758911133, 13.856000900268555, 14.797327041625977, 15.738653182983398, 16.67997932434082, 17.621305465698242, 18.562631607055664, 19.503957748413086, 20.445283889770508, 21.386608123779297, 22.32793426513672, 23.26926040649414, 24.210586547851562, 25.151912689208984, 26.093238830566406, 27.034564971923828, 27.97589111328125, 28.917217254638672, 29.858543395996094, 30.799869537353516]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 12.0, 21.0, 25.0, 59.0, 110.0, 221.0, 571.0, 1665.0, 6552.0, 32435.0, 398894.0, 3672063.0, 66051.0, 11341.0, 2787.0, 860.0, 294.0, 134.0, 74.0, 33.0, 27.0, 18.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7454833984375, -9.342529296875, -8.9395751953125, -8.53662109375, -8.1336669921875, -7.730712890625, -7.3277587890625, -6.9248046875, -6.5218505859375, -6.118896484375, -5.7159423828125, -5.31298828125, -4.9100341796875, -4.507080078125, -4.1041259765625, -3.701171875, -3.2982177734375, -2.895263671875, -2.4923095703125, -2.08935546875, -1.6864013671875, -1.283447265625, -0.8804931640625, -0.4775390625, -0.0745849609375, 0.328369140625, 0.7313232421875, 1.13427734375, 1.5372314453125, 1.940185546875, 2.3431396484375, 2.74609375, 3.1490478515625, 3.552001953125, 3.9549560546875, 4.35791015625, 4.7608642578125, 5.163818359375, 5.5667724609375, 5.9697265625, 6.3726806640625, 6.775634765625, 7.1785888671875, 7.58154296875, 7.9844970703125, 8.387451171875, 8.7904052734375, 9.193359375, 9.5963134765625, 9.999267578125, 10.4022216796875, 10.80517578125, 11.2081298828125, 11.611083984375, 12.0140380859375, 12.4169921875, 12.8199462890625, 13.222900390625, 13.6258544921875, 14.02880859375, 14.4317626953125, 14.834716796875, 15.2376708984375, 15.640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 5.0, 9.0, 11.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 31.0, 41.0, 41.0, 42.0, 43.0, 35.0, 48.0, 61.0, 59.0, 52.0, 46.0, 35.0, 44.0, 39.0, 36.0, 34.0, 36.0, 22.0, 13.0, 22.0, 16.0, 17.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3505859375, -1.3067779541015625, -1.262969970703125, -1.2191619873046875, -1.17535400390625, -1.1315460205078125, -1.087738037109375, -1.0439300537109375, -1.0001220703125, -0.9563140869140625, -0.912506103515625, -0.8686981201171875, -0.82489013671875, -0.7810821533203125, -0.737274169921875, -0.6934661865234375, -0.649658203125, -0.6058502197265625, -0.562042236328125, -0.5182342529296875, -0.47442626953125, -0.4306182861328125, -0.386810302734375, -0.3430023193359375, -0.2991943359375, -0.2553863525390625, -0.211578369140625, -0.1677703857421875, -0.12396240234375, -0.0801544189453125, -0.036346435546875, 0.0074615478515625, 0.05126953125, 0.0950775146484375, 0.138885498046875, 0.1826934814453125, 0.22650146484375, 0.2703094482421875, 0.314117431640625, 0.3579254150390625, 0.4017333984375, 0.4455413818359375, 0.489349365234375, 0.5331573486328125, 0.57696533203125, 0.6207733154296875, 0.664581298828125, 0.7083892822265625, 0.752197265625, 0.7960052490234375, 0.839813232421875, 0.8836212158203125, 0.92742919921875, 0.9712371826171875, 1.015045166015625, 1.0588531494140625, 1.1026611328125, 1.1464691162109375, 1.190277099609375, 1.2340850830078125, 1.27789306640625, 1.3217010498046875, 1.365509033203125, 1.4093170166015625, 1.453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 9.0, 8.0, 12.0, 12.0, 25.0, 34.0, 49.0, 65.0, 90.0, 133.0, 188.0, 284.0, 444.0, 737.0, 1215.0, 2190.0, 4384.0, 9058.0, 20804.0, 56349.0, 205633.0, 3089075.0, 633878.0, 107111.0, 34773.0, 13884.0, 6298.0, 3162.0, 1665.0, 962.0, 578.0, 367.0, 257.0, 147.0, 113.0, 78.0, 62.0, 38.0, 32.0, 19.0, 12.0, 10.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.24609375, -6.04949951171875, -5.8529052734375, -5.65631103515625, -5.459716796875, -5.26312255859375, -5.0665283203125, -4.86993408203125, -4.67333984375, -4.47674560546875, -4.2801513671875, -4.08355712890625, -3.886962890625, -3.69036865234375, -3.4937744140625, -3.29718017578125, -3.1005859375, -2.90399169921875, -2.7073974609375, -2.51080322265625, -2.314208984375, -2.11761474609375, -1.9210205078125, -1.72442626953125, -1.52783203125, -1.33123779296875, -1.1346435546875, -0.93804931640625, -0.741455078125, -0.54486083984375, -0.3482666015625, -0.15167236328125, 0.044921875, 0.24151611328125, 0.4381103515625, 0.63470458984375, 0.831298828125, 1.02789306640625, 1.2244873046875, 1.42108154296875, 1.61767578125, 1.81427001953125, 2.0108642578125, 2.20745849609375, 2.404052734375, 2.60064697265625, 2.7972412109375, 2.99383544921875, 3.1904296875, 3.38702392578125, 3.5836181640625, 3.78021240234375, 3.976806640625, 4.17340087890625, 4.3699951171875, 4.56658935546875, 4.76318359375, 4.95977783203125, 5.1563720703125, 5.35296630859375, 5.549560546875, 5.74615478515625, 5.9427490234375, 6.13934326171875, 6.3359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 14.0, 17.0, 29.0, 41.0, 58.0, 92.0, 140.0, 245.0, 736.0, 1684.0, 401.0, 189.0, 109.0, 63.0, 45.0, 42.0, 28.0, 19.0, 20.0, 12.0, 8.0, 7.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.16015625, -3.04815673828125, -2.9361572265625, -2.82415771484375, -2.712158203125, -2.60015869140625, -2.4881591796875, -2.37615966796875, -2.26416015625, -2.15216064453125, -2.0401611328125, -1.92816162109375, -1.816162109375, -1.70416259765625, -1.5921630859375, -1.48016357421875, -1.3681640625, -1.25616455078125, -1.1441650390625, -1.03216552734375, -0.920166015625, -0.80816650390625, -0.6961669921875, -0.58416748046875, -0.47216796875, -0.36016845703125, -0.2481689453125, -0.13616943359375, -0.024169921875, 0.08782958984375, 0.1998291015625, 0.31182861328125, 0.423828125, 0.53582763671875, 0.6478271484375, 0.75982666015625, 0.871826171875, 0.98382568359375, 1.0958251953125, 1.20782470703125, 1.31982421875, 1.43182373046875, 1.5438232421875, 1.65582275390625, 1.767822265625, 1.87982177734375, 1.9918212890625, 2.10382080078125, 2.2158203125, 2.32781982421875, 2.4398193359375, 2.55181884765625, 2.663818359375, 2.77581787109375, 2.8878173828125, 2.99981689453125, 3.11181640625, 3.22381591796875, 3.3358154296875, 3.44781494140625, 3.559814453125, 3.67181396484375, 3.7838134765625, 3.89581298828125, 4.0078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 11.0, 14.0, 27.0, 39.0, 46.0, 78.0, 105.0, 106.0, 130.0, 121.0, 77.0, 70.0, 62.0, 39.0, 28.0, 15.0, 7.0, 10.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.542293548583984, -11.814962387084961, -11.087631225585938, -10.360299110412598, -9.632967948913574, -8.90563678741455, -8.178304672241211, -7.4509735107421875, -6.723642349243164, -5.996311187744141, -5.268979549407959, -4.541647911071777, -3.814316749572754, -3.0869853496551514, -2.359653949737549, -1.6323223114013672, -0.9049911499023438, -0.1776597499847412, 0.5496716499328613, 1.2770030498504639, 2.0043344497680664, 2.731665849685669, 3.4589972496032715, 4.186328887939453, 4.913660049438477, 5.6409912109375, 6.368322849273682, 7.095654487609863, 7.822985649108887, 8.55031681060791, 9.27764892578125, 10.004980087280273, 10.732311248779297, 11.45964241027832, 12.186973571777344, 12.914305686950684, 13.641636848449707, 14.36896800994873, 15.09630012512207, 15.823631286621094, 16.550962448120117, 17.27829360961914, 18.005624771118164, 18.732955932617188, 19.460289001464844, 20.187620162963867, 20.91495132446289, 21.642282485961914, 22.369613647460938, 23.09694480895996, 23.824275970458984, 24.551607131958008, 25.27893829345703, 26.006271362304688, 26.73360252380371, 27.460933685302734, 28.188264846801758, 28.91559600830078, 29.642927169799805, 30.370258331298828, 31.097591400146484, 31.824922561645508, 32.55225372314453, 33.27958679199219, 34.00691604614258]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 14.0, 15.0, 18.0, 19.0, 23.0, 23.0, 36.0, 26.0, 27.0, 31.0, 31.0, 35.0, 42.0, 43.0, 48.0, 43.0, 44.0, 34.0, 40.0, 32.0, 46.0, 31.0, 29.0, 33.0, 27.0, 28.0, 18.0, 15.0, 17.0, 19.0, 16.0, 9.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.027045249938965, -10.672649383544922, -10.318252563476562, -9.96385669708252, -9.609460830688477, -9.255064010620117, -8.900668144226074, -8.546272277832031, -8.191875457763672, -7.837479114532471, -7.4830827713012695, -7.128686904907227, -6.774290561676025, -6.419894218444824, -6.065498352050781, -5.71110200881958, -5.356705665588379, -5.002309322357178, -4.647912979125977, -4.293517112731934, -3.9391207695007324, -3.5847244262695312, -3.230328321456909, -2.875932216644287, -2.521535873413086, -2.1671395301818848, -1.8127434253692627, -1.458347201347351, -1.1039509773254395, -0.7495547533035278, -0.3951585292816162, -0.04076242446899414, 0.31363487243652344, 0.6680310964584351, 1.0224273204803467, 1.3768235445022583, 1.73121976852417, 2.085616111755371, 2.440012216567993, 2.7944083213806152, 3.1488046646118164, 3.5032010078430176, 3.8575971126556396, 4.211993217468262, 4.566389560699463, 4.920785903930664, 5.275181770324707, 5.629578113555908, 5.983974456787109, 6.3383708000183105, 6.692767143249512, 7.047163009643555, 7.401559352874756, 7.755955696105957, 8.1103515625, 8.46474838256836, 8.819144248962402, 9.173540115356445, 9.527936935424805, 9.882332801818848, 10.23672866821289, 10.59112548828125, 10.945521354675293, 11.299917221069336, 11.654314041137695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 19.0, 23.0, 26.0, 68.0, 96.0, 168.0, 289.0, 615.0, 1291.0, 3147.0, 8648.0, 28011.0, 102977.0, 384054.0, 377173.0, 100549.0, 27158.0, 8557.0, 3101.0, 1288.0, 570.0, 291.0, 188.0, 94.0, 59.0, 26.0, 18.0, 10.0, 7.0, 7.0, 3.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.63739013671875, -6.4232177734375, -6.20904541015625, -5.994873046875, -5.78070068359375, -5.5665283203125, -5.35235595703125, -5.13818359375, -4.92401123046875, -4.7098388671875, -4.49566650390625, -4.281494140625, -4.06732177734375, -3.8531494140625, -3.63897705078125, -3.4248046875, -3.21063232421875, -2.9964599609375, -2.78228759765625, -2.568115234375, -2.35394287109375, -2.1397705078125, -1.92559814453125, -1.71142578125, -1.49725341796875, -1.2830810546875, -1.06890869140625, -0.854736328125, -0.64056396484375, -0.4263916015625, -0.21221923828125, 0.001953125, 0.21612548828125, 0.4302978515625, 0.64447021484375, 0.858642578125, 1.07281494140625, 1.2869873046875, 1.50115966796875, 1.71533203125, 1.92950439453125, 2.1436767578125, 2.35784912109375, 2.572021484375, 2.78619384765625, 3.0003662109375, 3.21453857421875, 3.4287109375, 3.64288330078125, 3.8570556640625, 4.07122802734375, 4.285400390625, 4.49957275390625, 4.7137451171875, 4.92791748046875, 5.14208984375, 5.35626220703125, 5.5704345703125, 5.78460693359375, 5.998779296875, 6.21295166015625, 6.4271240234375, 6.64129638671875, 6.85546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 8.0, 15.0, 17.0, 22.0, 19.0, 25.0, 28.0, 34.0, 39.0, 53.0, 43.0, 46.0, 54.0, 42.0, 49.0, 61.0, 59.0, 50.0, 38.0, 56.0, 38.0, 41.0, 27.0, 29.0, 23.0, 20.0, 18.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.638671875, -1.5885772705078125, -1.538482666015625, -1.4883880615234375, -1.43829345703125, -1.3881988525390625, -1.338104248046875, -1.2880096435546875, -1.2379150390625, -1.1878204345703125, -1.137725830078125, -1.0876312255859375, -1.03753662109375, -0.9874420166015625, -0.937347412109375, -0.8872528076171875, -0.837158203125, -0.7870635986328125, -0.736968994140625, -0.6868743896484375, -0.63677978515625, -0.5866851806640625, -0.536590576171875, -0.4864959716796875, -0.4364013671875, -0.3863067626953125, -0.336212158203125, -0.2861175537109375, -0.23602294921875, -0.1859283447265625, -0.135833740234375, -0.0857391357421875, -0.03564453125, 0.0144500732421875, 0.064544677734375, 0.1146392822265625, 0.16473388671875, 0.2148284912109375, 0.264923095703125, 0.3150177001953125, 0.3651123046875, 0.4152069091796875, 0.465301513671875, 0.5153961181640625, 0.56549072265625, 0.6155853271484375, 0.665679931640625, 0.7157745361328125, 0.765869140625, 0.8159637451171875, 0.866058349609375, 0.9161529541015625, 0.96624755859375, 1.0163421630859375, 1.066436767578125, 1.1165313720703125, 1.1666259765625, 1.2167205810546875, 1.266815185546875, 1.3169097900390625, 1.36700439453125, 1.4170989990234375, 1.467193603515625, 1.5172882080078125, 1.5673828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 7.0, 6.0, 10.0, 12.0, 13.0, 24.0, 37.0, 31.0, 80.0, 130.0, 221.0, 356.0, 660.0, 1360.0, 3668.0, 14321.0, 107283.0, 718131.0, 173607.0, 20488.0, 4614.0, 1656.0, 812.0, 417.0, 223.0, 140.0, 73.0, 61.0, 35.0, 21.0, 16.0, 9.0, 20.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -11.03271484375, -10.7138671875, -10.39501953125, -10.076171875, -9.75732421875, -9.4384765625, -9.11962890625, -8.80078125, -8.48193359375, -8.1630859375, -7.84423828125, -7.525390625, -7.20654296875, -6.8876953125, -6.56884765625, -6.25, -5.93115234375, -5.6123046875, -5.29345703125, -4.974609375, -4.65576171875, -4.3369140625, -4.01806640625, -3.69921875, -3.38037109375, -3.0615234375, -2.74267578125, -2.423828125, -2.10498046875, -1.7861328125, -1.46728515625, -1.1484375, -0.82958984375, -0.5107421875, -0.19189453125, 0.126953125, 0.44580078125, 0.7646484375, 1.08349609375, 1.40234375, 1.72119140625, 2.0400390625, 2.35888671875, 2.677734375, 2.99658203125, 3.3154296875, 3.63427734375, 3.953125, 4.27197265625, 4.5908203125, 4.90966796875, 5.228515625, 5.54736328125, 5.8662109375, 6.18505859375, 6.50390625, 6.82275390625, 7.1416015625, 7.46044921875, 7.779296875, 8.09814453125, 8.4169921875, 8.73583984375, 9.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 9.0, 19.0, 24.0, 16.0, 24.0, 24.0, 24.0, 32.0, 36.0, 36.0, 38.0, 32.0, 46.0, 47.0, 50.0, 44.0, 44.0, 37.0, 46.0, 45.0, 56.0, 31.0, 31.0, 26.0, 22.0, 26.0, 19.0, 23.0, 14.0, 9.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.23046875, -7.008544921875, -6.78662109375, -6.564697265625, -6.3427734375, -6.120849609375, -5.89892578125, -5.677001953125, -5.455078125, -5.233154296875, -5.01123046875, -4.789306640625, -4.5673828125, -4.345458984375, -4.12353515625, -3.901611328125, -3.6796875, -3.457763671875, -3.23583984375, -3.013916015625, -2.7919921875, -2.570068359375, -2.34814453125, -2.126220703125, -1.904296875, -1.682373046875, -1.46044921875, -1.238525390625, -1.0166015625, -0.794677734375, -0.57275390625, -0.350830078125, -0.12890625, 0.093017578125, 0.31494140625, 0.536865234375, 0.7587890625, 0.980712890625, 1.20263671875, 1.424560546875, 1.646484375, 1.868408203125, 2.09033203125, 2.312255859375, 2.5341796875, 2.756103515625, 2.97802734375, 3.199951171875, 3.421875, 3.643798828125, 3.86572265625, 4.087646484375, 4.3095703125, 4.531494140625, 4.75341796875, 4.975341796875, 5.197265625, 5.419189453125, 5.64111328125, 5.863037109375, 6.0849609375, 6.306884765625, 6.52880859375, 6.750732421875, 6.97265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 11.0, 12.0, 30.0, 36.0, 79.0, 103.0, 242.0, 494.0, 1150.0, 3110.0, 10778.0, 56634.0, 394649.0, 488475.0, 73377.0, 13415.0, 3506.0, 1271.0, 539.0, 281.0, 134.0, 81.0, 53.0, 22.0, 24.0, 11.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.899169921875, -4.75537109375, -4.611572265625, -4.4677734375, -4.323974609375, -4.18017578125, -4.036376953125, -3.892578125, -3.748779296875, -3.60498046875, -3.461181640625, -3.3173828125, -3.173583984375, -3.02978515625, -2.885986328125, -2.7421875, -2.598388671875, -2.45458984375, -2.310791015625, -2.1669921875, -2.023193359375, -1.87939453125, -1.735595703125, -1.591796875, -1.447998046875, -1.30419921875, -1.160400390625, -1.0166015625, -0.872802734375, -0.72900390625, -0.585205078125, -0.44140625, -0.297607421875, -0.15380859375, -0.010009765625, 0.1337890625, 0.277587890625, 0.42138671875, 0.565185546875, 0.708984375, 0.852783203125, 0.99658203125, 1.140380859375, 1.2841796875, 1.427978515625, 1.57177734375, 1.715576171875, 1.859375, 2.003173828125, 2.14697265625, 2.290771484375, 2.4345703125, 2.578369140625, 2.72216796875, 2.865966796875, 3.009765625, 3.153564453125, 3.29736328125, 3.441162109375, 3.5849609375, 3.728759765625, 3.87255859375, 4.016357421875, 4.16015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 18.0, 12.0, 24.0, 28.0, 30.0, 47.0, 61.0, 70.0, 76.0, 101.0, 100.0, 78.0, 64.0, 60.0, 38.0, 28.0, 28.0, 23.0, 21.0, 11.0, 12.0, 6.0, 3.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006122589111328125, -0.0005916431546211243, -0.000571027398109436, -0.0005504116415977478, -0.0005297958850860596, -0.0005091801285743713, -0.0004885643720626831, -0.0004679486155509949, -0.00044733285903930664, -0.0004267171025276184, -0.0004061013460159302, -0.00038548558950424194, -0.0003648698329925537, -0.0003442540764808655, -0.00032363831996917725, -0.000303022563457489, -0.0002824068069458008, -0.00026179105043411255, -0.00024117529392242432, -0.00022055953741073608, -0.00019994378089904785, -0.00017932802438735962, -0.0001587122678756714, -0.00013809651136398315, -0.00011748075485229492, -9.686499834060669e-05, -7.624924182891846e-05, -5.5633485317230225e-05, -3.501772880554199e-05, -1.440197229385376e-05, 6.213784217834473e-06, 2.6829540729522705e-05, 4.744529724121094e-05, 6.806105375289917e-05, 8.86768102645874e-05, 0.00010929256677627563, 0.00012990832328796387, 0.0001505240797996521, 0.00017113983631134033, 0.00019175559282302856, 0.0002123713493347168, 0.00023298710584640503, 0.00025360286235809326, 0.0002742186188697815, 0.0002948343753814697, 0.00031545013189315796, 0.0003360658884048462, 0.0003566816449165344, 0.00037729740142822266, 0.0003979131579399109, 0.0004185289144515991, 0.00043914467096328735, 0.0004597604274749756, 0.0004803761839866638, 0.000500991940498352, 0.0005216076970100403, 0.0005422234535217285, 0.0005628392100334167, 0.000583454966545105, 0.0006040707230567932, 0.0006246864795684814, 0.0006453022360801697, 0.0006659179925918579, 0.0006865337491035461, 0.0007071495056152344]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 16.0, 41.0, 63.0, 187.0, 493.0, 1576.0, 8214.0, 109368.0, 841762.0, 77975.0, 6720.0, 1378.0, 414.0, 178.0, 77.0, 39.0, 15.0, 9.0, 7.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5152587890625, -7.241455078125, -6.9676513671875, -6.69384765625, -6.4200439453125, -6.146240234375, -5.8724365234375, -5.5986328125, -5.3248291015625, -5.051025390625, -4.7772216796875, -4.50341796875, -4.2296142578125, -3.955810546875, -3.6820068359375, -3.408203125, -3.1343994140625, -2.860595703125, -2.5867919921875, -2.31298828125, -2.0391845703125, -1.765380859375, -1.4915771484375, -1.2177734375, -0.9439697265625, -0.670166015625, -0.3963623046875, -0.12255859375, 0.1512451171875, 0.425048828125, 0.6988525390625, 0.97265625, 1.2464599609375, 1.520263671875, 1.7940673828125, 2.06787109375, 2.3416748046875, 2.615478515625, 2.8892822265625, 3.1630859375, 3.4368896484375, 3.710693359375, 3.9844970703125, 4.25830078125, 4.5321044921875, 4.805908203125, 5.0797119140625, 5.353515625, 5.6273193359375, 5.901123046875, 6.1749267578125, 6.44873046875, 6.7225341796875, 6.996337890625, 7.2701416015625, 7.5439453125, 7.8177490234375, 8.091552734375, 8.3653564453125, 8.63916015625, 8.9129638671875, 9.186767578125, 9.4605712890625, 9.734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 8.0, 15.0, 14.0, 16.0, 25.0, 39.0, 38.0, 64.0, 66.0, 65.0, 85.0, 84.0, 45.0, 70.0, 69.0, 66.0, 31.0, 33.0, 34.0, 24.0, 20.0, 11.0, 10.0, 9.0, 2.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.931640625, -2.841827392578125, -2.75201416015625, -2.662200927734375, -2.5723876953125, -2.482574462890625, -2.39276123046875, -2.302947998046875, -2.213134765625, -2.123321533203125, -2.03350830078125, -1.943695068359375, -1.8538818359375, -1.764068603515625, -1.67425537109375, -1.584442138671875, -1.49462890625, -1.404815673828125, -1.31500244140625, -1.225189208984375, -1.1353759765625, -1.045562744140625, -0.95574951171875, -0.865936279296875, -0.776123046875, -0.686309814453125, -0.59649658203125, -0.506683349609375, -0.4168701171875, -0.327056884765625, -0.23724365234375, -0.147430419921875, -0.0576171875, 0.032196044921875, 0.12200927734375, 0.211822509765625, 0.3016357421875, 0.391448974609375, 0.48126220703125, 0.571075439453125, 0.660888671875, 0.750701904296875, 0.84051513671875, 0.930328369140625, 1.0201416015625, 1.109954833984375, 1.19976806640625, 1.289581298828125, 1.37939453125, 1.469207763671875, 1.55902099609375, 1.648834228515625, 1.7386474609375, 1.828460693359375, 1.91827392578125, 2.008087158203125, 2.097900390625, 2.187713623046875, 2.27752685546875, 2.367340087890625, 2.4571533203125, 2.546966552734375, 2.63677978515625, 2.726593017578125, 2.81640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 13.0, 12.0, 22.0, 33.0, 29.0, 49.0, 68.0, 99.0, 93.0, 132.0, 94.0, 89.0, 81.0, 54.0, 42.0, 31.0, 23.0, 5.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.91415786743164, -41.5188102722168, -40.12346267700195, -38.72811508178711, -37.33277130126953, -35.93742370605469, -34.542076110839844, -33.146728515625, -31.751380920410156, -30.356033325195312, -28.96068572998047, -27.565340042114258, -26.169992446899414, -24.77464485168457, -23.37929916381836, -21.983951568603516, -20.588603973388672, -19.193256378173828, -17.797908782958984, -16.402563095092773, -15.00721549987793, -13.611867904663086, -12.216521263122559, -10.821174621582031, -9.425827026367188, -8.030479431152344, -6.635132789611816, -5.239785671234131, -3.8444385528564453, -2.4490914344787598, -1.0537443161010742, 0.3416023254394531, 1.7369461059570312, 3.132293224334717, 4.527640342712402, 5.922987461090088, 7.318334579467773, 8.713682174682617, 10.109028816223145, 11.504375457763672, 12.899723052978516, 14.29507064819336, 15.690417289733887, 17.085763931274414, 18.481111526489258, 19.8764591217041, 21.271804809570312, 22.667152404785156, 24.0625, 25.457847595214844, 26.853195190429688, 28.2485408782959, 29.643888473510742, 31.039236068725586, 32.4345817565918, 33.82992935180664, 35.225276947021484, 36.62062454223633, 38.01597213745117, 39.411319732666016, 40.806663513183594, 42.20201110839844, 43.59735870361328, 44.992706298828125, 46.38805389404297]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 9.0, 13.0, 8.0, 12.0, 26.0, 26.0, 23.0, 41.0, 38.0, 36.0, 44.0, 40.0, 44.0, 49.0, 42.0, 48.0, 48.0, 50.0, 41.0, 44.0, 29.0, 33.0, 27.0, 35.0, 25.0, 18.0, 27.0, 18.0, 12.0, 10.0, 10.0, 9.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.061729431152344, -31.95173454284668, -30.841739654541016, -29.731746673583984, -28.62175178527832, -27.511756896972656, -26.401763916015625, -25.29176902770996, -24.181774139404297, -23.071779251098633, -21.96178436279297, -20.851791381835938, -19.741796493530273, -18.63180160522461, -17.521808624267578, -16.411813735961914, -15.30181884765625, -14.191823959350586, -13.081830024719238, -11.97183609008789, -10.861841201782227, -9.751846313476562, -8.641852378845215, -7.531857967376709, -6.421863555908203, -5.311869144439697, -4.201874732971191, -3.0918803215026855, -1.9818859100341797, -0.8718914985656738, 0.23810291290283203, 1.348097324371338, 2.4580917358398438, 3.5680861473083496, 4.6780805587768555, 5.788074970245361, 6.898069381713867, 8.008064270019531, 9.118058204650879, 10.228052139282227, 11.33804702758789, 12.448041915893555, 13.558035850524902, 14.66802978515625, 15.778024673461914, 16.888019561767578, 17.99801254272461, 19.108007431030273, 20.218002319335938, 21.3279972076416, 22.437992095947266, 23.547985076904297, 24.65797996520996, 25.767974853515625, 26.877967834472656, 27.98796272277832, 29.097957611083984, 30.20795249938965, 31.317947387695312, 32.427940368652344, 33.537933349609375, 34.64793014526367, 35.7579231262207, 36.867919921875, 37.97791290283203]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 17.0, 5.0, 6.0, 14.0, 25.0, 23.0, 43.0, 68.0, 106.0, 149.0, 233.0, 380.0, 654.0, 1084.0, 1793.0, 3522.0, 7646.0, 24925.0, 3926244.0, 196586.0, 17639.0, 6108.0, 2900.0, 1585.0, 948.0, 555.0, 344.0, 229.0, 140.0, 92.0, 64.0, 50.0, 33.0, 25.0, 15.0, 11.0, 7.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.390625, -11.081787109375, -10.77294921875, -10.464111328125, -10.1552734375, -9.846435546875, -9.53759765625, -9.228759765625, -8.919921875, -8.611083984375, -8.30224609375, -7.993408203125, -7.6845703125, -7.375732421875, -7.06689453125, -6.758056640625, -6.44921875, -6.140380859375, -5.83154296875, -5.522705078125, -5.2138671875, -4.905029296875, -4.59619140625, -4.287353515625, -3.978515625, -3.669677734375, -3.36083984375, -3.052001953125, -2.7431640625, -2.434326171875, -2.12548828125, -1.816650390625, -1.5078125, -1.198974609375, -0.89013671875, -0.581298828125, -0.2724609375, 0.036376953125, 0.34521484375, 0.654052734375, 0.962890625, 1.271728515625, 1.58056640625, 1.889404296875, 2.1982421875, 2.507080078125, 2.81591796875, 3.124755859375, 3.43359375, 3.742431640625, 4.05126953125, 4.360107421875, 4.6689453125, 4.977783203125, 5.28662109375, 5.595458984375, 5.904296875, 6.213134765625, 6.52197265625, 6.830810546875, 7.1396484375, 7.448486328125, 7.75732421875, 8.066162109375, 8.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 7.0, 7.0, 9.0, 23.0, 24.0, 24.0, 30.0, 34.0, 52.0, 43.0, 48.0, 48.0, 63.0, 69.0, 71.0, 61.0, 72.0, 59.0, 37.0, 49.0, 34.0, 32.0, 20.0, 12.0, 16.0, 12.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.8614044189453125, -1.800933837890625, -1.7404632568359375, -1.67999267578125, -1.6195220947265625, -1.559051513671875, -1.4985809326171875, -1.4381103515625, -1.3776397705078125, -1.317169189453125, -1.2566986083984375, -1.19622802734375, -1.1357574462890625, -1.075286865234375, -1.0148162841796875, -0.954345703125, -0.8938751220703125, -0.833404541015625, -0.7729339599609375, -0.71246337890625, -0.6519927978515625, -0.591522216796875, -0.5310516357421875, -0.4705810546875, -0.4101104736328125, -0.349639892578125, -0.2891693115234375, -0.22869873046875, -0.1682281494140625, -0.107757568359375, -0.0472869873046875, 0.01318359375, 0.0736541748046875, 0.134124755859375, 0.1945953369140625, 0.25506591796875, 0.3155364990234375, 0.376007080078125, 0.4364776611328125, 0.4969482421875, 0.5574188232421875, 0.617889404296875, 0.6783599853515625, 0.73883056640625, 0.7993011474609375, 0.859771728515625, 0.9202423095703125, 0.980712890625, 1.0411834716796875, 1.101654052734375, 1.1621246337890625, 1.22259521484375, 1.2830657958984375, 1.343536376953125, 1.4040069580078125, 1.4644775390625, 1.5249481201171875, 1.585418701171875, 1.6458892822265625, 1.70635986328125, 1.7668304443359375, 1.827301025390625, 1.8877716064453125, 1.9482421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 10.0, 19.0, 21.0, 36.0, 62.0, 75.0, 115.0, 179.0, 252.0, 374.0, 583.0, 945.0, 1899.0, 4773.0, 27763.0, 4080460.0, 64413.0, 6914.0, 2341.0, 1132.0, 637.0, 390.0, 269.0, 191.0, 126.0, 83.0, 66.0, 48.0, 20.0, 18.0, 9.0, 14.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.278564453125, -12.81494140625, -12.351318359375, -11.8876953125, -11.424072265625, -10.96044921875, -10.496826171875, -10.033203125, -9.569580078125, -9.10595703125, -8.642333984375, -8.1787109375, -7.715087890625, -7.25146484375, -6.787841796875, -6.32421875, -5.860595703125, -5.39697265625, -4.933349609375, -4.4697265625, -4.006103515625, -3.54248046875, -3.078857421875, -2.615234375, -2.151611328125, -1.68798828125, -1.224365234375, -0.7607421875, -0.297119140625, 0.16650390625, 0.630126953125, 1.09375, 1.557373046875, 2.02099609375, 2.484619140625, 2.9482421875, 3.411865234375, 3.87548828125, 4.339111328125, 4.802734375, 5.266357421875, 5.72998046875, 6.193603515625, 6.6572265625, 7.120849609375, 7.58447265625, 8.048095703125, 8.51171875, 8.975341796875, 9.43896484375, 9.902587890625, 10.3662109375, 10.829833984375, 11.29345703125, 11.757080078125, 12.220703125, 12.684326171875, 13.14794921875, 13.611572265625, 14.0751953125, 14.538818359375, 15.00244140625, 15.466064453125, 15.9296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 17.0, 20.0, 47.0, 156.0, 3519.0, 210.0, 47.0, 25.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.133392333984375, -2.04998779296875, -1.966583251953125, -1.8831787109375, -1.799774169921875, -1.71636962890625, -1.632965087890625, -1.549560546875, -1.466156005859375, -1.38275146484375, -1.299346923828125, -1.2159423828125, -1.132537841796875, -1.04913330078125, -0.965728759765625, -0.88232421875, -0.798919677734375, -0.71551513671875, -0.632110595703125, -0.5487060546875, -0.465301513671875, -0.38189697265625, -0.298492431640625, -0.215087890625, -0.131683349609375, -0.04827880859375, 0.035125732421875, 0.1185302734375, 0.201934814453125, 0.28533935546875, 0.368743896484375, 0.4521484375, 0.535552978515625, 0.61895751953125, 0.702362060546875, 0.7857666015625, 0.869171142578125, 0.95257568359375, 1.035980224609375, 1.119384765625, 1.202789306640625, 1.28619384765625, 1.369598388671875, 1.4530029296875, 1.536407470703125, 1.61981201171875, 1.703216552734375, 1.78662109375, 1.870025634765625, 1.95343017578125, 2.036834716796875, 2.1202392578125, 2.203643798828125, 2.28704833984375, 2.370452880859375, 2.453857421875, 2.537261962890625, 2.62066650390625, 2.704071044921875, 2.7874755859375, 2.870880126953125, 2.95428466796875, 3.037689208984375, 3.12109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 11.0, 10.0, 25.0, 26.0, 35.0, 41.0, 68.0, 84.0, 105.0, 115.0, 88.0, 99.0, 75.0, 70.0, 50.0, 28.0, 17.0, 22.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.274593353271484, -8.061896324157715, -7.849198341369629, -7.636501312255859, -7.423803806304932, -7.211106300354004, -6.998409271240234, -6.785711765289307, -6.573014259338379, -6.360316753387451, -6.147619247436523, -5.934922218322754, -5.722224712371826, -5.509527206420898, -5.296830177307129, -5.084132671356201, -4.871435165405273, -4.658737659454346, -4.446040153503418, -4.233343124389648, -4.020645618438721, -3.807948112487793, -3.5952508449554443, -3.3825535774230957, -3.169856071472168, -2.9571585655212402, -2.7444612979888916, -2.531764030456543, -2.3190665245056152, -2.1063690185546875, -1.8936717510223389, -1.6809743642807007, -1.4682765007019043, -1.2555791139602661, -1.042881727218628, -0.8301843404769897, -0.6174869537353516, -0.4047895669937134, -0.1920921802520752, 0.02060520648956299, 0.23330259323120117, 0.44599997997283936, 0.6586973667144775, 0.8713947534561157, 1.084092140197754, 1.296789526939392, 1.5094869136810303, 1.7221843004226685, 1.9348816871643066, 2.1475791931152344, 2.360276460647583, 2.5729737281799316, 2.7856712341308594, 2.998368740081787, 3.2110660076141357, 3.4237632751464844, 3.636460781097412, 3.84915828704834, 4.061855316162109, 4.274552822113037, 4.487250328063965, 4.699947834014893, 4.91264533996582, 5.12534236907959, 5.338039875030518]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 16.0, 10.0, 11.0, 20.0, 22.0, 28.0, 29.0, 22.0, 25.0, 33.0, 38.0, 27.0, 45.0, 41.0, 47.0, 41.0, 48.0, 37.0, 38.0, 44.0, 45.0, 26.0, 34.0, 41.0, 23.0, 32.0, 20.0, 27.0, 17.0, 14.0, 13.0, 17.0, 9.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.4689292907714844, -3.3560986518859863, -3.2432680130004883, -3.130437135696411, -3.017606496810913, -2.904775857925415, -2.791944980621338, -2.67911434173584, -2.566283702850342, -2.4534530639648438, -2.3406224250793457, -2.2277915477752686, -2.1149609088897705, -2.0021302700042725, -1.8892995119094849, -1.7764687538146973, -1.6636381149291992, -1.5508074760437012, -1.4379767179489136, -1.325145959854126, -1.212315320968628, -1.0994846820831299, -0.9866539239883423, -0.8738232254981995, -0.7609925270080566, -0.6481618285179138, -0.535331130027771, -0.4225004315376282, -0.30966973304748535, -0.19683903455734253, -0.08400833606719971, 0.028822362422943115, 0.14165306091308594, 0.25448375940322876, 0.3673144578933716, 0.4801451563835144, 0.5929758548736572, 0.7058065533638, 0.8186372518539429, 0.9314679503440857, 1.0442986488342285, 1.1571292877197266, 1.2699600458145142, 1.3827908039093018, 1.4956214427947998, 1.6084520816802979, 1.7212828397750854, 1.834113597869873, 1.946944236755371, 2.059774875640869, 2.172605514526367, 2.2854363918304443, 2.3982670307159424, 2.5110976696014404, 2.6239285469055176, 2.7367591857910156, 2.8495898246765137, 2.9624204635620117, 3.0752511024475098, 3.188081979751587, 3.300912618637085, 3.413743257522583, 3.52657413482666, 3.639404773712158, 3.7522354125976562]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 11.0, 9.0, 10.0, 24.0, 42.0, 67.0, 120.0, 211.0, 421.0, 797.0, 1930.0, 4705.0, 13189.0, 39208.0, 128568.0, 376640.0, 327687.0, 104684.0, 32302.0, 10640.0, 4085.0, 1642.0, 757.0, 362.0, 185.0, 100.0, 48.0, 35.0, 22.0, 14.0, 15.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.80859375, -6.6241455078125, -6.439697265625, -6.2552490234375, -6.07080078125, -5.8863525390625, -5.701904296875, -5.5174560546875, -5.3330078125, -5.1485595703125, -4.964111328125, -4.7796630859375, -4.59521484375, -4.4107666015625, -4.226318359375, -4.0418701171875, -3.857421875, -3.6729736328125, -3.488525390625, -3.3040771484375, -3.11962890625, -2.9351806640625, -2.750732421875, -2.5662841796875, -2.3818359375, -2.1973876953125, -2.012939453125, -1.8284912109375, -1.64404296875, -1.4595947265625, -1.275146484375, -1.0906982421875, -0.90625, -0.7218017578125, -0.537353515625, -0.3529052734375, -0.16845703125, 0.0159912109375, 0.200439453125, 0.3848876953125, 0.5693359375, 0.7537841796875, 0.938232421875, 1.1226806640625, 1.30712890625, 1.4915771484375, 1.676025390625, 1.8604736328125, 2.044921875, 2.2293701171875, 2.413818359375, 2.5982666015625, 2.78271484375, 2.9671630859375, 3.151611328125, 3.3360595703125, 3.5205078125, 3.7049560546875, 3.889404296875, 4.0738525390625, 4.25830078125, 4.4427490234375, 4.627197265625, 4.8116455078125, 4.99609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 7.0, 9.0, 12.0, 18.0, 19.0, 19.0, 29.0, 22.0, 32.0, 29.0, 49.0, 50.0, 43.0, 48.0, 55.0, 67.0, 51.0, 54.0, 55.0, 56.0, 50.0, 49.0, 45.0, 27.0, 29.0, 10.0, 19.0, 8.0, 5.0, 11.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.892547607421875, -1.83099365234375, -1.769439697265625, -1.7078857421875, -1.646331787109375, -1.58477783203125, -1.523223876953125, -1.461669921875, -1.400115966796875, -1.33856201171875, -1.277008056640625, -1.2154541015625, -1.153900146484375, -1.09234619140625, -1.030792236328125, -0.96923828125, -0.907684326171875, -0.84613037109375, -0.784576416015625, -0.7230224609375, -0.661468505859375, -0.59991455078125, -0.538360595703125, -0.476806640625, -0.415252685546875, -0.35369873046875, -0.292144775390625, -0.2305908203125, -0.169036865234375, -0.10748291015625, -0.045928955078125, 0.015625, 0.077178955078125, 0.13873291015625, 0.200286865234375, 0.2618408203125, 0.323394775390625, 0.38494873046875, 0.446502685546875, 0.508056640625, 0.569610595703125, 0.63116455078125, 0.692718505859375, 0.7542724609375, 0.815826416015625, 0.87738037109375, 0.938934326171875, 1.00048828125, 1.062042236328125, 1.12359619140625, 1.185150146484375, 1.2467041015625, 1.308258056640625, 1.36981201171875, 1.431365966796875, 1.492919921875, 1.554473876953125, 1.61602783203125, 1.677581787109375, 1.7391357421875, 1.800689697265625, 1.86224365234375, 1.923797607421875, 1.9853515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 9.0, 13.0, 22.0, 36.0, 51.0, 73.0, 121.0, 171.0, 249.0, 422.0, 779.0, 1379.0, 3271.0, 10537.0, 47454.0, 328767.0, 548957.0, 81912.0, 15853.0, 4462.0, 1735.0, 914.0, 497.0, 291.0, 181.0, 126.0, 92.0, 48.0, 27.0, 23.0, 12.0, 13.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.62249755859375, -7.3778076171875, -7.13311767578125, -6.888427734375, -6.64373779296875, -6.3990478515625, -6.15435791015625, -5.90966796875, -5.66497802734375, -5.4202880859375, -5.17559814453125, -4.930908203125, -4.68621826171875, -4.4415283203125, -4.19683837890625, -3.9521484375, -3.70745849609375, -3.4627685546875, -3.21807861328125, -2.973388671875, -2.72869873046875, -2.4840087890625, -2.23931884765625, -1.99462890625, -1.74993896484375, -1.5052490234375, -1.26055908203125, -1.015869140625, -0.77117919921875, -0.5264892578125, -0.28179931640625, -0.037109375, 0.20758056640625, 0.4522705078125, 0.69696044921875, 0.941650390625, 1.18634033203125, 1.4310302734375, 1.67572021484375, 1.92041015625, 2.16510009765625, 2.4097900390625, 2.65447998046875, 2.899169921875, 3.14385986328125, 3.3885498046875, 3.63323974609375, 3.8779296875, 4.12261962890625, 4.3673095703125, 4.61199951171875, 4.856689453125, 5.10137939453125, 5.3460693359375, 5.59075927734375, 5.83544921875, 6.08013916015625, 6.3248291015625, 6.56951904296875, 6.814208984375, 7.05889892578125, 7.3035888671875, 7.54827880859375, 7.79296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 9.0, 13.0, 18.0, 20.0, 16.0, 32.0, 24.0, 26.0, 24.0, 22.0, 34.0, 29.0, 40.0, 37.0, 47.0, 48.0, 31.0, 52.0, 36.0, 41.0, 41.0, 33.0, 46.0, 33.0, 23.0, 28.0, 21.0, 32.0, 21.0, 17.0, 12.0, 9.0, 8.0, 16.0, 6.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.31640625, -7.08319091796875, -6.8499755859375, -6.61676025390625, -6.383544921875, -6.15032958984375, -5.9171142578125, -5.68389892578125, -5.45068359375, -5.21746826171875, -4.9842529296875, -4.75103759765625, -4.517822265625, -4.28460693359375, -4.0513916015625, -3.81817626953125, -3.5849609375, -3.35174560546875, -3.1185302734375, -2.88531494140625, -2.652099609375, -2.41888427734375, -2.1856689453125, -1.95245361328125, -1.71923828125, -1.48602294921875, -1.2528076171875, -1.01959228515625, -0.786376953125, -0.55316162109375, -0.3199462890625, -0.08673095703125, 0.146484375, 0.37969970703125, 0.6129150390625, 0.84613037109375, 1.079345703125, 1.31256103515625, 1.5457763671875, 1.77899169921875, 2.01220703125, 2.24542236328125, 2.4786376953125, 2.71185302734375, 2.945068359375, 3.17828369140625, 3.4114990234375, 3.64471435546875, 3.8779296875, 4.11114501953125, 4.3443603515625, 4.57757568359375, 4.810791015625, 5.04400634765625, 5.2772216796875, 5.51043701171875, 5.74365234375, 5.97686767578125, 6.2100830078125, 6.44329833984375, 6.676513671875, 6.90972900390625, 7.1429443359375, 7.37615966796875, 7.609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 13.0, 21.0, 29.0, 44.0, 74.0, 134.0, 273.0, 500.0, 1060.0, 2578.0, 7634.0, 28102.0, 147204.0, 604107.0, 205183.0, 36458.0, 9393.0, 3234.0, 1274.0, 559.0, 304.0, 151.0, 84.0, 46.0, 30.0, 15.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.677734375, -3.56488037109375, -3.4520263671875, -3.33917236328125, -3.226318359375, -3.11346435546875, -3.0006103515625, -2.88775634765625, -2.77490234375, -2.66204833984375, -2.5491943359375, -2.43634033203125, -2.323486328125, -2.21063232421875, -2.0977783203125, -1.98492431640625, -1.8720703125, -1.75921630859375, -1.6463623046875, -1.53350830078125, -1.420654296875, -1.30780029296875, -1.1949462890625, -1.08209228515625, -0.96923828125, -0.85638427734375, -0.7435302734375, -0.63067626953125, -0.517822265625, -0.40496826171875, -0.2921142578125, -0.17926025390625, -0.06640625, 0.04644775390625, 0.1593017578125, 0.27215576171875, 0.385009765625, 0.49786376953125, 0.6107177734375, 0.72357177734375, 0.83642578125, 0.94927978515625, 1.0621337890625, 1.17498779296875, 1.287841796875, 1.40069580078125, 1.5135498046875, 1.62640380859375, 1.7392578125, 1.85211181640625, 1.9649658203125, 2.07781982421875, 2.190673828125, 2.30352783203125, 2.4163818359375, 2.52923583984375, 2.64208984375, 2.75494384765625, 2.8677978515625, 2.98065185546875, 3.093505859375, 3.20635986328125, 3.3192138671875, 3.43206787109375, 3.544921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 8.0, 9.0, 9.0, 12.0, 22.0, 23.0, 32.0, 45.0, 60.0, 76.0, 110.0, 113.0, 102.0, 84.0, 72.0, 49.0, 43.0, 30.0, 26.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00079345703125, -0.0007698088884353638, -0.0007461607456207275, -0.0007225126028060913, -0.0006988644599914551, -0.0006752163171768188, -0.0006515681743621826, -0.0006279200315475464, -0.0006042718887329102, -0.0005806237459182739, -0.0005569756031036377, -0.0005333274602890015, -0.0005096793174743652, -0.000486031174659729, -0.0004623830318450928, -0.00043873488903045654, -0.0004150867462158203, -0.0003914386034011841, -0.00036779046058654785, -0.0003441423177719116, -0.0003204941749572754, -0.00029684603214263916, -0.00027319788932800293, -0.0002495497465133667, -0.00022590160369873047, -0.00020225346088409424, -0.000178605318069458, -0.00015495717525482178, -0.00013130903244018555, -0.00010766088962554932, -8.401274681091309e-05, -6.0364603996276855e-05, -3.6716461181640625e-05, -1.3068318367004395e-05, 1.0579824447631836e-05, 3.4227967262268066e-05, 5.78761100769043e-05, 8.152425289154053e-05, 0.00010517239570617676, 0.000128820538520813, 0.00015246868133544922, 0.00017611682415008545, 0.00019976496696472168, 0.0002234131097793579, 0.00024706125259399414, 0.00027070939540863037, 0.0002943575382232666, 0.00031800568103790283, 0.00034165382385253906, 0.0003653019666671753, 0.0003889501094818115, 0.00041259825229644775, 0.000436246395111084, 0.0004598945379257202, 0.00048354268074035645, 0.0005071908235549927, 0.0005308389663696289, 0.0005544871091842651, 0.0005781352519989014, 0.0006017833948135376, 0.0006254315376281738, 0.0006490796804428101, 0.0006727278232574463, 0.0006963759660720825, 0.0007200241088867188]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 21.0, 34.0, 53.0, 79.0, 139.0, 282.0, 557.0, 1410.0, 4586.0, 21904.0, 240558.0, 691339.0, 73082.0, 10099.0, 2618.0, 921.0, 390.0, 180.0, 113.0, 53.0, 41.0, 18.0, 22.0, 10.0, 7.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9921875, -5.8314208984375, -5.670654296875, -5.5098876953125, -5.34912109375, -5.1883544921875, -5.027587890625, -4.8668212890625, -4.7060546875, -4.5452880859375, -4.384521484375, -4.2237548828125, -4.06298828125, -3.9022216796875, -3.741455078125, -3.5806884765625, -3.419921875, -3.2591552734375, -3.098388671875, -2.9376220703125, -2.77685546875, -2.6160888671875, -2.455322265625, -2.2945556640625, -2.1337890625, -1.9730224609375, -1.812255859375, -1.6514892578125, -1.49072265625, -1.3299560546875, -1.169189453125, -1.0084228515625, -0.84765625, -0.6868896484375, -0.526123046875, -0.3653564453125, -0.20458984375, -0.0438232421875, 0.116943359375, 0.2777099609375, 0.4384765625, 0.5992431640625, 0.760009765625, 0.9207763671875, 1.08154296875, 1.2423095703125, 1.403076171875, 1.5638427734375, 1.724609375, 1.8853759765625, 2.046142578125, 2.2069091796875, 2.36767578125, 2.5284423828125, 2.689208984375, 2.8499755859375, 3.0107421875, 3.1715087890625, 3.332275390625, 3.4930419921875, 3.65380859375, 3.8145751953125, 3.975341796875, 4.1361083984375, 4.296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 10.0, 6.0, 6.0, 13.0, 15.0, 14.0, 26.0, 20.0, 46.0, 39.0, 56.0, 56.0, 73.0, 66.0, 61.0, 75.0, 65.0, 56.0, 57.0, 36.0, 37.0, 37.0, 32.0, 18.0, 16.0, 14.0, 10.0, 6.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98095703125, -1.9013671875, -1.82177734375, -1.7421875, -1.66259765625, -1.5830078125, -1.50341796875, -1.423828125, -1.34423828125, -1.2646484375, -1.18505859375, -1.10546875, -1.02587890625, -0.9462890625, -0.86669921875, -0.787109375, -0.70751953125, -0.6279296875, -0.54833984375, -0.46875, -0.38916015625, -0.3095703125, -0.22998046875, -0.150390625, -0.07080078125, 0.0087890625, 0.08837890625, 0.16796875, 0.24755859375, 0.3271484375, 0.40673828125, 0.486328125, 0.56591796875, 0.6455078125, 0.72509765625, 0.8046875, 0.88427734375, 0.9638671875, 1.04345703125, 1.123046875, 1.20263671875, 1.2822265625, 1.36181640625, 1.44140625, 1.52099609375, 1.6005859375, 1.68017578125, 1.759765625, 1.83935546875, 1.9189453125, 1.99853515625, 2.078125, 2.15771484375, 2.2373046875, 2.31689453125, 2.396484375, 2.47607421875, 2.5556640625, 2.63525390625, 2.71484375, 2.79443359375, 2.8740234375, 2.95361328125, 3.033203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 17.0, 25.0, 42.0, 78.0, 94.0, 124.0, 147.0, 120.0, 113.0, 71.0, 66.0, 31.0, 25.0, 9.0, 9.0, 6.0, 2.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.62795639038086, -59.896305084228516, -58.16465377807617, -56.43300247192383, -54.70135498046875, -52.969703674316406, -51.23805236816406, -49.50640106201172, -47.774749755859375, -46.04309844970703, -44.31144714355469, -42.579795837402344, -40.84814453125, -39.116493225097656, -37.38484573364258, -35.653194427490234, -33.92154312133789, -32.18989181518555, -30.458240509033203, -28.726591110229492, -26.99493980407715, -25.263288497924805, -23.531639099121094, -21.79998779296875, -20.068336486816406, -18.336685180664062, -16.60503387451172, -14.873384475708008, -13.141733169555664, -11.41008186340332, -9.678431510925293, -7.946781158447266, -6.2151336669921875, -4.483482837677002, -2.7518320083618164, -1.0201811790466309, 0.7114696502685547, 2.4431209564208984, 4.174771308898926, 5.906421661376953, 7.638072967529297, 9.36972427368164, 11.101374626159668, 12.833024978637695, 14.564676284790039, 16.296327590942383, 18.027976989746094, 19.759628295898438, 21.49127960205078, 23.222930908203125, 24.95458221435547, 26.68623161315918, 28.417882919311523, 30.149534225463867, 31.881183624267578, 33.61283493041992, 35.344486236572266, 37.07613754272461, 38.80778884887695, 40.5394401550293, 42.271087646484375, 44.00273895263672, 45.73439025878906, 47.466041564941406, 49.19769287109375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 9.0, 13.0, 27.0, 18.0, 27.0, 17.0, 41.0, 47.0, 33.0, 31.0, 42.0, 50.0, 56.0, 55.0, 59.0, 49.0, 62.0, 46.0, 31.0, 28.0, 30.0, 27.0, 29.0, 28.0, 17.0, 21.0, 17.0, 11.0, 7.0, 7.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.503570556640625, -43.09716033935547, -41.69075393676758, -40.28434371948242, -38.87793731689453, -37.471527099609375, -36.06511688232422, -34.65871047973633, -33.25230026245117, -31.84589195251465, -30.439483642578125, -29.03307342529297, -27.626665115356445, -26.220256805419922, -24.8138484954834, -23.407440185546875, -22.00103187561035, -20.594623565673828, -19.188215255737305, -17.78180694580078, -16.375396728515625, -14.968988418579102, -13.562580108642578, -12.156170845031738, -10.749762535095215, -9.343354225158691, -7.936944961547852, -6.530536651611328, -5.1241278648376465, -3.717719078063965, -2.3113107681274414, -0.9049015045166016, 0.5015068054199219, 1.907915472984314, 3.314324140548706, 4.720732688903809, 6.12714147567749, 7.533550262451172, 8.939958572387695, 10.346367835998535, 11.752776145935059, 13.159184455871582, 14.565593719482422, 15.972002029418945, 17.37841033935547, 18.784820556640625, 20.191226959228516, 21.597637176513672, 23.004045486450195, 24.41045379638672, 25.816862106323242, 27.223270416259766, 28.629680633544922, 30.036088943481445, 31.44249725341797, 32.848907470703125, 34.255313873291016, 35.66172409057617, 37.06813049316406, 38.47454071044922, 39.88094711303711, 41.287357330322266, 42.693763732910156, 44.10017395019531, 45.50658416748047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 14.0, 21.0, 41.0, 56.0, 100.0, 178.0, 321.0, 716.0, 1782.0, 6294.0, 55760.0, 4103617.0, 19271.0, 3727.0, 1254.0, 526.0, 265.0, 150.0, 72.0, 39.0, 28.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.14111328125, -14.6416015625, -14.14208984375, -13.642578125, -13.14306640625, -12.6435546875, -12.14404296875, -11.64453125, -11.14501953125, -10.6455078125, -10.14599609375, -9.646484375, -9.14697265625, -8.6474609375, -8.14794921875, -7.6484375, -7.14892578125, -6.6494140625, -6.14990234375, -5.650390625, -5.15087890625, -4.6513671875, -4.15185546875, -3.65234375, -3.15283203125, -2.6533203125, -2.15380859375, -1.654296875, -1.15478515625, -0.6552734375, -0.15576171875, 0.34375, 0.84326171875, 1.3427734375, 1.84228515625, 2.341796875, 2.84130859375, 3.3408203125, 3.84033203125, 4.33984375, 4.83935546875, 5.3388671875, 5.83837890625, 6.337890625, 6.83740234375, 7.3369140625, 7.83642578125, 8.3359375, 8.83544921875, 9.3349609375, 9.83447265625, 10.333984375, 10.83349609375, 11.3330078125, 11.83251953125, 12.33203125, 12.83154296875, 13.3310546875, 13.83056640625, 14.330078125, 14.82958984375, 15.3291015625, 15.82861328125, 16.328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 8.0, 21.0, 13.0, 26.0, 32.0, 42.0, 47.0, 53.0, 26.0, 46.0, 55.0, 64.0, 61.0, 51.0, 43.0, 50.0, 50.0, 44.0, 50.0, 29.0, 27.0, 26.0, 34.0, 15.0, 19.0, 11.0, 11.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.880859375, -1.82232666015625, -1.7637939453125, -1.70526123046875, -1.646728515625, -1.58819580078125, -1.5296630859375, -1.47113037109375, -1.41259765625, -1.35406494140625, -1.2955322265625, -1.23699951171875, -1.178466796875, -1.11993408203125, -1.0614013671875, -1.00286865234375, -0.9443359375, -0.88580322265625, -0.8272705078125, -0.76873779296875, -0.710205078125, -0.65167236328125, -0.5931396484375, -0.53460693359375, -0.47607421875, -0.41754150390625, -0.3590087890625, -0.30047607421875, -0.241943359375, -0.18341064453125, -0.1248779296875, -0.06634521484375, -0.0078125, 0.05072021484375, 0.1092529296875, 0.16778564453125, 0.226318359375, 0.28485107421875, 0.3433837890625, 0.40191650390625, 0.46044921875, 0.51898193359375, 0.5775146484375, 0.63604736328125, 0.694580078125, 0.75311279296875, 0.8116455078125, 0.87017822265625, 0.9287109375, 0.98724365234375, 1.0457763671875, 1.10430908203125, 1.162841796875, 1.22137451171875, 1.2799072265625, 1.33843994140625, 1.39697265625, 1.45550537109375, 1.5140380859375, 1.57257080078125, 1.631103515625, 1.68963623046875, 1.7481689453125, 1.80670166015625, 1.865234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 10.0, 20.0, 26.0, 26.0, 44.0, 59.0, 72.0, 103.0, 122.0, 183.0, 252.0, 371.0, 577.0, 1022.0, 1742.0, 3686.0, 8743.0, 27661.0, 260649.0, 3819073.0, 46848.0, 12580.0, 4768.0, 2200.0, 1217.0, 690.0, 429.0, 314.0, 218.0, 143.0, 106.0, 72.0, 55.0, 39.0, 37.0, 19.0, 24.0, 15.0, 11.0, 6.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.26171875, -6.04705810546875, -5.8323974609375, -5.61773681640625, -5.403076171875, -5.18841552734375, -4.9737548828125, -4.75909423828125, -4.54443359375, -4.32977294921875, -4.1151123046875, -3.90045166015625, -3.685791015625, -3.47113037109375, -3.2564697265625, -3.04180908203125, -2.8271484375, -2.61248779296875, -2.3978271484375, -2.18316650390625, -1.968505859375, -1.75384521484375, -1.5391845703125, -1.32452392578125, -1.10986328125, -0.89520263671875, -0.6805419921875, -0.46588134765625, -0.251220703125, -0.03656005859375, 0.1781005859375, 0.39276123046875, 0.607421875, 0.82208251953125, 1.0367431640625, 1.25140380859375, 1.466064453125, 1.68072509765625, 1.8953857421875, 2.11004638671875, 2.32470703125, 2.53936767578125, 2.7540283203125, 2.96868896484375, 3.183349609375, 3.39801025390625, 3.6126708984375, 3.82733154296875, 4.0419921875, 4.25665283203125, 4.4713134765625, 4.68597412109375, 4.900634765625, 5.11529541015625, 5.3299560546875, 5.54461669921875, 5.75927734375, 5.97393798828125, 6.1885986328125, 6.40325927734375, 6.617919921875, 6.83258056640625, 7.0472412109375, 7.26190185546875, 7.4765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 34.0, 99.0, 364.0, 3151.0, 173.0, 60.0, 32.0, 23.0, 10.0, 10.0, 10.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.248504638671875, -1.19232177734375, -1.136138916015625, -1.0799560546875, -1.023773193359375, -0.96759033203125, -0.911407470703125, -0.855224609375, -0.799041748046875, -0.74285888671875, -0.686676025390625, -0.6304931640625, -0.574310302734375, -0.51812744140625, -0.461944580078125, -0.40576171875, -0.349578857421875, -0.29339599609375, -0.237213134765625, -0.1810302734375, -0.124847412109375, -0.06866455078125, -0.012481689453125, 0.043701171875, 0.099884033203125, 0.15606689453125, 0.212249755859375, 0.2684326171875, 0.324615478515625, 0.38079833984375, 0.436981201171875, 0.4931640625, 0.549346923828125, 0.60552978515625, 0.661712646484375, 0.7178955078125, 0.774078369140625, 0.83026123046875, 0.886444091796875, 0.942626953125, 0.998809814453125, 1.05499267578125, 1.111175537109375, 1.1673583984375, 1.223541259765625, 1.27972412109375, 1.335906982421875, 1.39208984375, 1.448272705078125, 1.50445556640625, 1.560638427734375, 1.6168212890625, 1.673004150390625, 1.72918701171875, 1.785369873046875, 1.841552734375, 1.897735595703125, 1.95391845703125, 2.010101318359375, 2.0662841796875, 2.122467041015625, 2.17864990234375, 2.234832763671875, 2.291015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 24.0, 18.0, 35.0, 62.0, 88.0, 94.0, 125.0, 121.0, 112.0, 102.0, 67.0, 53.0, 23.0, 17.0, 15.0, 18.0, 10.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.574706077575684, -8.327876091003418, -8.081045150756836, -7.83421516418457, -7.587385177612305, -7.340554714202881, -7.093724250793457, -6.846894264221191, -6.600064277648926, -6.353233814239502, -6.106403827667236, -5.8595733642578125, -5.612743377685547, -5.365912914276123, -5.119082450866699, -4.872252464294434, -4.62542200088501, -4.378591537475586, -4.13176155090332, -3.8849310874938965, -3.638101100921631, -3.391270637512207, -3.1444404125213623, -2.8976101875305176, -2.650779962539673, -2.403949737548828, -2.1571195125579834, -1.9102891683578491, -1.6634589433670044, -1.4166287183761597, -1.1697983741760254, -0.9229681491851807, -0.6761379241943359, -0.4293076694011688, -0.1824774146080017, 0.06435286998748779, 0.3111830949783325, 0.5580133199691772, 0.8048436641693115, 1.0516738891601562, 1.298504114151001, 1.5453343391418457, 1.7921645641326904, 2.038994789123535, 2.285825252532959, 2.5326552391052246, 2.7794857025146484, 3.026315927505493, 3.273146152496338, 3.5199763774871826, 3.7668066024780273, 4.013637065887451, 4.260467052459717, 4.507297515869141, 4.754127502441406, 5.00095796585083, 5.247788429260254, 5.494618892669678, 5.741448879241943, 5.988279342651367, 6.235109329223633, 6.481939792633057, 6.7287702560424805, 6.975600242614746, 7.222430229187012]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 15.0, 15.0, 16.0, 24.0, 17.0, 27.0, 35.0, 35.0, 45.0, 28.0, 37.0, 49.0, 48.0, 42.0, 42.0, 41.0, 41.0, 46.0, 41.0, 38.0, 41.0, 21.0, 34.0, 39.0, 34.0, 25.0, 22.0, 17.0, 13.0, 6.0, 7.0, 12.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.112955093383789, -3.997013568878174, -3.8810720443725586, -3.7651305198669434, -3.6491892337799072, -3.533247709274292, -3.4173061847686768, -3.3013646602630615, -3.1854231357574463, -3.069481611251831, -2.953540086746216, -2.8375988006591797, -2.7216572761535645, -2.605715751647949, -2.489774227142334, -2.3738327026367188, -2.2578911781311035, -2.1419496536254883, -2.026008129119873, -1.9100667238235474, -1.7941251993179321, -1.6781837940216064, -1.5622422695159912, -1.446300745010376, -1.3303594589233398, -1.2144179344177246, -1.098476529121399, -0.9825350046157837, -0.8665934801101685, -0.750652015209198, -0.6347105503082275, -0.5187690258026123, -0.40282750129699707, -0.2868860065937042, -0.17094452679157257, -0.05500304698944092, 0.06093844771385193, 0.17687994241714478, 0.29282140731811523, 0.40876293182373047, 0.5247043967247009, 0.6406458616256714, 0.7565873861312866, 0.8725288510322571, 0.9884703159332275, 1.1044118404388428, 1.220353364944458, 1.3362948894500732, 1.452236294746399, 1.5681778192520142, 1.6841192245483398, 1.800060749053955, 1.9160022735595703, 2.0319437980651855, 2.147885322570801, 2.263826847076416, 2.379768133163452, 2.4957096576690674, 2.6116511821746826, 2.7275924682617188, 2.843533992767334, 2.959475517272949, 3.0754170417785645, 3.1913585662841797, 3.307300090789795]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 42.0, 74.0, 119.0, 202.0, 324.0, 641.0, 1262.0, 2333.0, 4979.0, 11450.0, 29618.0, 85347.0, 245795.0, 376364.0, 186541.0, 63356.0, 22754.0, 9091.0, 4023.0, 1928.0, 962.0, 540.0, 309.0, 157.0, 88.0, 61.0, 42.0, 19.0, 21.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.1640625, -4.03924560546875, -3.9144287109375, -3.78961181640625, -3.664794921875, -3.53997802734375, -3.4151611328125, -3.29034423828125, -3.16552734375, -3.04071044921875, -2.9158935546875, -2.79107666015625, -2.666259765625, -2.54144287109375, -2.4166259765625, -2.29180908203125, -2.1669921875, -2.04217529296875, -1.9173583984375, -1.79254150390625, -1.667724609375, -1.54290771484375, -1.4180908203125, -1.29327392578125, -1.16845703125, -1.04364013671875, -0.9188232421875, -0.79400634765625, -0.669189453125, -0.54437255859375, -0.4195556640625, -0.29473876953125, -0.169921875, -0.04510498046875, 0.0797119140625, 0.20452880859375, 0.329345703125, 0.45416259765625, 0.5789794921875, 0.70379638671875, 0.82861328125, 0.95343017578125, 1.0782470703125, 1.20306396484375, 1.327880859375, 1.45269775390625, 1.5775146484375, 1.70233154296875, 1.8271484375, 1.95196533203125, 2.0767822265625, 2.20159912109375, 2.326416015625, 2.45123291015625, 2.5760498046875, 2.70086669921875, 2.82568359375, 2.95050048828125, 3.0753173828125, 3.20013427734375, 3.324951171875, 3.44976806640625, 3.5745849609375, 3.69940185546875, 3.82421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 13.0, 15.0, 20.0, 21.0, 22.0, 33.0, 39.0, 30.0, 51.0, 45.0, 41.0, 51.0, 49.0, 59.0, 47.0, 66.0, 58.0, 48.0, 49.0, 36.0, 39.0, 25.0, 35.0, 24.0, 18.0, 16.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.7986907958984375, -1.737030029296875, -1.6753692626953125, -1.61370849609375, -1.5520477294921875, -1.490386962890625, -1.4287261962890625, -1.3670654296875, -1.3054046630859375, -1.243743896484375, -1.1820831298828125, -1.12042236328125, -1.0587615966796875, -0.997100830078125, -0.9354400634765625, -0.873779296875, -0.8121185302734375, -0.750457763671875, -0.6887969970703125, -0.62713623046875, -0.5654754638671875, -0.503814697265625, -0.4421539306640625, -0.3804931640625, -0.3188323974609375, -0.257171630859375, -0.1955108642578125, -0.13385009765625, -0.0721893310546875, -0.010528564453125, 0.0511322021484375, 0.11279296875, 0.1744537353515625, 0.236114501953125, 0.2977752685546875, 0.35943603515625, 0.4210968017578125, 0.482757568359375, 0.5444183349609375, 0.6060791015625, 0.6677398681640625, 0.729400634765625, 0.7910614013671875, 0.85272216796875, 0.9143829345703125, 0.976043701171875, 1.0377044677734375, 1.099365234375, 1.1610260009765625, 1.222686767578125, 1.2843475341796875, 1.34600830078125, 1.4076690673828125, 1.469329833984375, 1.5309906005859375, 1.5926513671875, 1.6543121337890625, 1.715972900390625, 1.7776336669921875, 1.83929443359375, 1.9009552001953125, 1.962615966796875, 2.0242767333984375, 2.0859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 10.0, 12.0, 15.0, 26.0, 25.0, 35.0, 53.0, 83.0, 125.0, 209.0, 316.0, 500.0, 923.0, 2045.0, 5785.0, 27246.0, 292348.0, 642134.0, 60904.0, 9901.0, 2939.0, 1311.0, 578.0, 392.0, 225.0, 122.0, 95.0, 45.0, 51.0, 25.0, 15.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.796875, -7.56884765625, -7.3408203125, -7.11279296875, -6.884765625, -6.65673828125, -6.4287109375, -6.20068359375, -5.97265625, -5.74462890625, -5.5166015625, -5.28857421875, -5.060546875, -4.83251953125, -4.6044921875, -4.37646484375, -4.1484375, -3.92041015625, -3.6923828125, -3.46435546875, -3.236328125, -3.00830078125, -2.7802734375, -2.55224609375, -2.32421875, -2.09619140625, -1.8681640625, -1.64013671875, -1.412109375, -1.18408203125, -0.9560546875, -0.72802734375, -0.5, -0.27197265625, -0.0439453125, 0.18408203125, 0.412109375, 0.64013671875, 0.8681640625, 1.09619140625, 1.32421875, 1.55224609375, 1.7802734375, 2.00830078125, 2.236328125, 2.46435546875, 2.6923828125, 2.92041015625, 3.1484375, 3.37646484375, 3.6044921875, 3.83251953125, 4.060546875, 4.28857421875, 4.5166015625, 4.74462890625, 4.97265625, 5.20068359375, 5.4287109375, 5.65673828125, 5.884765625, 6.11279296875, 6.3408203125, 6.56884765625, 6.796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 8.0, 14.0, 14.0, 12.0, 12.0, 12.0, 27.0, 22.0, 29.0, 25.0, 29.0, 39.0, 44.0, 46.0, 39.0, 47.0, 56.0, 42.0, 61.0, 51.0, 47.0, 40.0, 44.0, 44.0, 37.0, 34.0, 27.0, 17.0, 13.0, 17.0, 7.0, 12.0, 14.0, 1.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.28948974609375, -8.0399169921875, -7.79034423828125, -7.540771484375, -7.29119873046875, -7.0416259765625, -6.79205322265625, -6.54248046875, -6.29290771484375, -6.0433349609375, -5.79376220703125, -5.544189453125, -5.29461669921875, -5.0450439453125, -4.79547119140625, -4.5458984375, -4.29632568359375, -4.0467529296875, -3.79718017578125, -3.547607421875, -3.29803466796875, -3.0484619140625, -2.79888916015625, -2.54931640625, -2.29974365234375, -2.0501708984375, -1.80059814453125, -1.551025390625, -1.30145263671875, -1.0518798828125, -0.80230712890625, -0.552734375, -0.30316162109375, -0.0535888671875, 0.19598388671875, 0.445556640625, 0.69512939453125, 0.9447021484375, 1.19427490234375, 1.44384765625, 1.69342041015625, 1.9429931640625, 2.19256591796875, 2.442138671875, 2.69171142578125, 2.9412841796875, 3.19085693359375, 3.4404296875, 3.69000244140625, 3.9395751953125, 4.18914794921875, 4.438720703125, 4.68829345703125, 4.9378662109375, 5.18743896484375, 5.43701171875, 5.68658447265625, 5.9361572265625, 6.18572998046875, 6.435302734375, 6.68487548828125, 6.9344482421875, 7.18402099609375, 7.43359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 5.0, 14.0, 31.0, 27.0, 38.0, 61.0, 81.0, 157.0, 310.0, 660.0, 1674.0, 5768.0, 31078.0, 315974.0, 615924.0, 63387.0, 9187.0, 2300.0, 900.0, 426.0, 192.0, 106.0, 61.0, 53.0, 37.0, 23.0, 14.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.80078125, -3.67047119140625, -3.5401611328125, -3.40985107421875, -3.279541015625, -3.14923095703125, -3.0189208984375, -2.88861083984375, -2.75830078125, -2.62799072265625, -2.4976806640625, -2.36737060546875, -2.237060546875, -2.10675048828125, -1.9764404296875, -1.84613037109375, -1.7158203125, -1.58551025390625, -1.4552001953125, -1.32489013671875, -1.194580078125, -1.06427001953125, -0.9339599609375, -0.80364990234375, -0.67333984375, -0.54302978515625, -0.4127197265625, -0.28240966796875, -0.152099609375, -0.02178955078125, 0.1085205078125, 0.23883056640625, 0.369140625, 0.49945068359375, 0.6297607421875, 0.76007080078125, 0.890380859375, 1.02069091796875, 1.1510009765625, 1.28131103515625, 1.41162109375, 1.54193115234375, 1.6722412109375, 1.80255126953125, 1.932861328125, 2.06317138671875, 2.1934814453125, 2.32379150390625, 2.4541015625, 2.58441162109375, 2.7147216796875, 2.84503173828125, 2.975341796875, 3.10565185546875, 3.2359619140625, 3.36627197265625, 3.49658203125, 3.62689208984375, 3.7572021484375, 3.88751220703125, 4.017822265625, 4.14813232421875, 4.2784423828125, 4.40875244140625, 4.5390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 15.0, 18.0, 26.0, 17.0, 28.0, 27.0, 53.0, 51.0, 80.0, 75.0, 89.0, 85.0, 75.0, 63.0, 56.0, 44.0, 35.0, 14.0, 25.0, 15.0, 14.0, 10.0, 10.0, 15.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005002021789550781, -0.00048532336950302124, -0.00047044456005096436, -0.00045556575059890747, -0.0004406869411468506, -0.0004258081316947937, -0.0004109293222427368, -0.00039605051279067993, -0.00038117170333862305, -0.00036629289388656616, -0.0003514140844345093, -0.0003365352749824524, -0.0003216564655303955, -0.0003067776560783386, -0.00029189884662628174, -0.00027702003717422485, -0.00026214122772216797, -0.0002472624182701111, -0.0002323836088180542, -0.00021750479936599731, -0.00020262598991394043, -0.00018774718046188354, -0.00017286837100982666, -0.00015798956155776978, -0.0001431107521057129, -0.000128231942653656, -0.00011335313320159912, -9.847432374954224e-05, -8.359551429748535e-05, -6.871670484542847e-05, -5.383789539337158e-05, -3.89590859413147e-05, -2.4080276489257812e-05, -9.201467037200928e-06, 5.677342414855957e-06, 2.0556151866912842e-05, 3.5434961318969727e-05, 5.031377077102661e-05, 6.51925802230835e-05, 8.007138967514038e-05, 9.495019912719727e-05, 0.00010982900857925415, 0.00012470781803131104, 0.00013958662748336792, 0.0001544654369354248, 0.0001693442463874817, 0.00018422305583953857, 0.00019910186529159546, 0.00021398067474365234, 0.00022885948419570923, 0.0002437382936477661, 0.000258617103099823, 0.0002734959125518799, 0.00028837472200393677, 0.00030325353145599365, 0.00031813234090805054, 0.0003330111503601074, 0.0003478899598121643, 0.0003627687692642212, 0.0003776475787162781, 0.00039252638816833496, 0.00040740519762039185, 0.00042228400707244873, 0.0004371628165245056, 0.0004520416259765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 9.0, 9.0, 15.0, 20.0, 30.0, 56.0, 84.0, 174.0, 372.0, 1201.0, 5894.0, 111012.0, 883976.0, 40511.0, 3634.0, 881.0, 325.0, 152.0, 71.0, 50.0, 25.0, 16.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.9432373046875, -6.714599609375, -6.4859619140625, -6.25732421875, -6.0286865234375, -5.800048828125, -5.5714111328125, -5.3427734375, -5.1141357421875, -4.885498046875, -4.6568603515625, -4.42822265625, -4.1995849609375, -3.970947265625, -3.7423095703125, -3.513671875, -3.2850341796875, -3.056396484375, -2.8277587890625, -2.59912109375, -2.3704833984375, -2.141845703125, -1.9132080078125, -1.6845703125, -1.4559326171875, -1.227294921875, -0.9986572265625, -0.77001953125, -0.5413818359375, -0.312744140625, -0.0841064453125, 0.14453125, 0.3731689453125, 0.601806640625, 0.8304443359375, 1.05908203125, 1.2877197265625, 1.516357421875, 1.7449951171875, 1.9736328125, 2.2022705078125, 2.430908203125, 2.6595458984375, 2.88818359375, 3.1168212890625, 3.345458984375, 3.5740966796875, 3.802734375, 4.0313720703125, 4.260009765625, 4.4886474609375, 4.71728515625, 4.9459228515625, 5.174560546875, 5.4031982421875, 5.6318359375, 5.8604736328125, 6.089111328125, 6.3177490234375, 6.54638671875, 6.7750244140625, 7.003662109375, 7.2322998046875, 7.4609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 7.0, 20.0, 27.0, 25.0, 44.0, 49.0, 54.0, 57.0, 68.0, 71.0, 71.0, 62.0, 64.0, 62.0, 65.0, 44.0, 38.0, 32.0, 28.0, 16.0, 14.0, 15.0, 8.0, 6.0, 3.0, 8.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.10546875, -2.029296875, -1.953125, -1.876953125, -1.80078125, -1.724609375, -1.6484375, -1.572265625, -1.49609375, -1.419921875, -1.34375, -1.267578125, -1.19140625, -1.115234375, -1.0390625, -0.962890625, -0.88671875, -0.810546875, -0.734375, -0.658203125, -0.58203125, -0.505859375, -0.4296875, -0.353515625, -0.27734375, -0.201171875, -0.125, -0.048828125, 0.02734375, 0.103515625, 0.1796875, 0.255859375, 0.33203125, 0.408203125, 0.484375, 0.560546875, 0.63671875, 0.712890625, 0.7890625, 0.865234375, 0.94140625, 1.017578125, 1.09375, 1.169921875, 1.24609375, 1.322265625, 1.3984375, 1.474609375, 1.55078125, 1.626953125, 1.703125, 1.779296875, 1.85546875, 1.931640625, 2.0078125, 2.083984375, 2.16015625, 2.236328125, 2.3125, 2.388671875, 2.46484375, 2.541015625, 2.6171875, 2.693359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 9.0, 14.0, 22.0, 42.0, 78.0, 112.0, 167.0, 169.0, 161.0, 95.0, 62.0, 38.0, 19.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-80.1387710571289, -78.24723815917969, -76.35569763183594, -74.46415710449219, -72.57262420654297, -70.68109130859375, -68.78955078125, -66.89801025390625, -65.00647735595703, -63.11494064331055, -61.22340393066406, -59.33186721801758, -57.440330505371094, -55.54879379272461, -53.657257080078125, -51.76572036743164, -49.874183654785156, -47.98264694213867, -46.09111022949219, -44.1995735168457, -42.30803680419922, -40.416500091552734, -38.52496337890625, -36.633426666259766, -34.74188995361328, -32.8503532409668, -30.958816528320312, -29.067279815673828, -27.175743103027344, -25.28420639038086, -23.392669677734375, -21.50113296508789, -19.609596252441406, -17.718059539794922, -15.826522827148438, -13.934986114501953, -12.043449401855469, -10.151912689208984, -8.2603759765625, -6.368839263916016, -4.477302551269531, -2.585765838623047, -0.6942291259765625, 1.1973075866699219, 3.0888442993164062, 4.980381011962891, 6.871917724609375, 8.76345443725586, 10.654991149902344, 12.546527862548828, 14.438064575195312, 16.329601287841797, 18.22113800048828, 20.112674713134766, 22.00421142578125, 23.895748138427734, 25.78728485107422, 27.678821563720703, 29.570358276367188, 31.461894989013672, 33.353431701660156, 35.24496841430664, 37.136505126953125, 39.02804183959961, 40.919578552246094]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 13.0, 25.0, 23.0, 22.0, 28.0, 37.0, 32.0, 40.0, 44.0, 51.0, 56.0, 57.0, 50.0, 44.0, 55.0, 39.0, 40.0, 31.0, 38.0, 34.0, 31.0, 23.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.078405380249023, -30.00717544555664, -28.935945510864258, -27.864715576171875, -26.79348373413086, -25.72225570678711, -24.651023864746094, -23.57979393005371, -22.508563995361328, -21.437334060668945, -20.366104125976562, -19.29487419128418, -18.223644256591797, -17.15241241455078, -16.0811824798584, -15.009952545166016, -13.938722610473633, -12.86749267578125, -11.796262741088867, -10.725031852722168, -9.653801918029785, -8.582571983337402, -7.511341571807861, -6.44011116027832, -5.3688812255859375, -4.297651290893555, -3.2264208793640137, -2.1551907062530518, -1.0839605331420898, -0.012730598449707031, 1.058499813079834, 2.129730224609375, 3.2009620666503906, 4.272192001342773, 5.3434224128723145, 6.4146528244018555, 7.485882759094238, 8.557112693786621, 9.62834358215332, 10.699573516845703, 11.770803451538086, 12.842033386230469, 13.913263320922852, 14.98449420928955, 16.05572509765625, 17.126953125, 18.198184967041016, 19.2694149017334, 20.34064483642578, 21.411874771118164, 22.483104705810547, 23.55433464050293, 24.625564575195312, 25.696796417236328, 26.76802635192871, 27.839256286621094, 28.910486221313477, 29.98171615600586, 31.052946090698242, 32.124176025390625, 33.19540786743164, 34.26663589477539, 35.337867736816406, 36.409095764160156, 37.48032760620117]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 22.0, 38.0, 88.0, 170.0, 253.0, 439.0, 833.0, 1843.0, 5771.0, 57627.0, 4110120.0, 11767.0, 2859.0, 1120.0, 564.0, 309.0, 175.0, 116.0, 61.0, 43.0, 21.0, 13.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.46044921875, -12.9833984375, -12.50634765625, -12.029296875, -11.55224609375, -11.0751953125, -10.59814453125, -10.12109375, -9.64404296875, -9.1669921875, -8.68994140625, -8.212890625, -7.73583984375, -7.2587890625, -6.78173828125, -6.3046875, -5.82763671875, -5.3505859375, -4.87353515625, -4.396484375, -3.91943359375, -3.4423828125, -2.96533203125, -2.48828125, -2.01123046875, -1.5341796875, -1.05712890625, -0.580078125, -0.10302734375, 0.3740234375, 0.85107421875, 1.328125, 1.80517578125, 2.2822265625, 2.75927734375, 3.236328125, 3.71337890625, 4.1904296875, 4.66748046875, 5.14453125, 5.62158203125, 6.0986328125, 6.57568359375, 7.052734375, 7.52978515625, 8.0068359375, 8.48388671875, 8.9609375, 9.43798828125, 9.9150390625, 10.39208984375, 10.869140625, 11.34619140625, 11.8232421875, 12.30029296875, 12.77734375, 13.25439453125, 13.7314453125, 14.20849609375, 14.685546875, 15.16259765625, 15.6396484375, 16.11669921875, 16.59375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 8.0, 17.0, 15.0, 24.0, 35.0, 32.0, 46.0, 39.0, 50.0, 41.0, 56.0, 53.0, 60.0, 62.0, 63.0, 55.0, 52.0, 49.0, 46.0, 36.0, 32.0, 18.0, 20.0, 16.0, 14.0, 13.0, 7.0, 7.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1328125, -2.066497802734375, -2.00018310546875, -1.933868408203125, -1.8675537109375, -1.801239013671875, -1.73492431640625, -1.668609619140625, -1.602294921875, -1.535980224609375, -1.46966552734375, -1.403350830078125, -1.3370361328125, -1.270721435546875, -1.20440673828125, -1.138092041015625, -1.07177734375, -1.005462646484375, -0.93914794921875, -0.872833251953125, -0.8065185546875, -0.740203857421875, -0.67388916015625, -0.607574462890625, -0.541259765625, -0.474945068359375, -0.40863037109375, -0.342315673828125, -0.2760009765625, -0.209686279296875, -0.14337158203125, -0.077056884765625, -0.0107421875, 0.055572509765625, 0.12188720703125, 0.188201904296875, 0.2545166015625, 0.320831298828125, 0.38714599609375, 0.453460693359375, 0.519775390625, 0.586090087890625, 0.65240478515625, 0.718719482421875, 0.7850341796875, 0.851348876953125, 0.91766357421875, 0.983978271484375, 1.05029296875, 1.116607666015625, 1.18292236328125, 1.249237060546875, 1.3155517578125, 1.381866455078125, 1.44818115234375, 1.514495849609375, 1.580810546875, 1.647125244140625, 1.71343994140625, 1.779754638671875, 1.8460693359375, 1.912384033203125, 1.97869873046875, 2.045013427734375, 2.111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 9.0, 10.0, 16.0, 24.0, 29.0, 34.0, 46.0, 88.0, 122.0, 176.0, 329.0, 619.0, 1123.0, 2358.0, 6967.0, 42662.0, 4081714.0, 45675.0, 7246.0, 2409.0, 1134.0, 597.0, 338.0, 189.0, 104.0, 62.0, 57.0, 40.0, 24.0, 13.0, 11.0, 10.0, 8.0, 6.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.9375, -11.6353759765625, -11.333251953125, -11.0311279296875, -10.72900390625, -10.4268798828125, -10.124755859375, -9.8226318359375, -9.5205078125, -9.2183837890625, -8.916259765625, -8.6141357421875, -8.31201171875, -8.0098876953125, -7.707763671875, -7.4056396484375, -7.103515625, -6.8013916015625, -6.499267578125, -6.1971435546875, -5.89501953125, -5.5928955078125, -5.290771484375, -4.9886474609375, -4.6865234375, -4.3843994140625, -4.082275390625, -3.7801513671875, -3.47802734375, -3.1759033203125, -2.873779296875, -2.5716552734375, -2.26953125, -1.9674072265625, -1.665283203125, -1.3631591796875, -1.06103515625, -0.7589111328125, -0.456787109375, -0.1546630859375, 0.1474609375, 0.4495849609375, 0.751708984375, 1.0538330078125, 1.35595703125, 1.6580810546875, 1.960205078125, 2.2623291015625, 2.564453125, 2.8665771484375, 3.168701171875, 3.4708251953125, 3.77294921875, 4.0750732421875, 4.377197265625, 4.6793212890625, 4.9814453125, 5.2835693359375, 5.585693359375, 5.8878173828125, 6.18994140625, 6.4920654296875, 6.794189453125, 7.0963134765625, 7.3984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 11.0, 19.0, 46.0, 161.0, 3553.0, 158.0, 39.0, 24.0, 19.0, 14.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.784088134765625, -2.71856689453125, -2.653045654296875, -2.5875244140625, -2.522003173828125, -2.45648193359375, -2.390960693359375, -2.325439453125, -2.259918212890625, -2.19439697265625, -2.128875732421875, -2.0633544921875, -1.997833251953125, -1.93231201171875, -1.866790771484375, -1.80126953125, -1.735748291015625, -1.67022705078125, -1.604705810546875, -1.5391845703125, -1.473663330078125, -1.40814208984375, -1.342620849609375, -1.277099609375, -1.211578369140625, -1.14605712890625, -1.080535888671875, -1.0150146484375, -0.949493408203125, -0.88397216796875, -0.818450927734375, -0.7529296875, -0.687408447265625, -0.62188720703125, -0.556365966796875, -0.4908447265625, -0.425323486328125, -0.35980224609375, -0.294281005859375, -0.228759765625, -0.163238525390625, -0.09771728515625, -0.032196044921875, 0.0333251953125, 0.098846435546875, 0.16436767578125, 0.229888916015625, 0.29541015625, 0.360931396484375, 0.42645263671875, 0.491973876953125, 0.5574951171875, 0.623016357421875, 0.68853759765625, 0.754058837890625, 0.819580078125, 0.885101318359375, 0.95062255859375, 1.016143798828125, 1.0816650390625, 1.147186279296875, 1.21270751953125, 1.278228759765625, 1.34375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 13.0, 28.0, 35.0, 56.0, 119.0, 153.0, 204.0, 167.0, 108.0, 52.0, 29.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.651954650878906, -7.372481346130371, -7.093008518218994, -6.813535213470459, -6.534062385559082, -6.254589080810547, -5.975115776062012, -5.695642948150635, -5.416170120239258, -5.136696815490723, -4.857223987579346, -4.5777506828308105, -4.298277854919434, -4.018804550170898, -3.7393314838409424, -3.4598584175109863, -3.180385112762451, -2.900912046432495, -2.621438980102539, -2.341965675354004, -2.062492847442627, -1.7830196619033813, -1.5035464763641357, -1.2240734100341797, -0.9446003437042236, -0.6651272773742676, -0.38565415143966675, -0.10618102550506592, 0.17329204082489014, 0.4527651071548462, 0.7322382926940918, 1.0117113590240479, 1.291184425354004, 1.57065749168396, 1.850130558013916, 2.129603862762451, 2.409076690673828, 2.6885499954223633, 2.9680230617523193, 3.2474961280822754, 3.5269691944122314, 3.8064422607421875, 4.085915565490723, 4.3653883934021, 4.644861698150635, 4.924334526062012, 5.203807830810547, 5.483281135559082, 5.762753963470459, 6.042227268218994, 6.321700096130371, 6.601173400878906, 6.880646228790283, 7.160119533538818, 7.439592361450195, 7.7190656661987305, 7.998538970947266, 8.2780122756958, 8.557485580444336, 8.836957931518555, 9.11643123626709, 9.395904541015625, 9.67537784576416, 9.954851150512695, 10.234323501586914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 3.0, 10.0, 5.0, 11.0, 9.0, 9.0, 11.0, 18.0, 21.0, 22.0, 22.0, 32.0, 27.0, 34.0, 36.0, 40.0, 40.0, 49.0, 47.0, 57.0, 47.0, 43.0, 46.0, 37.0, 43.0, 39.0, 32.0, 32.0, 28.0, 21.0, 23.0, 22.0, 18.0, 14.0, 9.0, 12.0, 3.0, 3.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-3.4852757453918457, -3.389942169189453, -3.2946088314056396, -3.199275255203247, -3.1039419174194336, -3.008608341217041, -2.9132747650146484, -2.817941188812256, -2.7226078510284424, -2.62727427482605, -2.5319409370422363, -2.4366073608398438, -2.341273784637451, -2.2459404468536377, -2.150606870651245, -2.0552735328674316, -1.959939956665039, -1.864606499671936, -1.769273042678833, -1.6739394664764404, -1.5786060094833374, -1.4832725524902344, -1.3879389762878418, -1.2926055192947388, -1.1972720623016357, -1.1019386053085327, -1.0066051483154297, -0.9112715721130371, -0.8159381151199341, -0.720604658126831, -0.6252711415290833, -0.5299376249313354, -0.4346041679382324, -0.339270681142807, -0.2439371943473816, -0.14860370755195618, -0.05327022075653076, 0.04206326603889465, 0.13739675283432007, 0.23273026943206787, 0.3280637264251709, 0.4233972132205963, 0.5187307000160217, 0.6140642166137695, 0.7093976736068726, 0.8047311305999756, 0.9000646471977234, 0.9953981637954712, 1.0907316207885742, 1.1860650777816772, 1.2813985347747803, 1.3767321109771729, 1.4720655679702759, 1.567399024963379, 1.6627326011657715, 1.7580660581588745, 1.8533995151519775, 1.9487329721450806, 2.0440664291381836, 2.139400005340576, 2.2347335815429688, 2.3300669193267822, 2.425400495529175, 2.5207338333129883, 2.616067409515381]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 7.0, 11.0, 19.0, 15.0, 26.0, 52.0, 64.0, 109.0, 160.0, 277.0, 437.0, 698.0, 1157.0, 2162.0, 3993.0, 7905.0, 17595.0, 41488.0, 104303.0, 262260.0, 338252.0, 157974.0, 61327.0, 24994.0, 11167.0, 5503.0, 2796.0, 1498.0, 848.0, 537.0, 313.0, 200.0, 138.0, 74.0, 59.0, 37.0, 28.0, 21.0, 17.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.533203125, -3.438262939453125, -3.34332275390625, -3.248382568359375, -3.1534423828125, -3.058502197265625, -2.96356201171875, -2.868621826171875, -2.773681640625, -2.678741455078125, -2.58380126953125, -2.488861083984375, -2.3939208984375, -2.298980712890625, -2.20404052734375, -2.109100341796875, -2.01416015625, -1.919219970703125, -1.82427978515625, -1.729339599609375, -1.6343994140625, -1.539459228515625, -1.44451904296875, -1.349578857421875, -1.254638671875, -1.159698486328125, -1.06475830078125, -0.969818115234375, -0.8748779296875, -0.779937744140625, -0.68499755859375, -0.590057373046875, -0.4951171875, -0.400177001953125, -0.30523681640625, -0.210296630859375, -0.1153564453125, -0.020416259765625, 0.07452392578125, 0.169464111328125, 0.264404296875, 0.359344482421875, 0.45428466796875, 0.549224853515625, 0.6441650390625, 0.739105224609375, 0.83404541015625, 0.928985595703125, 1.02392578125, 1.118865966796875, 1.21380615234375, 1.308746337890625, 1.4036865234375, 1.498626708984375, 1.59356689453125, 1.688507080078125, 1.783447265625, 1.878387451171875, 1.97332763671875, 2.068267822265625, 2.1632080078125, 2.258148193359375, 2.35308837890625, 2.448028564453125, 2.54296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 14.0, 30.0, 31.0, 22.0, 40.0, 41.0, 46.0, 46.0, 36.0, 53.0, 58.0, 55.0, 50.0, 60.0, 47.0, 51.0, 61.0, 43.0, 37.0, 27.0, 26.0, 23.0, 15.0, 12.0, 8.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.995513916015625, -1.93048095703125, -1.865447998046875, -1.8004150390625, -1.735382080078125, -1.67034912109375, -1.605316162109375, -1.540283203125, -1.475250244140625, -1.41021728515625, -1.345184326171875, -1.2801513671875, -1.215118408203125, -1.15008544921875, -1.085052490234375, -1.02001953125, -0.954986572265625, -0.88995361328125, -0.824920654296875, -0.7598876953125, -0.694854736328125, -0.62982177734375, -0.564788818359375, -0.499755859375, -0.434722900390625, -0.36968994140625, -0.304656982421875, -0.2396240234375, -0.174591064453125, -0.10955810546875, -0.044525146484375, 0.0205078125, 0.085540771484375, 0.15057373046875, 0.215606689453125, 0.2806396484375, 0.345672607421875, 0.41070556640625, 0.475738525390625, 0.540771484375, 0.605804443359375, 0.67083740234375, 0.735870361328125, 0.8009033203125, 0.865936279296875, 0.93096923828125, 0.996002197265625, 1.06103515625, 1.126068115234375, 1.19110107421875, 1.256134033203125, 1.3211669921875, 1.386199951171875, 1.45123291015625, 1.516265869140625, 1.581298828125, 1.646331787109375, 1.71136474609375, 1.776397705078125, 1.8414306640625, 1.906463623046875, 1.97149658203125, 2.036529541015625, 2.1015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 6.0, 9.0, 7.0, 13.0, 17.0, 21.0, 45.0, 49.0, 80.0, 109.0, 154.0, 248.0, 366.0, 618.0, 1088.0, 2496.0, 7560.0, 43327.0, 607667.0, 346510.0, 27804.0, 5755.0, 2106.0, 944.0, 537.0, 326.0, 214.0, 146.0, 100.0, 61.0, 49.0, 31.0, 29.0, 22.0, 18.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.46484375, -6.26214599609375, -6.0594482421875, -5.85675048828125, -5.654052734375, -5.45135498046875, -5.2486572265625, -5.04595947265625, -4.84326171875, -4.64056396484375, -4.4378662109375, -4.23516845703125, -4.032470703125, -3.82977294921875, -3.6270751953125, -3.42437744140625, -3.2216796875, -3.01898193359375, -2.8162841796875, -2.61358642578125, -2.410888671875, -2.20819091796875, -2.0054931640625, -1.80279541015625, -1.60009765625, -1.39739990234375, -1.1947021484375, -0.99200439453125, -0.789306640625, -0.58660888671875, -0.3839111328125, -0.18121337890625, 0.021484375, 0.22418212890625, 0.4268798828125, 0.62957763671875, 0.832275390625, 1.03497314453125, 1.2376708984375, 1.44036865234375, 1.64306640625, 1.84576416015625, 2.0484619140625, 2.25115966796875, 2.453857421875, 2.65655517578125, 2.8592529296875, 3.06195068359375, 3.2646484375, 3.46734619140625, 3.6700439453125, 3.87274169921875, 4.075439453125, 4.27813720703125, 4.4808349609375, 4.68353271484375, 4.88623046875, 5.08892822265625, 5.2916259765625, 5.49432373046875, 5.697021484375, 5.89971923828125, 6.1024169921875, 6.30511474609375, 6.5078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 15.0, 7.0, 5.0, 13.0, 23.0, 21.0, 13.0, 24.0, 29.0, 26.0, 24.0, 44.0, 50.0, 26.0, 43.0, 37.0, 35.0, 49.0, 47.0, 43.0, 37.0, 43.0, 38.0, 40.0, 28.0, 29.0, 20.0, 21.0, 24.0, 21.0, 17.0, 18.0, 16.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.8125, -6.61279296875, -6.4130859375, -6.21337890625, -6.013671875, -5.81396484375, -5.6142578125, -5.41455078125, -5.21484375, -5.01513671875, -4.8154296875, -4.61572265625, -4.416015625, -4.21630859375, -4.0166015625, -3.81689453125, -3.6171875, -3.41748046875, -3.2177734375, -3.01806640625, -2.818359375, -2.61865234375, -2.4189453125, -2.21923828125, -2.01953125, -1.81982421875, -1.6201171875, -1.42041015625, -1.220703125, -1.02099609375, -0.8212890625, -0.62158203125, -0.421875, -0.22216796875, -0.0224609375, 0.17724609375, 0.376953125, 0.57666015625, 0.7763671875, 0.97607421875, 1.17578125, 1.37548828125, 1.5751953125, 1.77490234375, 1.974609375, 2.17431640625, 2.3740234375, 2.57373046875, 2.7734375, 2.97314453125, 3.1728515625, 3.37255859375, 3.572265625, 3.77197265625, 3.9716796875, 4.17138671875, 4.37109375, 4.57080078125, 4.7705078125, 4.97021484375, 5.169921875, 5.36962890625, 5.5693359375, 5.76904296875, 5.96875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 10.0, 19.0, 18.0, 32.0, 45.0, 85.0, 180.0, 366.0, 1073.0, 4428.0, 42956.0, 855178.0, 133012.0, 8510.0, 1662.0, 501.0, 224.0, 94.0, 57.0, 33.0, 16.0, 18.0, 12.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640625, -4.478759765625, -4.31689453125, -4.155029296875, -3.9931640625, -3.831298828125, -3.66943359375, -3.507568359375, -3.345703125, -3.183837890625, -3.02197265625, -2.860107421875, -2.6982421875, -2.536376953125, -2.37451171875, -2.212646484375, -2.05078125, -1.888916015625, -1.72705078125, -1.565185546875, -1.4033203125, -1.241455078125, -1.07958984375, -0.917724609375, -0.755859375, -0.593994140625, -0.43212890625, -0.270263671875, -0.1083984375, 0.053466796875, 0.21533203125, 0.377197265625, 0.5390625, 0.700927734375, 0.86279296875, 1.024658203125, 1.1865234375, 1.348388671875, 1.51025390625, 1.672119140625, 1.833984375, 1.995849609375, 2.15771484375, 2.319580078125, 2.4814453125, 2.643310546875, 2.80517578125, 2.967041015625, 3.12890625, 3.290771484375, 3.45263671875, 3.614501953125, 3.7763671875, 3.938232421875, 4.10009765625, 4.261962890625, 4.423828125, 4.585693359375, 4.74755859375, 4.909423828125, 5.0712890625, 5.233154296875, 5.39501953125, 5.556884765625, 5.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 14.0, 18.0, 18.0, 31.0, 63.0, 90.0, 189.0, 185.0, 134.0, 70.0, 47.0, 36.0, 21.0, 7.0, 14.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007348060607910156, -0.0007087960839271545, -0.0006827861070632935, -0.0006567761301994324, -0.0006307661533355713, -0.0006047561764717102, -0.0005787461996078491, -0.000552736222743988, -0.000526726245880127, -0.0005007162690162659, -0.0004747062921524048, -0.0004486963152885437, -0.0004226863384246826, -0.00039667636156082153, -0.00037066638469696045, -0.00034465640783309937, -0.0003186464309692383, -0.0002926364541053772, -0.0002666264772415161, -0.00024061650037765503, -0.00021460652351379395, -0.00018859654664993286, -0.00016258656978607178, -0.0001365765929222107, -0.00011056661605834961, -8.455663919448853e-05, -5.854666233062744e-05, -3.253668546676636e-05, -6.5267086029052734e-06, 1.948326826095581e-05, 4.5493245124816895e-05, 7.150322198867798e-05, 9.751319885253906e-05, 0.00012352317571640015, 0.00014953315258026123, 0.00017554312944412231, 0.0002015531063079834, 0.00022756308317184448, 0.00025357306003570557, 0.00027958303689956665, 0.00030559301376342773, 0.0003316029906272888, 0.0003576129674911499, 0.000383622944355011, 0.00040963292121887207, 0.00043564289808273315, 0.00046165287494659424, 0.0004876628518104553, 0.0005136728286743164, 0.0005396828055381775, 0.0005656927824020386, 0.0005917027592658997, 0.0006177127361297607, 0.0006437227129936218, 0.0006697326898574829, 0.000695742666721344, 0.0007217526435852051, 0.0007477626204490662, 0.0007737725973129272, 0.0007997825741767883, 0.0008257925510406494, 0.0008518025279045105, 0.0008778125047683716, 0.0009038224816322327, 0.0009298324584960938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 20.0, 17.0, 28.0, 46.0, 79.0, 132.0, 212.0, 422.0, 840.0, 1859.0, 5178.0, 22440.0, 185323.0, 705192.0, 104737.0, 14912.0, 3952.0, 1508.0, 707.0, 386.0, 204.0, 126.0, 69.0, 37.0, 37.0, 20.0, 11.0, 12.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.842559814453125, -3.73394775390625, -3.625335693359375, -3.5167236328125, -3.408111572265625, -3.29949951171875, -3.190887451171875, -3.082275390625, -2.973663330078125, -2.86505126953125, -2.756439208984375, -2.6478271484375, -2.539215087890625, -2.43060302734375, -2.321990966796875, -2.21337890625, -2.104766845703125, -1.99615478515625, -1.887542724609375, -1.7789306640625, -1.670318603515625, -1.56170654296875, -1.453094482421875, -1.344482421875, -1.235870361328125, -1.12725830078125, -1.018646240234375, -0.9100341796875, -0.801422119140625, -0.69281005859375, -0.584197998046875, -0.4755859375, -0.366973876953125, -0.25836181640625, -0.149749755859375, -0.0411376953125, 0.067474365234375, 0.17608642578125, 0.284698486328125, 0.393310546875, 0.501922607421875, 0.61053466796875, 0.719146728515625, 0.8277587890625, 0.936370849609375, 1.04498291015625, 1.153594970703125, 1.26220703125, 1.370819091796875, 1.47943115234375, 1.588043212890625, 1.6966552734375, 1.805267333984375, 1.91387939453125, 2.022491455078125, 2.131103515625, 2.239715576171875, 2.34832763671875, 2.456939697265625, 2.5655517578125, 2.674163818359375, 2.78277587890625, 2.891387939453125, 3.0]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 24.0, 34.0, 30.0, 42.0, 44.0, 71.0, 64.0, 69.0, 96.0, 97.0, 77.0, 83.0, 59.0, 52.0, 32.0, 26.0, 17.0, 16.0, 10.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.011810302734375, -2.92987060546875, -2.847930908203125, -2.7659912109375, -2.684051513671875, -2.60211181640625, -2.520172119140625, -2.438232421875, -2.356292724609375, -2.27435302734375, -2.192413330078125, -2.1104736328125, -2.028533935546875, -1.94659423828125, -1.864654541015625, -1.78271484375, -1.700775146484375, -1.61883544921875, -1.536895751953125, -1.4549560546875, -1.373016357421875, -1.29107666015625, -1.209136962890625, -1.127197265625, -1.045257568359375, -0.96331787109375, -0.881378173828125, -0.7994384765625, -0.717498779296875, -0.63555908203125, -0.553619384765625, -0.4716796875, -0.389739990234375, -0.30780029296875, -0.225860595703125, -0.1439208984375, -0.061981201171875, 0.01995849609375, 0.101898193359375, 0.183837890625, 0.265777587890625, 0.34771728515625, 0.429656982421875, 0.5115966796875, 0.593536376953125, 0.67547607421875, 0.757415771484375, 0.83935546875, 0.921295166015625, 1.00323486328125, 1.085174560546875, 1.1671142578125, 1.249053955078125, 1.33099365234375, 1.412933349609375, 1.494873046875, 1.576812744140625, 1.65875244140625, 1.740692138671875, 1.8226318359375, 1.904571533203125, 1.98651123046875, 2.068450927734375, 2.150390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 30.0, 89.0, 178.0, 288.0, 245.0, 89.0, 39.0, 18.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.6630630493164, -92.97833251953125, -90.29359436035156, -87.6088638305664, -84.92412567138672, -82.23939514160156, -79.55465698242188, -76.86992645263672, -74.18519592285156, -71.5004653930664, -68.81572723388672, -66.13099670410156, -63.446258544921875, -60.76152801513672, -58.0767936706543, -55.392059326171875, -52.70732116699219, -50.022586822509766, -47.337852478027344, -44.65312194824219, -41.9683837890625, -39.283653259277344, -36.59891891479492, -33.9141845703125, -31.229450225830078, -28.544715881347656, -25.859981536865234, -23.175249099731445, -20.490514755249023, -17.8057804107666, -15.121047973632812, -12.43631362915039, -9.7515869140625, -7.066853046417236, -4.382119178771973, -1.6973857879638672, 0.9873485565185547, 3.6720829010009766, 6.356815338134766, 9.041549682617188, 11.72628402709961, 14.411018371582031, 17.095752716064453, 19.780485153198242, 22.465219497680664, 25.149953842163086, 27.834686279296875, 30.519420623779297, 33.20415496826172, 35.88888931274414, 38.57362365722656, 41.25835418701172, 43.943092346191406, 46.62782287597656, 49.312557220458984, 51.997291564941406, 54.68202590942383, 57.36676025390625, 60.05149459838867, 62.736228942871094, 65.42095947265625, 68.10569763183594, 70.7904281616211, 73.47515869140625, 76.15989685058594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 5.0, 11.0, 11.0, 12.0, 20.0, 29.0, 23.0, 28.0, 43.0, 47.0, 48.0, 52.0, 78.0, 75.0, 70.0, 66.0, 55.0, 51.0, 34.0, 46.0, 33.0, 37.0, 22.0, 20.0, 12.0, 18.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.164466857910156, -51.79619216918945, -50.427913665771484, -49.05963897705078, -47.69136428833008, -46.323089599609375, -44.954811096191406, -43.5865364074707, -42.21826171875, -40.8499870300293, -39.48170852661133, -38.113433837890625, -36.74515914916992, -35.37688446044922, -34.00860595703125, -32.64033126831055, -31.27205467224121, -29.903778076171875, -28.535503387451172, -27.167226791381836, -25.798952102661133, -24.430675506591797, -23.062400817871094, -21.694124221801758, -20.325847625732422, -18.957571029663086, -17.589296340942383, -16.221019744873047, -14.852745056152344, -13.484468460083008, -12.116192817687988, -10.747917175292969, -9.379642486572266, -8.011366844177246, -6.643091201782227, -5.274815082550049, -3.9065394401550293, -2.5382637977600098, -1.169987678527832, 0.1982879638671875, 1.566563606262207, 2.9348392486572266, 4.303114891052246, 5.671391010284424, 7.039666652679443, 8.407941818237305, 9.77621841430664, 11.14449405670166, 12.51276969909668, 13.8810453414917, 15.249320983886719, 16.617597579956055, 17.985872268676758, 19.354148864746094, 20.722423553466797, 22.090700149536133, 23.45897674560547, 24.827253341674805, 26.195528030395508, 27.563804626464844, 28.932079315185547, 30.300355911254883, 31.66863250732422, 33.03690719604492, 34.405181884765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 9.0, 20.0, 17.0, 29.0, 57.0, 100.0, 191.0, 347.0, 716.0, 1525.0, 3426.0, 9330.0, 38199.0, 3975536.0, 138118.0, 16995.0, 5215.0, 2245.0, 1046.0, 492.0, 300.0, 164.0, 75.0, 34.0, 34.0, 21.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.0087890625, -5.775390625, -5.5419921875, -5.30859375, -5.0751953125, -4.841796875, -4.6083984375, -4.375, -4.1416015625, -3.908203125, -3.6748046875, -3.44140625, -3.2080078125, -2.974609375, -2.7412109375, -2.5078125, -2.2744140625, -2.041015625, -1.8076171875, -1.57421875, -1.3408203125, -1.107421875, -0.8740234375, -0.640625, -0.4072265625, -0.173828125, 0.0595703125, 0.29296875, 0.5263671875, 0.759765625, 0.9931640625, 1.2265625, 1.4599609375, 1.693359375, 1.9267578125, 2.16015625, 2.3935546875, 2.626953125, 2.8603515625, 3.09375, 3.3271484375, 3.560546875, 3.7939453125, 4.02734375, 4.2607421875, 4.494140625, 4.7275390625, 4.9609375, 5.1943359375, 5.427734375, 5.6611328125, 5.89453125, 6.1279296875, 6.361328125, 6.5947265625, 6.828125, 7.0615234375, 7.294921875, 7.5283203125, 7.76171875, 7.9951171875, 8.228515625, 8.4619140625, 8.6953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 7.0, 14.0, 21.0, 18.0, 21.0, 33.0, 28.0, 40.0, 50.0, 57.0, 53.0, 67.0, 69.0, 59.0, 57.0, 64.0, 57.0, 54.0, 43.0, 32.0, 29.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.556640625, -2.487640380859375, -2.41864013671875, -2.349639892578125, -2.2806396484375, -2.211639404296875, -2.14263916015625, -2.073638916015625, -2.004638671875, -1.935638427734375, -1.86663818359375, -1.797637939453125, -1.7286376953125, -1.659637451171875, -1.59063720703125, -1.521636962890625, -1.45263671875, -1.383636474609375, -1.31463623046875, -1.245635986328125, -1.1766357421875, -1.107635498046875, -1.03863525390625, -0.969635009765625, -0.900634765625, -0.831634521484375, -0.76263427734375, -0.693634033203125, -0.6246337890625, -0.555633544921875, -0.48663330078125, -0.417633056640625, -0.3486328125, -0.279632568359375, -0.21063232421875, -0.141632080078125, -0.0726318359375, -0.003631591796875, 0.06536865234375, 0.134368896484375, 0.203369140625, 0.272369384765625, 0.34136962890625, 0.410369873046875, 0.4793701171875, 0.548370361328125, 0.61737060546875, 0.686370849609375, 0.75537109375, 0.824371337890625, 0.89337158203125, 0.962371826171875, 1.0313720703125, 1.100372314453125, 1.16937255859375, 1.238372802734375, 1.307373046875, 1.376373291015625, 1.44537353515625, 1.514373779296875, 1.5833740234375, 1.652374267578125, 1.72137451171875, 1.790374755859375, 1.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 16.0, 16.0, 34.0, 35.0, 51.0, 78.0, 115.0, 179.0, 268.0, 421.0, 707.0, 1152.0, 1934.0, 3424.0, 7092.0, 18143.0, 77336.0, 3801452.0, 230352.0, 30511.0, 10381.0, 4413.0, 2483.0, 1351.0, 896.0, 482.0, 299.0, 214.0, 137.0, 84.0, 67.0, 42.0, 19.0, 21.0, 18.0, 9.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.33837890625, -4.1923828125, -4.04638671875, -3.900390625, -3.75439453125, -3.6083984375, -3.46240234375, -3.31640625, -3.17041015625, -3.0244140625, -2.87841796875, -2.732421875, -2.58642578125, -2.4404296875, -2.29443359375, -2.1484375, -2.00244140625, -1.8564453125, -1.71044921875, -1.564453125, -1.41845703125, -1.2724609375, -1.12646484375, -0.98046875, -0.83447265625, -0.6884765625, -0.54248046875, -0.396484375, -0.25048828125, -0.1044921875, 0.04150390625, 0.1875, 0.33349609375, 0.4794921875, 0.62548828125, 0.771484375, 0.91748046875, 1.0634765625, 1.20947265625, 1.35546875, 1.50146484375, 1.6474609375, 1.79345703125, 1.939453125, 2.08544921875, 2.2314453125, 2.37744140625, 2.5234375, 2.66943359375, 2.8154296875, 2.96142578125, 3.107421875, 3.25341796875, 3.3994140625, 3.54541015625, 3.69140625, 3.83740234375, 3.9833984375, 4.12939453125, 4.275390625, 4.42138671875, 4.5673828125, 4.71337890625, 4.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 9.0, 12.0, 11.0, 20.0, 54.0, 90.0, 245.0, 2856.0, 469.0, 126.0, 57.0, 33.0, 21.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.94854736328125, -1.8756103515625, -1.80267333984375, -1.729736328125, -1.65679931640625, -1.5838623046875, -1.51092529296875, -1.43798828125, -1.36505126953125, -1.2921142578125, -1.21917724609375, -1.146240234375, -1.07330322265625, -1.0003662109375, -0.92742919921875, -0.8544921875, -0.78155517578125, -0.7086181640625, -0.63568115234375, -0.562744140625, -0.48980712890625, -0.4168701171875, -0.34393310546875, -0.27099609375, -0.19805908203125, -0.1251220703125, -0.05218505859375, 0.020751953125, 0.09368896484375, 0.1666259765625, 0.23956298828125, 0.3125, 0.38543701171875, 0.4583740234375, 0.53131103515625, 0.604248046875, 0.67718505859375, 0.7501220703125, 0.82305908203125, 0.89599609375, 0.96893310546875, 1.0418701171875, 1.11480712890625, 1.187744140625, 1.26068115234375, 1.3336181640625, 1.40655517578125, 1.4794921875, 1.55242919921875, 1.6253662109375, 1.69830322265625, 1.771240234375, 1.84417724609375, 1.9171142578125, 1.99005126953125, 2.06298828125, 2.13592529296875, 2.2088623046875, 2.28179931640625, 2.354736328125, 2.42767333984375, 2.5006103515625, 2.57354736328125, 2.646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 7.0, 6.0, 19.0, 27.0, 37.0, 58.0, 99.0, 133.0, 145.0, 161.0, 118.0, 74.0, 47.0, 23.0, 22.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.110759735107422, -9.742130279541016, -9.37350082397461, -9.004871368408203, -8.636241912841797, -8.26761245727539, -7.898983478546143, -7.530354022979736, -7.16172456741333, -6.793095111846924, -6.424465656280518, -6.0558366775512695, -5.687207221984863, -5.318577766418457, -4.949948310852051, -4.5813188552856445, -4.212689399719238, -3.844059944152832, -3.475430488586426, -3.1068012714385986, -2.7381718158721924, -2.369542360305786, -2.000913143157959, -1.6322836875915527, -1.2636542320251465, -0.895024836063385, -0.5263954401016235, -0.15776610374450684, 0.21086335182189941, 0.5794928073883057, 0.9481220245361328, 1.316751480102539, 1.685379981994629, 2.054009437561035, 2.4226388931274414, 2.7912681102752686, 3.159897565841675, 3.528527021408081, 3.897156238555908, 4.2657856941223145, 4.634415149688721, 5.003044605255127, 5.371674060821533, 5.740303039550781, 6.1089324951171875, 6.477561950683594, 6.84619140625, 7.214820861816406, 7.5834503173828125, 7.952079772949219, 8.320709228515625, 8.689338684082031, 9.057968139648438, 9.426597595214844, 9.79522705078125, 10.163856506347656, 10.532485961914062, 10.901115417480469, 11.269744873046875, 11.638374328613281, 12.007003784179688, 12.375633239746094, 12.7442626953125, 13.112892150878906, 13.481520652770996]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 5.0, 17.0, 16.0, 13.0, 22.0, 26.0, 22.0, 40.0, 23.0, 37.0, 43.0, 38.0, 47.0, 45.0, 44.0, 59.0, 50.0, 36.0, 38.0, 41.0, 29.0, 44.0, 36.0, 31.0, 30.0, 31.0, 26.0, 17.0, 15.0, 12.0, 20.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.804723262786865, -4.625757217407227, -4.44679069519043, -4.267824649810791, -4.088858604431152, -3.9098923206329346, -3.730926036834717, -3.551959991455078, -3.3729937076568604, -3.1940274238586426, -3.015061378479004, -2.836095094680786, -2.6571288108825684, -2.4781627655029297, -2.299196481704712, -2.120230197906494, -1.9412641525268555, -1.7622979879379272, -1.583331823348999, -1.4043655395507812, -1.225399374961853, -1.0464332103729248, -0.867466926574707, -0.6885007619857788, -0.5095345973968506, -0.3305684030056, -0.15160220861434937, 0.027364015579223633, 0.20633018016815186, 0.3852963447570801, 0.5642626285552979, 0.7432287931442261, 0.9221954345703125, 1.1011615991592407, 1.280127763748169, 1.4590940475463867, 1.638060212135315, 1.8170263767242432, 1.995992660522461, 2.1749587059020996, 2.3539249897003174, 2.532891273498535, 2.711857318878174, 2.8908236026763916, 3.0697898864746094, 3.248755931854248, 3.427722215652466, 3.6066884994506836, 3.7856545448303223, 3.96462082862854, 4.143587112426758, 4.3225531578063965, 4.501519203186035, 4.680485725402832, 4.859451770782471, 5.038417816162109, 5.217384338378906, 5.396350383758545, 5.575316905975342, 5.7542829513549805, 5.933248996734619, 6.112215042114258, 6.291181564331055, 6.470147609710693, 6.649113655090332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 3.0, 11.0, 17.0, 16.0, 43.0, 69.0, 120.0, 233.0, 472.0, 1169.0, 2903.0, 8065.0, 27037.0, 105325.0, 464332.0, 334662.0, 73743.0, 20001.0, 6296.0, 2265.0, 924.0, 408.0, 201.0, 89.0, 57.0, 32.0, 23.0, 10.0, 12.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.49493408203125, -4.2984619140625, -4.10198974609375, -3.905517578125, -3.70904541015625, -3.5125732421875, -3.31610107421875, -3.11962890625, -2.92315673828125, -2.7266845703125, -2.53021240234375, -2.333740234375, -2.13726806640625, -1.9407958984375, -1.74432373046875, -1.5478515625, -1.35137939453125, -1.1549072265625, -0.95843505859375, -0.761962890625, -0.56549072265625, -0.3690185546875, -0.17254638671875, 0.02392578125, 0.22039794921875, 0.4168701171875, 0.61334228515625, 0.809814453125, 1.00628662109375, 1.2027587890625, 1.39923095703125, 1.595703125, 1.79217529296875, 1.9886474609375, 2.18511962890625, 2.381591796875, 2.57806396484375, 2.7745361328125, 2.97100830078125, 3.16748046875, 3.36395263671875, 3.5604248046875, 3.75689697265625, 3.953369140625, 4.14984130859375, 4.3463134765625, 4.54278564453125, 4.7392578125, 4.93572998046875, 5.1322021484375, 5.32867431640625, 5.525146484375, 5.72161865234375, 5.9180908203125, 6.11456298828125, 6.31103515625, 6.50750732421875, 6.7039794921875, 6.90045166015625, 7.096923828125, 7.29339599609375, 7.4898681640625, 7.68634033203125, 7.8828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 14.0, 20.0, 20.0, 27.0, 21.0, 30.0, 36.0, 33.0, 49.0, 53.0, 54.0, 57.0, 55.0, 54.0, 48.0, 52.0, 54.0, 44.0, 51.0, 34.0, 43.0, 21.0, 20.0, 20.0, 16.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.15625, -2.0941314697265625, -2.032012939453125, -1.9698944091796875, -1.90777587890625, -1.8456573486328125, -1.783538818359375, -1.7214202880859375, -1.6593017578125, -1.5971832275390625, -1.535064697265625, -1.4729461669921875, -1.41082763671875, -1.3487091064453125, -1.286590576171875, -1.2244720458984375, -1.162353515625, -1.1002349853515625, -1.038116455078125, -0.9759979248046875, -0.91387939453125, -0.8517608642578125, -0.789642333984375, -0.7275238037109375, -0.6654052734375, -0.6032867431640625, -0.541168212890625, -0.4790496826171875, -0.41693115234375, -0.3548126220703125, -0.292694091796875, -0.2305755615234375, -0.16845703125, -0.1063385009765625, -0.044219970703125, 0.0178985595703125, 0.08001708984375, 0.1421356201171875, 0.204254150390625, 0.2663726806640625, 0.3284912109375, 0.3906097412109375, 0.452728271484375, 0.5148468017578125, 0.57696533203125, 0.6390838623046875, 0.701202392578125, 0.7633209228515625, 0.825439453125, 0.8875579833984375, 0.949676513671875, 1.0117950439453125, 1.07391357421875, 1.1360321044921875, 1.198150634765625, 1.2602691650390625, 1.3223876953125, 1.3845062255859375, 1.446624755859375, 1.5087432861328125, 1.57086181640625, 1.6329803466796875, 1.695098876953125, 1.7572174072265625, 1.8193359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 11.0, 21.0, 13.0, 20.0, 33.0, 29.0, 48.0, 75.0, 94.0, 137.0, 196.0, 322.0, 437.0, 707.0, 1194.0, 2467.0, 6475.0, 28654.0, 219443.0, 682245.0, 83539.0, 13957.0, 3931.0, 1795.0, 968.0, 564.0, 361.0, 228.0, 152.0, 111.0, 95.0, 58.0, 52.0, 29.0, 24.0, 20.0, 9.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.94140625, -7.7283935546875, -7.515380859375, -7.3023681640625, -7.08935546875, -6.8763427734375, -6.663330078125, -6.4503173828125, -6.2373046875, -6.0242919921875, -5.811279296875, -5.5982666015625, -5.38525390625, -5.1722412109375, -4.959228515625, -4.7462158203125, -4.533203125, -4.3201904296875, -4.107177734375, -3.8941650390625, -3.68115234375, -3.4681396484375, -3.255126953125, -3.0421142578125, -2.8291015625, -2.6160888671875, -2.403076171875, -2.1900634765625, -1.97705078125, -1.7640380859375, -1.551025390625, -1.3380126953125, -1.125, -0.9119873046875, -0.698974609375, -0.4859619140625, -0.27294921875, -0.0599365234375, 0.153076171875, 0.3660888671875, 0.5791015625, 0.7921142578125, 1.005126953125, 1.2181396484375, 1.43115234375, 1.6441650390625, 1.857177734375, 2.0701904296875, 2.283203125, 2.4962158203125, 2.709228515625, 2.9222412109375, 3.13525390625, 3.3482666015625, 3.561279296875, 3.7742919921875, 3.9873046875, 4.2003173828125, 4.413330078125, 4.6263427734375, 4.83935546875, 5.0523681640625, 5.265380859375, 5.4783935546875, 5.69140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 3.0, 10.0, 13.0, 15.0, 18.0, 17.0, 30.0, 29.0, 30.0, 45.0, 47.0, 60.0, 52.0, 48.0, 53.0, 62.0, 67.0, 50.0, 53.0, 41.0, 44.0, 36.0, 26.0, 25.0, 28.0, 22.0, 16.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.6484375, -9.403076171875, -9.15771484375, -8.912353515625, -8.6669921875, -8.421630859375, -8.17626953125, -7.930908203125, -7.685546875, -7.440185546875, -7.19482421875, -6.949462890625, -6.7041015625, -6.458740234375, -6.21337890625, -5.968017578125, -5.72265625, -5.477294921875, -5.23193359375, -4.986572265625, -4.7412109375, -4.495849609375, -4.25048828125, -4.005126953125, -3.759765625, -3.514404296875, -3.26904296875, -3.023681640625, -2.7783203125, -2.532958984375, -2.28759765625, -2.042236328125, -1.796875, -1.551513671875, -1.30615234375, -1.060791015625, -0.8154296875, -0.570068359375, -0.32470703125, -0.079345703125, 0.166015625, 0.411376953125, 0.65673828125, 0.902099609375, 1.1474609375, 1.392822265625, 1.63818359375, 1.883544921875, 2.12890625, 2.374267578125, 2.61962890625, 2.864990234375, 3.1103515625, 3.355712890625, 3.60107421875, 3.846435546875, 4.091796875, 4.337158203125, 4.58251953125, 4.827880859375, 5.0732421875, 5.318603515625, 5.56396484375, 5.809326171875, 6.0546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 7.0, 9.0, 6.0, 21.0, 23.0, 34.0, 55.0, 50.0, 79.0, 115.0, 153.0, 222.0, 332.0, 615.0, 950.0, 1782.0, 3486.0, 7622.0, 19299.0, 55593.0, 179897.0, 510079.0, 178105.0, 55123.0, 19161.0, 7785.0, 3507.0, 1797.0, 962.0, 542.0, 361.0, 200.0, 173.0, 106.0, 83.0, 48.0, 34.0, 22.0, 17.0, 16.0, 9.0, 18.0, 6.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0], "bins": [-1.6611328125, -1.610015869140625, -1.55889892578125, -1.507781982421875, -1.4566650390625, -1.405548095703125, -1.35443115234375, -1.303314208984375, -1.252197265625, -1.201080322265625, -1.14996337890625, -1.098846435546875, -1.0477294921875, -0.996612548828125, -0.94549560546875, -0.894378662109375, -0.84326171875, -0.792144775390625, -0.74102783203125, -0.689910888671875, -0.6387939453125, -0.587677001953125, -0.53656005859375, -0.485443115234375, -0.434326171875, -0.383209228515625, -0.33209228515625, -0.280975341796875, -0.2298583984375, -0.178741455078125, -0.12762451171875, -0.076507568359375, -0.025390625, 0.025726318359375, 0.07684326171875, 0.127960205078125, 0.1790771484375, 0.230194091796875, 0.28131103515625, 0.332427978515625, 0.383544921875, 0.434661865234375, 0.48577880859375, 0.536895751953125, 0.5880126953125, 0.639129638671875, 0.69024658203125, 0.741363525390625, 0.79248046875, 0.843597412109375, 0.89471435546875, 0.945831298828125, 0.9969482421875, 1.048065185546875, 1.09918212890625, 1.150299072265625, 1.201416015625, 1.252532958984375, 1.30364990234375, 1.354766845703125, 1.4058837890625, 1.457000732421875, 1.50811767578125, 1.559234619140625, 1.6103515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 11.0, 4.0, 11.0, 9.0, 27.0, 30.0, 38.0, 45.0, 60.0, 90.0, 145.0, 188.0, 110.0, 57.0, 40.0, 43.0, 18.0, 24.0, 18.0, 14.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009059906005859375, -0.0008816048502922058, -0.0008572190999984741, -0.0008328333497047424, -0.0008084475994110107, -0.000784061849117279, -0.0007596760988235474, -0.0007352903485298157, -0.000710904598236084, -0.0006865188479423523, -0.0006621330976486206, -0.0006377473473548889, -0.0006133615970611572, -0.0005889758467674255, -0.0005645900964736938, -0.0005402043461799622, -0.0005158185958862305, -0.0004914328455924988, -0.0004670470952987671, -0.0004426613450050354, -0.0004182755947113037, -0.000393889844417572, -0.00036950409412384033, -0.00034511834383010864, -0.00032073259353637695, -0.00029634684324264526, -0.0002719610929489136, -0.0002475753426551819, -0.0002231895923614502, -0.0001988038420677185, -0.00017441809177398682, -0.00015003234148025513, -0.00012564659118652344, -0.00010126084089279175, -7.687509059906006e-05, -5.248934030532837e-05, -2.810359001159668e-05, -3.7178397178649902e-06, 2.06679105758667e-05, 4.505366086959839e-05, 6.943941116333008e-05, 9.382516145706177e-05, 0.00011821091175079346, 0.00014259666204452515, 0.00016698241233825684, 0.00019136816263198853, 0.00021575391292572021, 0.0002401396632194519, 0.0002645254135131836, 0.0002889111638069153, 0.00031329691410064697, 0.00033768266439437866, 0.00036206841468811035, 0.00038645416498184204, 0.00041083991527557373, 0.0004352256655693054, 0.0004596114158630371, 0.0004839971661567688, 0.0005083829164505005, 0.0005327686667442322, 0.0005571544170379639, 0.0005815401673316956, 0.0006059259176254272, 0.0006303116679191589, 0.0006546974182128906]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 5.0, 9.0, 15.0, 21.0, 30.0, 45.0, 48.0, 65.0, 118.0, 179.0, 262.0, 437.0, 842.0, 1558.0, 3540.0, 10174.0, 40402.0, 225977.0, 602687.0, 124945.0, 24565.0, 6912.0, 2661.0, 1231.0, 709.0, 369.0, 259.0, 162.0, 107.0, 62.0, 42.0, 34.0, 20.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.272735595703125, -2.19781494140625, -2.122894287109375, -2.0479736328125, -1.973052978515625, -1.89813232421875, -1.823211669921875, -1.748291015625, -1.673370361328125, -1.59844970703125, -1.523529052734375, -1.4486083984375, -1.373687744140625, -1.29876708984375, -1.223846435546875, -1.14892578125, -1.074005126953125, -0.99908447265625, -0.924163818359375, -0.8492431640625, -0.774322509765625, -0.69940185546875, -0.624481201171875, -0.549560546875, -0.474639892578125, -0.39971923828125, -0.324798583984375, -0.2498779296875, -0.174957275390625, -0.10003662109375, -0.025115966796875, 0.0498046875, 0.124725341796875, 0.19964599609375, 0.274566650390625, 0.3494873046875, 0.424407958984375, 0.49932861328125, 0.574249267578125, 0.649169921875, 0.724090576171875, 0.79901123046875, 0.873931884765625, 0.9488525390625, 1.023773193359375, 1.09869384765625, 1.173614501953125, 1.24853515625, 1.323455810546875, 1.39837646484375, 1.473297119140625, 1.5482177734375, 1.623138427734375, 1.69805908203125, 1.772979736328125, 1.847900390625, 1.922821044921875, 1.99774169921875, 2.072662353515625, 2.1475830078125, 2.222503662109375, 2.29742431640625, 2.372344970703125, 2.447265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 8.0, 16.0, 19.0, 12.0, 26.0, 27.0, 19.0, 34.0, 41.0, 47.0, 56.0, 67.0, 84.0, 52.0, 80.0, 64.0, 56.0, 48.0, 22.0, 25.0, 26.0, 15.0, 28.0, 18.0, 15.0, 11.0, 12.0, 10.0, 3.0, 11.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61260986328125, -1.5592041015625, -1.50579833984375, -1.452392578125, -1.39898681640625, -1.3455810546875, -1.29217529296875, -1.23876953125, -1.18536376953125, -1.1319580078125, -1.07855224609375, -1.025146484375, -0.97174072265625, -0.9183349609375, -0.86492919921875, -0.8115234375, -0.75811767578125, -0.7047119140625, -0.65130615234375, -0.597900390625, -0.54449462890625, -0.4910888671875, -0.43768310546875, -0.38427734375, -0.33087158203125, -0.2774658203125, -0.22406005859375, -0.170654296875, -0.11724853515625, -0.0638427734375, -0.01043701171875, 0.04296875, 0.09637451171875, 0.1497802734375, 0.20318603515625, 0.256591796875, 0.30999755859375, 0.3634033203125, 0.41680908203125, 0.47021484375, 0.52362060546875, 0.5770263671875, 0.63043212890625, 0.683837890625, 0.73724365234375, 0.7906494140625, 0.84405517578125, 0.8974609375, 0.95086669921875, 1.0042724609375, 1.05767822265625, 1.111083984375, 1.16448974609375, 1.2178955078125, 1.27130126953125, 1.32470703125, 1.37811279296875, 1.4315185546875, 1.48492431640625, 1.538330078125, 1.59173583984375, 1.6451416015625, 1.69854736328125, 1.751953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 23.0, 82.0, 179.0, 253.0, 248.0, 117.0, 54.0, 22.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.33924865722656, -51.71582794189453, -49.0924072265625, -46.46898651123047, -43.8455696105957, -41.22214889526367, -38.59872817993164, -35.975311279296875, -33.351890563964844, -30.728469848632812, -28.105051040649414, -25.481630325317383, -22.858211517333984, -20.234790802001953, -17.611370086669922, -14.987951278686523, -12.36452865600586, -9.741108894348145, -7.1176886558532715, -4.494268417358398, -1.8708486557006836, 0.7525711059570312, 3.3759918212890625, 5.999410629272461, 8.622831344604492, 11.246251106262207, 13.869670867919922, 16.493091583251953, 19.116512298583984, 21.739931106567383, 24.363351821899414, 26.986770629882812, 29.610191345214844, 32.233612060546875, 34.857032775878906, 37.48045349121094, 40.1038703918457, 42.727291107177734, 45.350711822509766, 47.97412872314453, 50.59754943847656, 53.220970153808594, 55.844390869140625, 58.467811584472656, 61.09122848510742, 63.71464920043945, 66.33807373046875, 68.96148681640625, 71.58491516113281, 74.20833587646484, 76.83175659179688, 79.4551773071289, 82.07859802246094, 84.70201110839844, 87.325439453125, 89.9488525390625, 92.57227325439453, 95.19569396972656, 97.8191146850586, 100.44253540039062, 103.06595611572266, 105.68937683105469, 108.31278991699219, 110.93621063232422, 113.55963134765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 17.0, 50.0, 39.0, 38.0, 32.0, 44.0, 52.0, 50.0, 55.0, 39.0, 47.0, 30.0, 45.0, 39.0, 40.0, 37.0, 30.0, 22.0, 31.0, 24.0, 18.0, 15.0, 11.0, 12.0, 7.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.92465591430664, -24.99482536315918, -24.064992904663086, -23.135162353515625, -22.205331802368164, -21.275501251220703, -20.34566879272461, -19.41583824157715, -18.486007690429688, -17.556177139282227, -16.626344680786133, -15.696514129638672, -14.766683578491211, -13.836852073669434, -12.907020568847656, -11.977190017700195, -11.047358512878418, -10.11752700805664, -9.18769645690918, -8.257864952087402, -7.328034400939941, -6.398202896118164, -5.468371868133545, -4.538540840148926, -3.6087098121643066, -2.6788787841796875, -1.7490476369857788, -0.8192164897918701, 0.11061453819274902, 1.0404458045959473, 1.9702768325805664, 2.9001078605651855, 3.8299388885498047, 4.759769916534424, 5.689600944519043, 6.61943244934082, 7.549263000488281, 8.479094505310059, 9.408926010131836, 10.338756561279297, 11.268587112426758, 12.198418617248535, 13.128249168395996, 14.058080673217773, 14.987911224365234, 15.917742729187012, 16.84757423400879, 17.77740478515625, 18.707237243652344, 19.637067794799805, 20.5669002532959, 21.49673080444336, 22.42656135559082, 23.35639190673828, 24.286224365234375, 25.216054916381836, 26.145885467529297, 27.075716018676758, 28.00554847717285, 28.935379028320312, 29.865209579467773, 30.795040130615234, 31.724872589111328, 32.654701232910156, 33.58453369140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 13.0, 16.0, 27.0, 50.0, 82.0, 134.0, 218.0, 378.0, 730.0, 1398.0, 2791.0, 6263.0, 15490.0, 46147.0, 221830.0, 3062423.0, 714655.0, 81176.0, 23810.0, 9025.0, 3785.0, 1796.0, 880.0, 473.0, 279.0, 165.0, 81.0, 60.0, 39.0, 23.0, 16.0, 5.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.806640625, -3.682708740234375, -3.55877685546875, -3.434844970703125, -3.3109130859375, -3.186981201171875, -3.06304931640625, -2.939117431640625, -2.815185546875, -2.691253662109375, -2.56732177734375, -2.443389892578125, -2.3194580078125, -2.195526123046875, -2.07159423828125, -1.947662353515625, -1.82373046875, -1.699798583984375, -1.57586669921875, -1.451934814453125, -1.3280029296875, -1.204071044921875, -1.08013916015625, -0.956207275390625, -0.832275390625, -0.708343505859375, -0.58441162109375, -0.460479736328125, -0.3365478515625, -0.212615966796875, -0.08868408203125, 0.035247802734375, 0.1591796875, 0.283111572265625, 0.40704345703125, 0.530975341796875, 0.6549072265625, 0.778839111328125, 0.90277099609375, 1.026702880859375, 1.150634765625, 1.274566650390625, 1.39849853515625, 1.522430419921875, 1.6463623046875, 1.770294189453125, 1.89422607421875, 2.018157958984375, 2.14208984375, 2.266021728515625, 2.38995361328125, 2.513885498046875, 2.6378173828125, 2.761749267578125, 2.88568115234375, 3.009613037109375, 3.133544921875, 3.257476806640625, 3.38140869140625, 3.505340576171875, 3.6292724609375, 3.753204345703125, 3.87713623046875, 4.001068115234375, 4.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 2.0, 10.0, 14.0, 16.0, 11.0, 17.0, 29.0, 24.0, 37.0, 30.0, 37.0, 55.0, 46.0, 56.0, 55.0, 58.0, 49.0, 52.0, 51.0, 46.0, 47.0, 42.0, 37.0, 34.0, 37.0, 27.0, 21.0, 13.0, 12.0, 8.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.09765625, -2.0394134521484375, -1.981170654296875, -1.9229278564453125, -1.86468505859375, -1.8064422607421875, -1.748199462890625, -1.6899566650390625, -1.6317138671875, -1.5734710693359375, -1.515228271484375, -1.4569854736328125, -1.39874267578125, -1.3404998779296875, -1.282257080078125, -1.2240142822265625, -1.165771484375, -1.1075286865234375, -1.049285888671875, -0.9910430908203125, -0.93280029296875, -0.8745574951171875, -0.816314697265625, -0.7580718994140625, -0.6998291015625, -0.6415863037109375, -0.583343505859375, -0.5251007080078125, -0.46685791015625, -0.4086151123046875, -0.350372314453125, -0.2921295166015625, -0.23388671875, -0.1756439208984375, -0.117401123046875, -0.0591583251953125, -0.00091552734375, 0.0573272705078125, 0.115570068359375, 0.1738128662109375, 0.2320556640625, 0.2902984619140625, 0.348541259765625, 0.4067840576171875, 0.46502685546875, 0.5232696533203125, 0.581512451171875, 0.6397552490234375, 0.697998046875, 0.7562408447265625, 0.814483642578125, 0.8727264404296875, 0.93096923828125, 0.9892120361328125, 1.047454833984375, 1.1056976318359375, 1.1639404296875, 1.2221832275390625, 1.280426025390625, 1.3386688232421875, 1.39691162109375, 1.4551544189453125, 1.513397216796875, 1.5716400146484375, 1.6298828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 15.0, 18.0, 27.0, 27.0, 47.0, 72.0, 100.0, 161.0, 301.0, 481.0, 998.0, 2225.0, 5333.0, 14975.0, 55191.0, 409637.0, 3402055.0, 242913.0, 40631.0, 11417.0, 4124.0, 1687.0, 820.0, 417.0, 224.0, 133.0, 81.0, 51.0, 32.0, 12.0, 14.0, 22.0, 7.0, 8.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.1644287109375, -4.012451171875, -3.8604736328125, -3.70849609375, -3.5565185546875, -3.404541015625, -3.2525634765625, -3.1005859375, -2.9486083984375, -2.796630859375, -2.6446533203125, -2.49267578125, -2.3406982421875, -2.188720703125, -2.0367431640625, -1.884765625, -1.7327880859375, -1.580810546875, -1.4288330078125, -1.27685546875, -1.1248779296875, -0.972900390625, -0.8209228515625, -0.6689453125, -0.5169677734375, -0.364990234375, -0.2130126953125, -0.06103515625, 0.0909423828125, 0.242919921875, 0.3948974609375, 0.546875, 0.6988525390625, 0.850830078125, 1.0028076171875, 1.15478515625, 1.3067626953125, 1.458740234375, 1.6107177734375, 1.7626953125, 1.9146728515625, 2.066650390625, 2.2186279296875, 2.37060546875, 2.5225830078125, 2.674560546875, 2.8265380859375, 2.978515625, 3.1304931640625, 3.282470703125, 3.4344482421875, 3.58642578125, 3.7384033203125, 3.890380859375, 4.0423583984375, 4.1943359375, 4.3463134765625, 4.498291015625, 4.6502685546875, 4.80224609375, 4.9542236328125, 5.106201171875, 5.2581787109375, 5.41015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 11.0, 23.0, 23.0, 22.0, 47.0, 54.0, 94.0, 160.0, 294.0, 828.0, 1213.0, 620.0, 307.0, 144.0, 71.0, 44.0, 32.0, 14.0, 16.0, 6.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7998046875, -5.615234375, -5.4306640625, -5.24609375, -5.0615234375, -4.876953125, -4.6923828125, -4.5078125, -4.3232421875, -4.138671875, -3.9541015625, -3.76953125, -3.5849609375, -3.400390625, -3.2158203125, -3.03125, -2.8466796875, -2.662109375, -2.4775390625, -2.29296875, -2.1083984375, -1.923828125, -1.7392578125, -1.5546875, -1.3701171875, -1.185546875, -1.0009765625, -0.81640625, -0.6318359375, -0.447265625, -0.2626953125, -0.078125, 0.1064453125, 0.291015625, 0.4755859375, 0.66015625, 0.8447265625, 1.029296875, 1.2138671875, 1.3984375, 1.5830078125, 1.767578125, 1.9521484375, 2.13671875, 2.3212890625, 2.505859375, 2.6904296875, 2.875, 3.0595703125, 3.244140625, 3.4287109375, 3.61328125, 3.7978515625, 3.982421875, 4.1669921875, 4.3515625, 4.5361328125, 4.720703125, 4.9052734375, 5.08984375, 5.2744140625, 5.458984375, 5.6435546875, 5.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 0.0, 3.0, 4.0, 8.0, 6.0, 12.0, 20.0, 20.0, 42.0, 57.0, 116.0, 174.0, 215.0, 155.0, 85.0, 41.0, 16.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.24077606201172, -80.50762176513672, -78.77445983886719, -77.04130554199219, -75.30814361572266, -73.57498931884766, -71.84182739257812, -70.10867309570312, -68.3755111694336, -66.6423568725586, -64.90919494628906, -63.1760368347168, -61.44287872314453, -59.709720611572266, -57.9765625, -56.243404388427734, -54.51024627685547, -52.7770881652832, -51.04393005371094, -49.31077194213867, -47.577613830566406, -45.84445571899414, -44.111297607421875, -42.37813949584961, -40.64498519897461, -38.911827087402344, -37.17866897583008, -35.44551086425781, -33.71235275268555, -31.97919464111328, -30.246036529541016, -28.51287841796875, -26.779720306396484, -25.04656219482422, -23.313404083251953, -21.580245971679688, -19.847087860107422, -18.113929748535156, -16.38077163696289, -14.647614479064941, -12.914456367492676, -11.18129825592041, -9.448140144348145, -7.714982509613037, -5.9818243980407715, -4.248666763305664, -2.5155086517333984, -0.7823505401611328, 0.9508075714111328, 2.6839656829833984, 4.417123794555664, 6.1502814292907715, 7.883439540863037, 9.616597175598145, 11.34975528717041, 13.082913398742676, 14.816071510314941, 16.54922866821289, 18.282386779785156, 20.015544891357422, 21.748703002929688, 23.481861114501953, 25.21501922607422, 26.948177337646484, 28.68133544921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 15.0, 22.0, 22.0, 17.0, 25.0, 30.0, 24.0, 26.0, 39.0, 39.0, 31.0, 36.0, 38.0, 47.0, 38.0, 37.0, 43.0, 40.0, 33.0, 48.0, 38.0, 36.0, 38.0, 29.0, 39.0, 24.0, 24.0, 19.0, 18.0, 19.0, 6.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.709545135498047, -22.95271110534668, -22.195877075195312, -21.439043045043945, -20.682209014892578, -19.92537498474121, -19.168540954589844, -18.41170883178711, -17.65487289428711, -16.898038864135742, -16.141204833984375, -15.384370803833008, -14.62753677368164, -13.870702743530273, -13.113869667053223, -12.357035636901855, -11.600202560424805, -10.843368530273438, -10.08653450012207, -9.329700469970703, -8.572866439819336, -7.816032886505127, -7.059199333190918, -6.302365303039551, -5.545531272888184, -4.788697242736816, -4.031863212585449, -3.2750296592712402, -2.518195629119873, -1.7613615989685059, -1.0045280456542969, -0.2476940155029297, 0.5091381072998047, 1.2659720182418823, 2.02280592918396, 2.779639720916748, 3.5364737510681152, 4.293307781219482, 5.050141334533691, 5.806975364685059, 6.563809394836426, 7.320643424987793, 8.07747745513916, 8.834310531616211, 9.591144561767578, 10.347978591918945, 11.104812622070312, 11.86164665222168, 12.618480682373047, 13.375314712524414, 14.132148742675781, 14.888982772827148, 15.645816802978516, 16.402650833129883, 17.15948486328125, 17.916316986083984, 18.673152923583984, 19.42998695373535, 20.18682098388672, 20.943655014038086, 21.700489044189453, 22.45732307434082, 23.214157104492188, 23.970989227294922, 24.72782325744629]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 5.0, 18.0, 22.0, 35.0, 52.0, 85.0, 157.0, 235.0, 412.0, 721.0, 1248.0, 2263.0, 4441.0, 9073.0, 20757.0, 54174.0, 214790.0, 534412.0, 134038.0, 40176.0, 15953.0, 7209.0, 3651.0, 1978.0, 1121.0, 604.0, 347.0, 201.0, 146.0, 94.0, 45.0, 36.0, 16.0, 19.0, 14.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.82275390625, -4.6689453125, -4.51513671875, -4.361328125, -4.20751953125, -4.0537109375, -3.89990234375, -3.74609375, -3.59228515625, -3.4384765625, -3.28466796875, -3.130859375, -2.97705078125, -2.8232421875, -2.66943359375, -2.515625, -2.36181640625, -2.2080078125, -2.05419921875, -1.900390625, -1.74658203125, -1.5927734375, -1.43896484375, -1.28515625, -1.13134765625, -0.9775390625, -0.82373046875, -0.669921875, -0.51611328125, -0.3623046875, -0.20849609375, -0.0546875, 0.09912109375, 0.2529296875, 0.40673828125, 0.560546875, 0.71435546875, 0.8681640625, 1.02197265625, 1.17578125, 1.32958984375, 1.4833984375, 1.63720703125, 1.791015625, 1.94482421875, 2.0986328125, 2.25244140625, 2.40625, 2.56005859375, 2.7138671875, 2.86767578125, 3.021484375, 3.17529296875, 3.3291015625, 3.48291015625, 3.63671875, 3.79052734375, 3.9443359375, 4.09814453125, 4.251953125, 4.40576171875, 4.5595703125, 4.71337890625, 4.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 9.0, 17.0, 14.0, 19.0, 28.0, 26.0, 32.0, 30.0, 35.0, 35.0, 41.0, 43.0, 52.0, 40.0, 56.0, 55.0, 53.0, 48.0, 60.0, 39.0, 34.0, 32.0, 31.0, 29.0, 25.0, 22.0, 24.0, 16.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.172637939453125, -2.11480712890625, -2.056976318359375, -1.9991455078125, -1.941314697265625, -1.88348388671875, -1.825653076171875, -1.767822265625, -1.709991455078125, -1.65216064453125, -1.594329833984375, -1.5364990234375, -1.478668212890625, -1.42083740234375, -1.363006591796875, -1.30517578125, -1.247344970703125, -1.18951416015625, -1.131683349609375, -1.0738525390625, -1.016021728515625, -0.95819091796875, -0.900360107421875, -0.842529296875, -0.784698486328125, -0.72686767578125, -0.669036865234375, -0.6112060546875, -0.553375244140625, -0.49554443359375, -0.437713623046875, -0.3798828125, -0.322052001953125, -0.26422119140625, -0.206390380859375, -0.1485595703125, -0.090728759765625, -0.03289794921875, 0.024932861328125, 0.082763671875, 0.140594482421875, 0.19842529296875, 0.256256103515625, 0.3140869140625, 0.371917724609375, 0.42974853515625, 0.487579345703125, 0.54541015625, 0.603240966796875, 0.66107177734375, 0.718902587890625, 0.7767333984375, 0.834564208984375, 0.89239501953125, 0.950225830078125, 1.008056640625, 1.065887451171875, 1.12371826171875, 1.181549072265625, 1.2393798828125, 1.297210693359375, 1.35504150390625, 1.412872314453125, 1.470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 4.0, 9.0, 9.0, 20.0, 25.0, 39.0, 57.0, 91.0, 131.0, 209.0, 348.0, 601.0, 1139.0, 2652.0, 9504.0, 72258.0, 869258.0, 76908.0, 9888.0, 2738.0, 1208.0, 542.0, 314.0, 207.0, 131.0, 68.0, 65.0, 45.0, 19.0, 19.0, 14.0, 13.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0440673828125, -7.728759765625, -7.4134521484375, -7.09814453125, -6.7828369140625, -6.467529296875, -6.1522216796875, -5.8369140625, -5.5216064453125, -5.206298828125, -4.8909912109375, -4.57568359375, -4.2603759765625, -3.945068359375, -3.6297607421875, -3.314453125, -2.9991455078125, -2.683837890625, -2.3685302734375, -2.05322265625, -1.7379150390625, -1.422607421875, -1.1072998046875, -0.7919921875, -0.4766845703125, -0.161376953125, 0.1539306640625, 0.46923828125, 0.7845458984375, 1.099853515625, 1.4151611328125, 1.73046875, 2.0457763671875, 2.361083984375, 2.6763916015625, 2.99169921875, 3.3070068359375, 3.622314453125, 3.9376220703125, 4.2529296875, 4.5682373046875, 4.883544921875, 5.1988525390625, 5.51416015625, 5.8294677734375, 6.144775390625, 6.4600830078125, 6.775390625, 7.0906982421875, 7.406005859375, 7.7213134765625, 8.03662109375, 8.3519287109375, 8.667236328125, 8.9825439453125, 9.2978515625, 9.6131591796875, 9.928466796875, 10.2437744140625, 10.55908203125, 10.8743896484375, 11.189697265625, 11.5050048828125, 11.8203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 9.0, 6.0, 8.0, 3.0, 7.0, 9.0, 13.0, 13.0, 17.0, 25.0, 42.0, 27.0, 33.0, 40.0, 44.0, 57.0, 56.0, 57.0, 42.0, 48.0, 47.0, 55.0, 58.0, 44.0, 53.0, 37.0, 24.0, 35.0, 24.0, 19.0, 19.0, 6.0, 7.0, 4.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.89453125, -7.63128662109375, -7.3680419921875, -7.10479736328125, -6.841552734375, -6.57830810546875, -6.3150634765625, -6.05181884765625, -5.78857421875, -5.52532958984375, -5.2620849609375, -4.99884033203125, -4.735595703125, -4.47235107421875, -4.2091064453125, -3.94586181640625, -3.6826171875, -3.41937255859375, -3.1561279296875, -2.89288330078125, -2.629638671875, -2.36639404296875, -2.1031494140625, -1.83990478515625, -1.57666015625, -1.31341552734375, -1.0501708984375, -0.78692626953125, -0.523681640625, -0.26043701171875, 0.0028076171875, 0.26605224609375, 0.529296875, 0.79254150390625, 1.0557861328125, 1.31903076171875, 1.582275390625, 1.84552001953125, 2.1087646484375, 2.37200927734375, 2.63525390625, 2.89849853515625, 3.1617431640625, 3.42498779296875, 3.688232421875, 3.95147705078125, 4.2147216796875, 4.47796630859375, 4.7412109375, 5.00445556640625, 5.2677001953125, 5.53094482421875, 5.794189453125, 6.05743408203125, 6.3206787109375, 6.58392333984375, 6.84716796875, 7.11041259765625, 7.3736572265625, 7.63690185546875, 7.900146484375, 8.16339111328125, 8.4266357421875, 8.68988037109375, 8.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 16.0, 18.0, 25.0, 36.0, 51.0, 100.0, 166.0, 326.0, 588.0, 1319.0, 3443.0, 10184.0, 37700.0, 444717.0, 494895.0, 38450.0, 10274.0, 3521.0, 1364.0, 589.0, 293.0, 178.0, 99.0, 52.0, 32.0, 24.0, 19.0, 14.0, 13.0, 8.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0], "bins": [-5.20703125, -5.080047607421875, -4.95306396484375, -4.826080322265625, -4.6990966796875, -4.572113037109375, -4.44512939453125, -4.318145751953125, -4.191162109375, -4.064178466796875, -3.93719482421875, -3.810211181640625, -3.6832275390625, -3.556243896484375, -3.42926025390625, -3.302276611328125, -3.17529296875, -3.048309326171875, -2.92132568359375, -2.794342041015625, -2.6673583984375, -2.540374755859375, -2.41339111328125, -2.286407470703125, -2.159423828125, -2.032440185546875, -1.90545654296875, -1.778472900390625, -1.6514892578125, -1.524505615234375, -1.39752197265625, -1.270538330078125, -1.1435546875, -1.016571044921875, -0.88958740234375, -0.762603759765625, -0.6356201171875, -0.508636474609375, -0.38165283203125, -0.254669189453125, -0.127685546875, -0.000701904296875, 0.12628173828125, 0.253265380859375, 0.3802490234375, 0.507232666015625, 0.63421630859375, 0.761199951171875, 0.88818359375, 1.015167236328125, 1.14215087890625, 1.269134521484375, 1.3961181640625, 1.523101806640625, 1.65008544921875, 1.777069091796875, 1.904052734375, 2.031036376953125, 2.15802001953125, 2.285003662109375, 2.4119873046875, 2.538970947265625, 2.66595458984375, 2.792938232421875, 2.919921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 5.0, 6.0, 6.0, 7.0, 19.0, 17.0, 35.0, 38.0, 72.0, 198.0, 271.0, 134.0, 54.0, 27.0, 25.0, 17.0, 11.0, 5.0, 9.0, 4.0, 7.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011396408081054688, -0.0011032074689865112, -0.0010667741298675537, -0.0010303407907485962, -0.0009939074516296387, -0.0009574741125106812, -0.0009210407733917236, -0.0008846074342727661, -0.0008481740951538086, -0.0008117407560348511, -0.0007753074169158936, -0.000738874077796936, -0.0007024407386779785, -0.000666007399559021, -0.0006295740604400635, -0.000593140721321106, -0.0005567073822021484, -0.0005202740430831909, -0.0004838407039642334, -0.0004474073648452759, -0.00041097402572631836, -0.00037454068660736084, -0.0003381073474884033, -0.0003016740083694458, -0.0002652406692504883, -0.00022880733013153076, -0.00019237399101257324, -0.00015594065189361572, -0.0001195073127746582, -8.307397365570068e-05, -4.6640634536743164e-05, -1.0207295417785645e-05, 2.6226043701171875e-05, 6.26593828201294e-05, 9.909272193908691e-05, 0.00013552606105804443, 0.00017195940017700195, 0.00020839273929595947, 0.000244826078414917, 0.0002812594175338745, 0.00031769275665283203, 0.00035412609577178955, 0.00039055943489074707, 0.0004269927740097046, 0.0004634261131286621, 0.0004998594522476196, 0.0005362927913665771, 0.0005727261304855347, 0.0006091594696044922, 0.0006455928087234497, 0.0006820261478424072, 0.0007184594869613647, 0.0007548928260803223, 0.0007913261651992798, 0.0008277595043182373, 0.0008641928434371948, 0.0009006261825561523, 0.0009370595216751099, 0.0009734928607940674, 0.001009926199913025, 0.0010463595390319824, 0.00108279287815094, 0.0011192262172698975, 0.001155659556388855, 0.0011920928955078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 9.0, 8.0, 21.0, 19.0, 33.0, 45.0, 107.0, 160.0, 276.0, 534.0, 1222.0, 3217.0, 11507.0, 71179.0, 830680.0, 108069.0, 14768.0, 3920.0, 1381.0, 632.0, 300.0, 181.0, 90.0, 67.0, 41.0, 28.0, 18.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.015625, -4.86627197265625, -4.7169189453125, -4.56756591796875, -4.418212890625, -4.26885986328125, -4.1195068359375, -3.97015380859375, -3.82080078125, -3.67144775390625, -3.5220947265625, -3.37274169921875, -3.223388671875, -3.07403564453125, -2.9246826171875, -2.77532958984375, -2.6259765625, -2.47662353515625, -2.3272705078125, -2.17791748046875, -2.028564453125, -1.87921142578125, -1.7298583984375, -1.58050537109375, -1.43115234375, -1.28179931640625, -1.1324462890625, -0.98309326171875, -0.833740234375, -0.68438720703125, -0.5350341796875, -0.38568115234375, -0.236328125, -0.08697509765625, 0.0623779296875, 0.21173095703125, 0.361083984375, 0.51043701171875, 0.6597900390625, 0.80914306640625, 0.95849609375, 1.10784912109375, 1.2572021484375, 1.40655517578125, 1.555908203125, 1.70526123046875, 1.8546142578125, 2.00396728515625, 2.1533203125, 2.30267333984375, 2.4520263671875, 2.60137939453125, 2.750732421875, 2.90008544921875, 3.0494384765625, 3.19879150390625, 3.34814453125, 3.49749755859375, 3.6468505859375, 3.79620361328125, 3.945556640625, 4.09490966796875, 4.2442626953125, 4.39361572265625, 4.54296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 6.0, 7.0, 12.0, 16.0, 18.0, 26.0, 38.0, 45.0, 65.0, 97.0, 123.0, 114.0, 110.0, 81.0, 51.0, 45.0, 31.0, 29.0, 21.0, 13.0, 7.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.39666748046875, -2.2933349609375, -2.19000244140625, -2.086669921875, -1.98333740234375, -1.8800048828125, -1.77667236328125, -1.67333984375, -1.57000732421875, -1.4666748046875, -1.36334228515625, -1.260009765625, -1.15667724609375, -1.0533447265625, -0.95001220703125, -0.8466796875, -0.74334716796875, -0.6400146484375, -0.53668212890625, -0.433349609375, -0.33001708984375, -0.2266845703125, -0.12335205078125, -0.02001953125, 0.08331298828125, 0.1866455078125, 0.28997802734375, 0.393310546875, 0.49664306640625, 0.5999755859375, 0.70330810546875, 0.806640625, 0.90997314453125, 1.0133056640625, 1.11663818359375, 1.219970703125, 1.32330322265625, 1.4266357421875, 1.52996826171875, 1.63330078125, 1.73663330078125, 1.8399658203125, 1.94329833984375, 2.046630859375, 2.14996337890625, 2.2532958984375, 2.35662841796875, 2.4599609375, 2.56329345703125, 2.6666259765625, 2.76995849609375, 2.873291015625, 2.97662353515625, 3.0799560546875, 3.18328857421875, 3.28662109375, 3.38995361328125, 3.4932861328125, 3.59661865234375, 3.699951171875, 3.80328369140625, 3.9066162109375, 4.00994873046875, 4.11328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 1.0, 5.0, 5.0, 13.0, 26.0, 42.0, 83.0, 93.0, 141.0, 159.0, 139.0, 94.0, 75.0, 42.0, 32.0, 14.0, 11.0, 5.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.12789535522461, -34.59796905517578, -33.06803894042969, -31.53811264038086, -30.00818634033203, -28.47825813293457, -26.94832992553711, -25.41840362548828, -23.88847541809082, -22.35854721069336, -20.82862091064453, -19.29869270324707, -17.76876449584961, -16.23883819580078, -14.70890998840332, -13.178982734680176, -11.649055480957031, -10.119128227233887, -8.589200973510742, -7.059272766113281, -5.529345512390137, -3.999418258666992, -2.4694900512695312, -0.9395627975463867, 0.5903644561767578, 2.1202919483184814, 3.650219440460205, 5.180147171020508, 6.710074424743652, 8.240001678466797, 9.769929885864258, 11.299857139587402, 12.829784393310547, 14.359711647033691, 15.889638900756836, 17.419567108154297, 18.949493408203125, 20.479421615600586, 22.009349822998047, 23.539276123046875, 25.069204330444336, 26.599132537841797, 28.129058837890625, 29.658987045288086, 31.188915252685547, 32.718841552734375, 34.24877166748047, 35.7786979675293, 37.308624267578125, 38.83855056762695, 40.36848068237305, 41.898406982421875, 43.4283332824707, 44.95825958251953, 46.488189697265625, 48.01811599731445, 49.54804229736328, 51.07796859741211, 52.6078987121582, 54.13782501220703, 55.66775131225586, 57.19767761230469, 58.72760772705078, 60.25753402709961, 61.7874641418457]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 5.0, 9.0, 9.0, 16.0, 8.0, 18.0, 15.0, 26.0, 17.0, 15.0, 18.0, 27.0, 29.0, 26.0, 29.0, 33.0, 52.0, 42.0, 47.0, 41.0, 47.0, 49.0, 43.0, 50.0, 31.0, 35.0, 24.0, 31.0, 41.0, 22.0, 15.0, 23.0, 16.0, 16.0, 10.0, 16.0, 10.0, 8.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.409465789794922, -26.574079513549805, -25.738693237304688, -24.903305053710938, -24.06791877746582, -23.232532501220703, -22.397144317626953, -21.561758041381836, -20.72637176513672, -19.8909854888916, -19.055599212646484, -18.220211029052734, -17.384824752807617, -16.5494384765625, -15.714051246643066, -14.878664016723633, -14.043277740478516, -13.207891464233398, -12.372504234313965, -11.537117004394531, -10.701730728149414, -9.866344451904297, -9.030957221984863, -8.19556999206543, -7.3601837158203125, -6.524796962738037, -5.689410209655762, -4.854023456573486, -4.018636703491211, -3.1832499504089355, -2.34786319732666, -1.5124764442443848, -0.6770896911621094, 0.15829706192016602, 0.9936838150024414, 1.8290705680847168, 2.664457321166992, 3.4998440742492676, 4.335230827331543, 5.170617580413818, 6.006004333496094, 6.841391086578369, 7.6767778396606445, 8.512165069580078, 9.347551345825195, 10.182937622070312, 11.018324851989746, 11.85371208190918, 12.689098358154297, 13.524484634399414, 14.359871864318848, 15.195259094238281, 16.0306453704834, 16.866031646728516, 17.701419830322266, 18.536806106567383, 19.3721923828125, 20.207578659057617, 21.042964935302734, 21.878353118896484, 22.7137393951416, 23.54912567138672, 24.38451385498047, 25.219900131225586, 26.055286407470703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 10.0, 19.0, 21.0, 19.0, 36.0, 46.0, 72.0, 77.0, 130.0, 240.0, 795.0, 9504.0, 2650207.0, 1523389.0, 8351.0, 713.0, 200.0, 132.0, 76.0, 54.0, 47.0, 37.0, 20.0, 17.0, 21.0, 11.0, 6.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.2342529296875, -9.788818359375, -9.3433837890625, -8.89794921875, -8.4525146484375, -8.007080078125, -7.5616455078125, -7.1162109375, -6.6707763671875, -6.225341796875, -5.7799072265625, -5.33447265625, -4.8890380859375, -4.443603515625, -3.9981689453125, -3.552734375, -3.1072998046875, -2.661865234375, -2.2164306640625, -1.77099609375, -1.3255615234375, -0.880126953125, -0.4346923828125, 0.0107421875, 0.4561767578125, 0.901611328125, 1.3470458984375, 1.79248046875, 2.2379150390625, 2.683349609375, 3.1287841796875, 3.57421875, 4.0196533203125, 4.465087890625, 4.9105224609375, 5.35595703125, 5.8013916015625, 6.246826171875, 6.6922607421875, 7.1376953125, 7.5831298828125, 8.028564453125, 8.4739990234375, 8.91943359375, 9.3648681640625, 9.810302734375, 10.2557373046875, 10.701171875, 11.1466064453125, 11.592041015625, 12.0374755859375, 12.48291015625, 12.9283447265625, 13.373779296875, 13.8192138671875, 14.2646484375, 14.7100830078125, 15.155517578125, 15.6009521484375, 16.04638671875, 16.4918212890625, 16.937255859375, 17.3826904296875, 17.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 8.0, 15.0, 19.0, 16.0, 20.0, 22.0, 34.0, 45.0, 34.0, 42.0, 54.0, 58.0, 59.0, 76.0, 39.0, 50.0, 52.0, 58.0, 60.0, 44.0, 26.0, 31.0, 35.0, 20.0, 20.0, 17.0, 7.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.12127685546875, -2.0589599609375, -1.99664306640625, -1.934326171875, -1.87200927734375, -1.8096923828125, -1.74737548828125, -1.68505859375, -1.62274169921875, -1.5604248046875, -1.49810791015625, -1.435791015625, -1.37347412109375, -1.3111572265625, -1.24884033203125, -1.1865234375, -1.12420654296875, -1.0618896484375, -0.99957275390625, -0.937255859375, -0.87493896484375, -0.8126220703125, -0.75030517578125, -0.68798828125, -0.62567138671875, -0.5633544921875, -0.50103759765625, -0.438720703125, -0.37640380859375, -0.3140869140625, -0.25177001953125, -0.189453125, -0.12713623046875, -0.0648193359375, -0.00250244140625, 0.059814453125, 0.12213134765625, 0.1844482421875, 0.24676513671875, 0.30908203125, 0.37139892578125, 0.4337158203125, 0.49603271484375, 0.558349609375, 0.62066650390625, 0.6829833984375, 0.74530029296875, 0.8076171875, 0.86993408203125, 0.9322509765625, 0.99456787109375, 1.056884765625, 1.11920166015625, 1.1815185546875, 1.24383544921875, 1.30615234375, 1.36846923828125, 1.4307861328125, 1.49310302734375, 1.555419921875, 1.61773681640625, 1.6800537109375, 1.74237060546875, 1.8046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 19.0, 34.0, 31.0, 53.0, 92.0, 174.0, 239.0, 436.0, 855.0, 1449.0, 2980.0, 5939.0, 12725.0, 31139.0, 94880.0, 517164.0, 2870596.0, 505603.0, 94379.0, 30657.0, 12413.0, 5840.0, 2870.0, 1581.0, 848.0, 492.0, 281.0, 190.0, 104.0, 70.0, 37.0, 27.0, 20.0, 10.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.139251708984375, -3.03631591796875, -2.933380126953125, -2.8304443359375, -2.727508544921875, -2.62457275390625, -2.521636962890625, -2.418701171875, -2.315765380859375, -2.21282958984375, -2.109893798828125, -2.0069580078125, -1.904022216796875, -1.80108642578125, -1.698150634765625, -1.59521484375, -1.492279052734375, -1.38934326171875, -1.286407470703125, -1.1834716796875, -1.080535888671875, -0.97760009765625, -0.874664306640625, -0.771728515625, -0.668792724609375, -0.56585693359375, -0.462921142578125, -0.3599853515625, -0.257049560546875, -0.15411376953125, -0.051177978515625, 0.0517578125, 0.154693603515625, 0.25762939453125, 0.360565185546875, 0.4635009765625, 0.566436767578125, 0.66937255859375, 0.772308349609375, 0.875244140625, 0.978179931640625, 1.08111572265625, 1.184051513671875, 1.2869873046875, 1.389923095703125, 1.49285888671875, 1.595794677734375, 1.69873046875, 1.801666259765625, 1.90460205078125, 2.007537841796875, 2.1104736328125, 2.213409423828125, 2.31634521484375, 2.419281005859375, 2.522216796875, 2.625152587890625, 2.72808837890625, 2.831024169921875, 2.9339599609375, 3.036895751953125, 3.13983154296875, 3.242767333984375, 3.345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 11.0, 12.0, 10.0, 18.0, 15.0, 32.0, 38.0, 58.0, 74.0, 119.0, 203.0, 368.0, 654.0, 878.0, 601.0, 346.0, 219.0, 130.0, 73.0, 50.0, 36.0, 27.0, 19.0, 21.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.69921875, -3.56488037109375, -3.4305419921875, -3.29620361328125, -3.161865234375, -3.02752685546875, -2.8931884765625, -2.75885009765625, -2.62451171875, -2.49017333984375, -2.3558349609375, -2.22149658203125, -2.087158203125, -1.95281982421875, -1.8184814453125, -1.68414306640625, -1.5498046875, -1.41546630859375, -1.2811279296875, -1.14678955078125, -1.012451171875, -0.87811279296875, -0.7437744140625, -0.60943603515625, -0.47509765625, -0.34075927734375, -0.2064208984375, -0.07208251953125, 0.062255859375, 0.19659423828125, 0.3309326171875, 0.46527099609375, 0.599609375, 0.73394775390625, 0.8682861328125, 1.00262451171875, 1.136962890625, 1.27130126953125, 1.4056396484375, 1.53997802734375, 1.67431640625, 1.80865478515625, 1.9429931640625, 2.07733154296875, 2.211669921875, 2.34600830078125, 2.4803466796875, 2.61468505859375, 2.7490234375, 2.88336181640625, 3.0177001953125, 3.15203857421875, 3.286376953125, 3.42071533203125, 3.5550537109375, 3.68939208984375, 3.82373046875, 3.95806884765625, 4.0924072265625, 4.22674560546875, 4.361083984375, 4.49542236328125, 4.6297607421875, 4.76409912109375, 4.8984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 37.0, 132.0, 365.0, 326.0, 84.0, 31.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.76509094238281, -65.88572692871094, -63.006370544433594, -60.127010345458984, -57.247650146484375, -54.368289947509766, -51.488929748535156, -48.60956573486328, -45.73020935058594, -42.85084915161133, -39.97148895263672, -37.09212875366211, -34.2127685546875, -31.33340835571289, -28.45404624938965, -25.57468605041504, -22.695323944091797, -19.815963745117188, -16.936603546142578, -14.057242393493652, -11.177882194519043, -8.298521995544434, -5.419160842895508, -2.5398006439208984, 0.33955955505371094, 3.2189199924468994, 6.098280429840088, 8.977641105651855, 11.857001304626465, 14.736361503601074, 17.61572265625, 20.49508285522461, 23.37444305419922, 26.253803253173828, 29.133163452148438, 32.01252365112305, 34.891883850097656, 37.771244049072266, 40.650604248046875, 43.52996826171875, 46.409324645996094, 49.2886848449707, 52.16804504394531, 55.04740524291992, 57.92676544189453, 60.80612564086914, 63.68548583984375, 66.56484985351562, 69.4442138671875, 72.32357788085938, 75.20293426513672, 78.0822982788086, 80.96165466308594, 83.84101867675781, 86.72037506103516, 89.59973907470703, 92.47909545898438, 95.35845947265625, 98.2378158569336, 101.11717987060547, 103.99653625488281, 106.87590026855469, 109.75525665283203, 112.6346206665039, 115.51397705078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 4.0, 7.0, 7.0, 4.0, 9.0, 6.0, 15.0, 10.0, 13.0, 19.0, 24.0, 20.0, 30.0, 25.0, 30.0, 28.0, 52.0, 44.0, 28.0, 51.0, 36.0, 41.0, 46.0, 44.0, 35.0, 37.0, 46.0, 36.0, 29.0, 33.0, 17.0, 28.0, 20.0, 21.0, 19.0, 11.0, 7.0, 7.0, 9.0, 5.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.872273445129395, -15.355517387390137, -14.838761329650879, -14.322005271911621, -13.805248260498047, -13.288492202758789, -12.771736145019531, -12.254980087280273, -11.738224029541016, -11.221467971801758, -10.7047119140625, -10.187955856323242, -9.671199798583984, -9.154443740844727, -8.637686729431152, -8.120930671691895, -7.604174613952637, -7.087418556213379, -6.570662498474121, -6.053905963897705, -5.537149906158447, -5.0203938484191895, -4.503637313842773, -3.9868812561035156, -3.470125198364258, -2.953369140625, -2.436612844467163, -1.9198566675186157, -1.4031004905700684, -0.8863444328308105, -0.36958813667297363, 0.14716815948486328, 0.6639251708984375, 1.1806813478469849, 1.6974375247955322, 2.214193820953369, 2.730949878692627, 3.2477059364318848, 3.7644622325897217, 4.281218528747559, 4.797974586486816, 5.314730644226074, 5.831486701965332, 6.348243236541748, 6.864999294281006, 7.381755352020264, 7.89851188659668, 8.415267944335938, 8.932024002075195, 9.448780059814453, 9.965536117553711, 10.482292175292969, 10.999048233032227, 11.515804290771484, 12.032561302185059, 12.549317359924316, 13.066073417663574, 13.582829475402832, 14.09958553314209, 14.616341590881348, 15.133098602294922, 15.64985466003418, 16.166610717773438, 16.683366775512695, 17.200122833251953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 7.0, 9.0, 17.0, 29.0, 28.0, 44.0, 75.0, 90.0, 134.0, 217.0, 344.0, 540.0, 895.0, 1813.0, 3478.0, 7481.0, 17962.0, 48083.0, 196729.0, 561021.0, 141883.0, 39349.0, 15144.0, 6389.0, 3085.0, 1553.0, 773.0, 466.0, 274.0, 203.0, 145.0, 79.0, 67.0, 35.0, 24.0, 26.0, 16.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.386962890625, -4.24267578125, -4.098388671875, -3.9541015625, -3.809814453125, -3.66552734375, -3.521240234375, -3.376953125, -3.232666015625, -3.08837890625, -2.944091796875, -2.7998046875, -2.655517578125, -2.51123046875, -2.366943359375, -2.22265625, -2.078369140625, -1.93408203125, -1.789794921875, -1.6455078125, -1.501220703125, -1.35693359375, -1.212646484375, -1.068359375, -0.924072265625, -0.77978515625, -0.635498046875, -0.4912109375, -0.346923828125, -0.20263671875, -0.058349609375, 0.0859375, 0.230224609375, 0.37451171875, 0.518798828125, 0.6630859375, 0.807373046875, 0.95166015625, 1.095947265625, 1.240234375, 1.384521484375, 1.52880859375, 1.673095703125, 1.8173828125, 1.961669921875, 2.10595703125, 2.250244140625, 2.39453125, 2.538818359375, 2.68310546875, 2.827392578125, 2.9716796875, 3.115966796875, 3.26025390625, 3.404541015625, 3.548828125, 3.693115234375, 3.83740234375, 3.981689453125, 4.1259765625, 4.270263671875, 4.41455078125, 4.558837890625, 4.703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 10.0, 8.0, 19.0, 22.0, 15.0, 17.0, 25.0, 32.0, 32.0, 41.0, 39.0, 47.0, 47.0, 37.0, 50.0, 55.0, 41.0, 47.0, 45.0, 44.0, 33.0, 31.0, 48.0, 27.0, 27.0, 27.0, 25.0, 13.0, 17.0, 17.0, 11.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -2.0131378173828125, -1.959869384765625, -1.9066009521484375, -1.85333251953125, -1.8000640869140625, -1.746795654296875, -1.6935272216796875, -1.6402587890625, -1.5869903564453125, -1.533721923828125, -1.4804534912109375, -1.42718505859375, -1.3739166259765625, -1.320648193359375, -1.2673797607421875, -1.214111328125, -1.1608428955078125, -1.107574462890625, -1.0543060302734375, -1.00103759765625, -0.9477691650390625, -0.894500732421875, -0.8412322998046875, -0.7879638671875, -0.7346954345703125, -0.681427001953125, -0.6281585693359375, -0.57489013671875, -0.5216217041015625, -0.468353271484375, -0.4150848388671875, -0.36181640625, -0.3085479736328125, -0.255279541015625, -0.2020111083984375, -0.14874267578125, -0.0954742431640625, -0.042205810546875, 0.0110626220703125, 0.0643310546875, 0.1175994873046875, 0.170867919921875, 0.2241363525390625, 0.27740478515625, 0.3306732177734375, 0.383941650390625, 0.4372100830078125, 0.490478515625, 0.5437469482421875, 0.597015380859375, 0.6502838134765625, 0.70355224609375, 0.7568206787109375, 0.810089111328125, 0.8633575439453125, 0.9166259765625, 0.9698944091796875, 1.023162841796875, 1.0764312744140625, 1.12969970703125, 1.1829681396484375, 1.236236572265625, 1.2895050048828125, 1.3427734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 10.0, 11.0, 9.0, 15.0, 22.0, 24.0, 33.0, 40.0, 58.0, 99.0, 138.0, 224.0, 344.0, 627.0, 1287.0, 3094.0, 9175.0, 36008.0, 313049.0, 614501.0, 50560.0, 12074.0, 3764.0, 1527.0, 682.0, 421.0, 251.0, 158.0, 103.0, 80.0, 44.0, 36.0, 18.0, 7.0, 15.0, 14.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-7.73046875, -7.527587890625, -7.32470703125, -7.121826171875, -6.9189453125, -6.716064453125, -6.51318359375, -6.310302734375, -6.107421875, -5.904541015625, -5.70166015625, -5.498779296875, -5.2958984375, -5.093017578125, -4.89013671875, -4.687255859375, -4.484375, -4.281494140625, -4.07861328125, -3.875732421875, -3.6728515625, -3.469970703125, -3.26708984375, -3.064208984375, -2.861328125, -2.658447265625, -2.45556640625, -2.252685546875, -2.0498046875, -1.846923828125, -1.64404296875, -1.441162109375, -1.23828125, -1.035400390625, -0.83251953125, -0.629638671875, -0.4267578125, -0.223876953125, -0.02099609375, 0.181884765625, 0.384765625, 0.587646484375, 0.79052734375, 0.993408203125, 1.1962890625, 1.399169921875, 1.60205078125, 1.804931640625, 2.0078125, 2.210693359375, 2.41357421875, 2.616455078125, 2.8193359375, 3.022216796875, 3.22509765625, 3.427978515625, 3.630859375, 3.833740234375, 4.03662109375, 4.239501953125, 4.4423828125, 4.645263671875, 4.84814453125, 5.051025390625, 5.25390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 6.0, 15.0, 10.0, 21.0, 17.0, 28.0, 29.0, 33.0, 44.0, 60.0, 53.0, 59.0, 55.0, 61.0, 69.0, 51.0, 51.0, 51.0, 52.0, 45.0, 29.0, 34.0, 25.0, 22.0, 18.0, 15.0, 7.0, 4.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.0108642578125, -7.756103515625, -7.5013427734375, -7.24658203125, -6.9918212890625, -6.737060546875, -6.4822998046875, -6.2275390625, -5.9727783203125, -5.718017578125, -5.4632568359375, -5.20849609375, -4.9537353515625, -4.698974609375, -4.4442138671875, -4.189453125, -3.9346923828125, -3.679931640625, -3.4251708984375, -3.17041015625, -2.9156494140625, -2.660888671875, -2.4061279296875, -2.1513671875, -1.8966064453125, -1.641845703125, -1.3870849609375, -1.13232421875, -0.8775634765625, -0.622802734375, -0.3680419921875, -0.11328125, 0.1414794921875, 0.396240234375, 0.6510009765625, 0.90576171875, 1.1605224609375, 1.415283203125, 1.6700439453125, 1.9248046875, 2.1795654296875, 2.434326171875, 2.6890869140625, 2.94384765625, 3.1986083984375, 3.453369140625, 3.7081298828125, 3.962890625, 4.2176513671875, 4.472412109375, 4.7271728515625, 4.98193359375, 5.2366943359375, 5.491455078125, 5.7462158203125, 6.0009765625, 6.2557373046875, 6.510498046875, 6.7652587890625, 7.02001953125, 7.2747802734375, 7.529541015625, 7.7843017578125, 8.0390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 17.0, 21.0, 43.0, 85.0, 160.0, 381.0, 1127.0, 3974.0, 22097.0, 589497.0, 405792.0, 19839.0, 3717.0, 1054.0, 388.0, 154.0, 72.0, 42.0, 28.0, 19.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.390625, -6.2177734375, -6.044921875, -5.8720703125, -5.69921875, -5.5263671875, -5.353515625, -5.1806640625, -5.0078125, -4.8349609375, -4.662109375, -4.4892578125, -4.31640625, -4.1435546875, -3.970703125, -3.7978515625, -3.625, -3.4521484375, -3.279296875, -3.1064453125, -2.93359375, -2.7607421875, -2.587890625, -2.4150390625, -2.2421875, -2.0693359375, -1.896484375, -1.7236328125, -1.55078125, -1.3779296875, -1.205078125, -1.0322265625, -0.859375, -0.6865234375, -0.513671875, -0.3408203125, -0.16796875, 0.0048828125, 0.177734375, 0.3505859375, 0.5234375, 0.6962890625, 0.869140625, 1.0419921875, 1.21484375, 1.3876953125, 1.560546875, 1.7333984375, 1.90625, 2.0791015625, 2.251953125, 2.4248046875, 2.59765625, 2.7705078125, 2.943359375, 3.1162109375, 3.2890625, 3.4619140625, 3.634765625, 3.8076171875, 3.98046875, 4.1533203125, 4.326171875, 4.4990234375, 4.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 3.0, 10.0, 14.0, 4.0, 15.0, 13.0, 25.0, 40.0, 59.0, 97.0, 143.0, 184.0, 111.0, 69.0, 49.0, 43.0, 31.0, 14.0, 12.0, 14.0, 3.0, 5.0, 5.0, 11.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00080108642578125, -0.0007783696055412292, -0.0007556527853012085, -0.0007329359650611877, -0.000710219144821167, -0.0006875023245811462, -0.0006647855043411255, -0.0006420686841011047, -0.000619351863861084, -0.0005966350436210632, -0.0005739182233810425, -0.0005512014031410217, -0.000528484582901001, -0.0005057677626609802, -0.00048305094242095947, -0.0004603341221809387, -0.00043761730194091797, -0.0004149004817008972, -0.00039218366146087646, -0.0003694668412208557, -0.00034675002098083496, -0.0003240332007408142, -0.00030131638050079346, -0.0002785995602607727, -0.00025588274002075195, -0.0002331659197807312, -0.00021044909954071045, -0.0001877322793006897, -0.00016501545906066895, -0.0001422986388206482, -0.00011958181858062744, -9.686499834060669e-05, -7.414817810058594e-05, -5.1431357860565186e-05, -2.8714537620544434e-05, -5.997717380523682e-06, 1.671910285949707e-05, 3.943592309951782e-05, 6.215274333953857e-05, 8.486956357955933e-05, 0.00010758638381958008, 0.00013030320405960083, 0.00015302002429962158, 0.00017573684453964233, 0.00019845366477966309, 0.00022117048501968384, 0.0002438873052597046, 0.00026660412549972534, 0.0002893209457397461, 0.00031203776597976685, 0.0003347545862197876, 0.00035747140645980835, 0.0003801882266998291, 0.00040290504693984985, 0.0004256218671798706, 0.00044833868741989136, 0.0004710555076599121, 0.0004937723278999329, 0.0005164891481399536, 0.0005392059683799744, 0.0005619227886199951, 0.0005846396088600159, 0.0006073564291000366, 0.0006300732493400574, 0.0006527900695800781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 12.0, 9.0, 15.0, 34.0, 65.0, 112.0, 148.0, 268.0, 495.0, 948.0, 2083.0, 5288.0, 20155.0, 171669.0, 766134.0, 63127.0, 11299.0, 3522.0, 1484.0, 696.0, 400.0, 223.0, 138.0, 85.0, 44.0, 37.0, 19.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.46875, -3.34619140625, -3.2236328125, -3.10107421875, -2.978515625, -2.85595703125, -2.7333984375, -2.61083984375, -2.48828125, -2.36572265625, -2.2431640625, -2.12060546875, -1.998046875, -1.87548828125, -1.7529296875, -1.63037109375, -1.5078125, -1.38525390625, -1.2626953125, -1.14013671875, -1.017578125, -0.89501953125, -0.7724609375, -0.64990234375, -0.52734375, -0.40478515625, -0.2822265625, -0.15966796875, -0.037109375, 0.08544921875, 0.2080078125, 0.33056640625, 0.453125, 0.57568359375, 0.6982421875, 0.82080078125, 0.943359375, 1.06591796875, 1.1884765625, 1.31103515625, 1.43359375, 1.55615234375, 1.6787109375, 1.80126953125, 1.923828125, 2.04638671875, 2.1689453125, 2.29150390625, 2.4140625, 2.53662109375, 2.6591796875, 2.78173828125, 2.904296875, 3.02685546875, 3.1494140625, 3.27197265625, 3.39453125, 3.51708984375, 3.6396484375, 3.76220703125, 3.884765625, 4.00732421875, 4.1298828125, 4.25244140625, 4.375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 2.0, 13.0, 18.0, 15.0, 19.0, 27.0, 54.0, 75.0, 116.0, 127.0, 130.0, 105.0, 74.0, 55.0, 45.0, 23.0, 17.0, 9.0, 15.0, 10.0, 2.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.506744384765625, -2.41387939453125, -2.321014404296875, -2.2281494140625, -2.135284423828125, -2.04241943359375, -1.949554443359375, -1.856689453125, -1.763824462890625, -1.67095947265625, -1.578094482421875, -1.4852294921875, -1.392364501953125, -1.29949951171875, -1.206634521484375, -1.11376953125, -1.020904541015625, -0.92803955078125, -0.835174560546875, -0.7423095703125, -0.649444580078125, -0.55657958984375, -0.463714599609375, -0.370849609375, -0.277984619140625, -0.18511962890625, -0.092254638671875, 0.0006103515625, 0.093475341796875, 0.18634033203125, 0.279205322265625, 0.3720703125, 0.464935302734375, 0.55780029296875, 0.650665283203125, 0.7435302734375, 0.836395263671875, 0.92926025390625, 1.022125244140625, 1.114990234375, 1.207855224609375, 1.30072021484375, 1.393585205078125, 1.4864501953125, 1.579315185546875, 1.67218017578125, 1.765045166015625, 1.85791015625, 1.950775146484375, 2.04364013671875, 2.136505126953125, 2.2293701171875, 2.322235107421875, 2.41510009765625, 2.507965087890625, 2.600830078125, 2.693695068359375, 2.78656005859375, 2.879425048828125, 2.9722900390625, 3.065155029296875, 3.15802001953125, 3.250885009765625, 3.34375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 38.0, 87.0, 217.0, 337.0, 196.0, 53.0, 25.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.62693786621094, -117.05058288574219, -114.47422790527344, -111.89787292480469, -109.32151794433594, -106.74517059326172, -104.16881561279297, -101.59246063232422, -99.01610565185547, -96.43975067138672, -93.86339569091797, -91.28704071044922, -88.710693359375, -86.13433837890625, -83.5579833984375, -80.98162841796875, -78.4052734375, -75.82891845703125, -73.2525634765625, -70.67620849609375, -68.099853515625, -65.52350616455078, -62.94715118408203, -60.37079620361328, -57.79444122314453, -55.21808624267578, -52.64173126220703, -50.06538009643555, -47.4890251159668, -44.91267013549805, -42.33631896972656, -39.75996398925781, -37.183616638183594, -34.607261657714844, -32.030906677246094, -29.45455551147461, -26.87820053100586, -24.30184555053711, -21.725492477416992, -19.149139404296875, -16.572784423828125, -13.996430397033691, -11.420076370239258, -8.843722343444824, -6.267368316650391, -3.691014289855957, -1.1146602630615234, 1.4616928100585938, 4.038047790527344, 6.614401817321777, 9.190755844116211, 11.767109870910645, 14.343463897705078, 16.919818878173828, 19.496171951293945, 22.072525024414062, 24.648880004882812, 27.225234985351562, 29.80158805847168, 32.3779411315918, 34.95429611206055, 37.5306510925293, 40.10700225830078, 42.68335723876953, 45.25971221923828]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 9.0, 20.0, 21.0, 18.0, 24.0, 19.0, 20.0, 27.0, 28.0, 35.0, 38.0, 55.0, 44.0, 55.0, 68.0, 45.0, 52.0, 38.0, 42.0, 36.0, 36.0, 32.0, 27.0, 21.0, 27.0, 24.0, 18.0, 24.0, 16.0, 7.0, 15.0, 5.0, 9.0, 6.0, 6.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.12070083618164, -24.28488540649414, -23.449068069458008, -22.613252639770508, -21.777437210083008, -20.941619873046875, -20.105804443359375, -19.269989013671875, -18.434173583984375, -17.598358154296875, -16.762540817260742, -15.926725387573242, -15.090909957885742, -14.255093574523926, -13.41927719116211, -12.58346176147461, -11.747644424438477, -10.91182804107666, -10.07601261138916, -9.240196228027344, -8.404380798339844, -7.568564414978027, -6.732748031616211, -5.896932125091553, -5.0611162185668945, -4.225300312042236, -3.389484167098999, -2.5536680221557617, -1.7178521156311035, -0.8820362091064453, -0.046219825744628906, 0.7895960807800293, 1.6254119873046875, 2.4612278938293457, 3.297044038772583, 4.13286018371582, 4.9686760902404785, 5.804491996765137, 6.640308380126953, 7.476124286651611, 8.31194019317627, 9.147756576538086, 9.983572006225586, 10.819388389587402, 11.655204772949219, 12.491020202636719, 13.326836585998535, 14.162652969360352, 14.998468399047852, 15.834284782409668, 16.670101165771484, 17.505916595458984, 18.341732025146484, 19.177547454833984, 20.013364791870117, 20.849180221557617, 21.68499755859375, 22.52081298828125, 23.356630325317383, 24.192445755004883, 25.028261184692383, 25.864078521728516, 26.699893951416016, 27.535709381103516, 28.371524810791016]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 11.0, 12.0, 16.0, 17.0, 51.0, 83.0, 97.0, 175.0, 303.0, 536.0, 938.0, 1821.0, 3442.0, 7060.0, 16181.0, 39772.0, 121458.0, 586430.0, 2406296.0, 776869.0, 150948.0, 47334.0, 18301.0, 8101.0, 3846.0, 1836.0, 985.0, 560.0, 300.0, 191.0, 100.0, 71.0, 40.0, 27.0, 23.0, 15.0, 8.0, 12.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.90374755859375, -2.8172607421875, -2.73077392578125, -2.644287109375, -2.55780029296875, -2.4713134765625, -2.38482666015625, -2.29833984375, -2.21185302734375, -2.1253662109375, -2.03887939453125, -1.952392578125, -1.86590576171875, -1.7794189453125, -1.69293212890625, -1.6064453125, -1.51995849609375, -1.4334716796875, -1.34698486328125, -1.260498046875, -1.17401123046875, -1.0875244140625, -1.00103759765625, -0.91455078125, -0.82806396484375, -0.7415771484375, -0.65509033203125, -0.568603515625, -0.48211669921875, -0.3956298828125, -0.30914306640625, -0.22265625, -0.13616943359375, -0.0496826171875, 0.03680419921875, 0.123291015625, 0.20977783203125, 0.2962646484375, 0.38275146484375, 0.46923828125, 0.55572509765625, 0.6422119140625, 0.72869873046875, 0.815185546875, 0.90167236328125, 0.9881591796875, 1.07464599609375, 1.1611328125, 1.24761962890625, 1.3341064453125, 1.42059326171875, 1.507080078125, 1.59356689453125, 1.6800537109375, 1.76654052734375, 1.85302734375, 1.93951416015625, 2.0260009765625, 2.11248779296875, 2.198974609375, 2.28546142578125, 2.3719482421875, 2.45843505859375, 2.544921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 10.0, 7.0, 9.0, 18.0, 25.0, 20.0, 25.0, 27.0, 32.0, 25.0, 53.0, 39.0, 42.0, 36.0, 52.0, 52.0, 54.0, 48.0, 37.0, 45.0, 32.0, 35.0, 38.0, 36.0, 30.0, 37.0, 25.0, 19.0, 20.0, 10.0, 11.0, 16.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.8515625, -1.8030242919921875, -1.754486083984375, -1.7059478759765625, -1.65740966796875, -1.6088714599609375, -1.560333251953125, -1.5117950439453125, -1.4632568359375, -1.4147186279296875, -1.366180419921875, -1.3176422119140625, -1.26910400390625, -1.2205657958984375, -1.172027587890625, -1.1234893798828125, -1.074951171875, -1.0264129638671875, -0.977874755859375, -0.9293365478515625, -0.88079833984375, -0.8322601318359375, -0.783721923828125, -0.7351837158203125, -0.6866455078125, -0.6381072998046875, -0.589569091796875, -0.5410308837890625, -0.49249267578125, -0.4439544677734375, -0.395416259765625, -0.3468780517578125, -0.29833984375, -0.2498016357421875, -0.201263427734375, -0.1527252197265625, -0.10418701171875, -0.0556488037109375, -0.007110595703125, 0.0414276123046875, 0.0899658203125, 0.1385040283203125, 0.187042236328125, 0.2355804443359375, 0.28411865234375, 0.3326568603515625, 0.381195068359375, 0.4297332763671875, 0.478271484375, 0.5268096923828125, 0.575347900390625, 0.6238861083984375, 0.67242431640625, 0.7209625244140625, 0.769500732421875, 0.8180389404296875, 0.8665771484375, 0.9151153564453125, 0.963653564453125, 1.0121917724609375, 1.06072998046875, 1.1092681884765625, 1.157806396484375, 1.2063446044921875, 1.2548828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 12.0, 26.0, 30.0, 45.0, 83.0, 151.0, 248.0, 551.0, 973.0, 2423.0, 7166.0, 25878.0, 128970.0, 1794426.0, 2038948.0, 149610.0, 30764.0, 8512.0, 2908.0, 1212.0, 602.0, 294.0, 175.0, 95.0, 56.0, 31.0, 21.0, 20.0, 13.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.84100341796875, -4.6741943359375, -4.50738525390625, -4.340576171875, -4.17376708984375, -4.0069580078125, -3.84014892578125, -3.67333984375, -3.50653076171875, -3.3397216796875, -3.17291259765625, -3.006103515625, -2.83929443359375, -2.6724853515625, -2.50567626953125, -2.3388671875, -2.17205810546875, -2.0052490234375, -1.83843994140625, -1.671630859375, -1.50482177734375, -1.3380126953125, -1.17120361328125, -1.00439453125, -0.83758544921875, -0.6707763671875, -0.50396728515625, -0.337158203125, -0.17034912109375, -0.0035400390625, 0.16326904296875, 0.330078125, 0.49688720703125, 0.6636962890625, 0.83050537109375, 0.997314453125, 1.16412353515625, 1.3309326171875, 1.49774169921875, 1.66455078125, 1.83135986328125, 1.9981689453125, 2.16497802734375, 2.331787109375, 2.49859619140625, 2.6654052734375, 2.83221435546875, 2.9990234375, 3.16583251953125, 3.3326416015625, 3.49945068359375, 3.666259765625, 3.83306884765625, 3.9998779296875, 4.16668701171875, 4.33349609375, 4.50030517578125, 4.6671142578125, 4.83392333984375, 5.000732421875, 5.16754150390625, 5.3343505859375, 5.50115966796875, 5.66796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 15.0, 11.0, 21.0, 34.0, 42.0, 64.0, 92.0, 123.0, 223.0, 362.0, 677.0, 800.0, 530.0, 331.0, 218.0, 133.0, 101.0, 65.0, 57.0, 41.0, 18.0, 26.0, 13.0, 15.0, 7.0, 8.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.34765625, -6.17340087890625, -5.9991455078125, -5.82489013671875, -5.650634765625, -5.47637939453125, -5.3021240234375, -5.12786865234375, -4.95361328125, -4.77935791015625, -4.6051025390625, -4.43084716796875, -4.256591796875, -4.08233642578125, -3.9080810546875, -3.73382568359375, -3.5595703125, -3.38531494140625, -3.2110595703125, -3.03680419921875, -2.862548828125, -2.68829345703125, -2.5140380859375, -2.33978271484375, -2.16552734375, -1.99127197265625, -1.8170166015625, -1.64276123046875, -1.468505859375, -1.29425048828125, -1.1199951171875, -0.94573974609375, -0.771484375, -0.59722900390625, -0.4229736328125, -0.24871826171875, -0.074462890625, 0.09979248046875, 0.2740478515625, 0.44830322265625, 0.62255859375, 0.79681396484375, 0.9710693359375, 1.14532470703125, 1.319580078125, 1.49383544921875, 1.6680908203125, 1.84234619140625, 2.0166015625, 2.19085693359375, 2.3651123046875, 2.53936767578125, 2.713623046875, 2.88787841796875, 3.0621337890625, 3.23638916015625, 3.41064453125, 3.58489990234375, 3.7591552734375, 3.93341064453125, 4.107666015625, 4.28192138671875, 4.4561767578125, 4.63043212890625, 4.8046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 21.0, 45.0, 68.0, 123.0, 211.0, 190.0, 118.0, 95.0, 39.0, 27.0, 13.0, 5.0, 10.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.571048736572266, -44.5204963684082, -42.469940185546875, -40.41938781738281, -38.36883544921875, -36.31828308105469, -34.267730712890625, -32.2171745300293, -30.166622161865234, -28.116069793701172, -26.065515518188477, -24.01496124267578, -21.96440887451172, -19.913856506347656, -17.86330223083496, -15.812748908996582, -13.762195587158203, -11.711642265319824, -9.661088943481445, -7.610535621643066, -5.5599822998046875, -3.5094289779663086, -1.4588756561279297, 0.5916776657104492, 2.642230987548828, 4.692784309387207, 6.743337631225586, 8.793890953063965, 10.844444274902344, 12.894997596740723, 14.945550918579102, 16.996105194091797, 19.046661376953125, 21.097213745117188, 23.147768020629883, 25.198322296142578, 27.24887466430664, 29.299427032470703, 31.3499813079834, 33.400535583496094, 35.451087951660156, 37.50164031982422, 39.55219268798828, 41.60274887084961, 43.65330123901367, 45.703853607177734, 47.75440979003906, 49.804962158203125, 51.85551452636719, 53.90606689453125, 55.95661926269531, 58.00717544555664, 60.0577278137207, 62.108280181884766, 64.1588363647461, 66.20938873291016, 68.25994110107422, 70.31049346923828, 72.36104583740234, 74.4115982055664, 76.462158203125, 78.51271057128906, 80.56326293945312, 82.61381530761719, 84.66436767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 8.0, 16.0, 17.0, 19.0, 17.0, 21.0, 25.0, 32.0, 33.0, 41.0, 32.0, 43.0, 36.0, 49.0, 49.0, 53.0, 43.0, 40.0, 43.0, 45.0, 44.0, 45.0, 29.0, 26.0, 31.0, 27.0, 19.0, 18.0, 16.0, 7.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.193378448486328, -29.28727149963379, -28.381162643432617, -27.475055694580078, -26.568946838378906, -25.662839889526367, -24.756732940673828, -23.850624084472656, -22.944517135620117, -22.038410186767578, -21.132301330566406, -20.226194381713867, -19.320087432861328, -18.413978576660156, -17.507871627807617, -16.601764678955078, -15.695655822753906, -14.78954792022705, -13.883440017700195, -12.977333068847656, -12.0712251663208, -11.165117263793945, -10.259010314941406, -9.35290241241455, -8.446794509887695, -7.54068660736084, -6.634579181671143, -5.728471755981445, -4.82236385345459, -3.9162559509277344, -3.010148525238037, -2.10404109954834, -1.1979351043701172, -0.2918274402618408, 0.6142802238464355, 1.520387887954712, 2.4264955520629883, 3.3326034545898438, 4.238710880279541, 5.144818305969238, 6.050926208496094, 6.957034111022949, 7.8631415367126465, 8.769248962402344, 9.6753568649292, 10.581464767456055, 11.487571716308594, 12.39367961883545, 13.299787521362305, 14.20589542388916, 15.112003326416016, 16.018110275268555, 16.924217224121094, 17.830326080322266, 18.736433029174805, 19.642539978027344, 20.548648834228516, 21.454755783081055, 22.360864639282227, 23.266971588134766, 24.173080444335938, 25.079187393188477, 25.985294342041016, 26.891403198242188, 27.797510147094727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 14.0, 19.0, 36.0, 46.0, 113.0, 191.0, 495.0, 1221.0, 2994.0, 9012.0, 31260.0, 130595.0, 602408.0, 206221.0, 44887.0, 12426.0, 4033.0, 1409.0, 599.0, 275.0, 131.0, 76.0, 32.0, 20.0, 19.0, 9.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.9344482421875, -6.728271484375, -6.5220947265625, -6.31591796875, -6.1097412109375, -5.903564453125, -5.6973876953125, -5.4912109375, -5.2850341796875, -5.078857421875, -4.8726806640625, -4.66650390625, -4.4603271484375, -4.254150390625, -4.0479736328125, -3.841796875, -3.6356201171875, -3.429443359375, -3.2232666015625, -3.01708984375, -2.8109130859375, -2.604736328125, -2.3985595703125, -2.1923828125, -1.9862060546875, -1.780029296875, -1.5738525390625, -1.36767578125, -1.1614990234375, -0.955322265625, -0.7491455078125, -0.54296875, -0.3367919921875, -0.130615234375, 0.0755615234375, 0.28173828125, 0.4879150390625, 0.694091796875, 0.9002685546875, 1.1064453125, 1.3126220703125, 1.518798828125, 1.7249755859375, 1.93115234375, 2.1373291015625, 2.343505859375, 2.5496826171875, 2.755859375, 2.9620361328125, 3.168212890625, 3.3743896484375, 3.58056640625, 3.7867431640625, 3.992919921875, 4.1990966796875, 4.4052734375, 4.6114501953125, 4.817626953125, 5.0238037109375, 5.22998046875, 5.4361572265625, 5.642333984375, 5.8485107421875, 6.0546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 11.0, 19.0, 28.0, 19.0, 35.0, 39.0, 42.0, 35.0, 45.0, 46.0, 61.0, 64.0, 64.0, 67.0, 57.0, 53.0, 48.0, 41.0, 39.0, 37.0, 29.0, 28.0, 24.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 0.0, 1.0, 3.0], "bins": [-2.98828125, -2.9210205078125, -2.853759765625, -2.7864990234375, -2.71923828125, -2.6519775390625, -2.584716796875, -2.5174560546875, -2.4501953125, -2.3829345703125, -2.315673828125, -2.2484130859375, -2.18115234375, -2.1138916015625, -2.046630859375, -1.9793701171875, -1.912109375, -1.8448486328125, -1.777587890625, -1.7103271484375, -1.64306640625, -1.5758056640625, -1.508544921875, -1.4412841796875, -1.3740234375, -1.3067626953125, -1.239501953125, -1.1722412109375, -1.10498046875, -1.0377197265625, -0.970458984375, -0.9031982421875, -0.8359375, -0.7686767578125, -0.701416015625, -0.6341552734375, -0.56689453125, -0.4996337890625, -0.432373046875, -0.3651123046875, -0.2978515625, -0.2305908203125, -0.163330078125, -0.0960693359375, -0.02880859375, 0.0384521484375, 0.105712890625, 0.1729736328125, 0.240234375, 0.3074951171875, 0.374755859375, 0.4420166015625, 0.50927734375, 0.5765380859375, 0.643798828125, 0.7110595703125, 0.7783203125, 0.8455810546875, 0.912841796875, 0.9801025390625, 1.04736328125, 1.1146240234375, 1.181884765625, 1.2491455078125, 1.31640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 20.0, 20.0, 33.0, 61.0, 80.0, 136.0, 229.0, 348.0, 599.0, 1126.0, 2498.0, 6922.0, 33266.0, 647087.0, 319965.0, 25523.0, 5806.0, 2264.0, 1029.0, 576.0, 326.0, 224.0, 123.0, 70.0, 65.0, 37.0, 24.0, 10.0, 12.0, 9.0, 4.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0546875, -10.718994140625, -10.38330078125, -10.047607421875, -9.7119140625, -9.376220703125, -9.04052734375, -8.704833984375, -8.369140625, -8.033447265625, -7.69775390625, -7.362060546875, -7.0263671875, -6.690673828125, -6.35498046875, -6.019287109375, -5.68359375, -5.347900390625, -5.01220703125, -4.676513671875, -4.3408203125, -4.005126953125, -3.66943359375, -3.333740234375, -2.998046875, -2.662353515625, -2.32666015625, -1.990966796875, -1.6552734375, -1.319580078125, -0.98388671875, -0.648193359375, -0.3125, 0.023193359375, 0.35888671875, 0.694580078125, 1.0302734375, 1.365966796875, 1.70166015625, 2.037353515625, 2.373046875, 2.708740234375, 3.04443359375, 3.380126953125, 3.7158203125, 4.051513671875, 4.38720703125, 4.722900390625, 5.05859375, 5.394287109375, 5.72998046875, 6.065673828125, 6.4013671875, 6.737060546875, 7.07275390625, 7.408447265625, 7.744140625, 8.079833984375, 8.41552734375, 8.751220703125, 9.0869140625, 9.422607421875, 9.75830078125, 10.093994140625, 10.4296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 15.0, 24.0, 21.0, 21.0, 26.0, 30.0, 38.0, 40.0, 30.0, 35.0, 62.0, 42.0, 51.0, 51.0, 48.0, 57.0, 36.0, 36.0, 36.0, 38.0, 38.0, 41.0, 27.0, 15.0, 20.0, 12.0, 16.0, 8.0, 11.0, 6.0, 6.0, 8.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.078125, -7.8057861328125, -7.533447265625, -7.2611083984375, -6.98876953125, -6.7164306640625, -6.444091796875, -6.1717529296875, -5.8994140625, -5.6270751953125, -5.354736328125, -5.0823974609375, -4.81005859375, -4.5377197265625, -4.265380859375, -3.9930419921875, -3.720703125, -3.4483642578125, -3.176025390625, -2.9036865234375, -2.63134765625, -2.3590087890625, -2.086669921875, -1.8143310546875, -1.5419921875, -1.2696533203125, -0.997314453125, -0.7249755859375, -0.45263671875, -0.1802978515625, 0.092041015625, 0.3643798828125, 0.63671875, 0.9090576171875, 1.181396484375, 1.4537353515625, 1.72607421875, 1.9984130859375, 2.270751953125, 2.5430908203125, 2.8154296875, 3.0877685546875, 3.360107421875, 3.6324462890625, 3.90478515625, 4.1771240234375, 4.449462890625, 4.7218017578125, 4.994140625, 5.2664794921875, 5.538818359375, 5.8111572265625, 6.08349609375, 6.3558349609375, 6.628173828125, 6.9005126953125, 7.1728515625, 7.4451904296875, 7.717529296875, 7.9898681640625, 8.26220703125, 8.5345458984375, 8.806884765625, 9.0792236328125, 9.3515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 12.0, 14.0, 11.0, 25.0, 40.0, 51.0, 81.0, 112.0, 176.0, 293.0, 472.0, 808.0, 1557.0, 2923.0, 6744.0, 17495.0, 53191.0, 243205.0, 599157.0, 80909.0, 24213.0, 8792.0, 3836.0, 1877.0, 989.0, 567.0, 324.0, 220.0, 136.0, 95.0, 69.0, 40.0, 26.0, 22.0, 14.0, 5.0, 6.0, 10.0, 9.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.693878173828125, -2.60455322265625, -2.515228271484375, -2.4259033203125, -2.336578369140625, -2.24725341796875, -2.157928466796875, -2.068603515625, -1.979278564453125, -1.88995361328125, -1.800628662109375, -1.7113037109375, -1.621978759765625, -1.53265380859375, -1.443328857421875, -1.35400390625, -1.264678955078125, -1.17535400390625, -1.086029052734375, -0.9967041015625, -0.907379150390625, -0.81805419921875, -0.728729248046875, -0.639404296875, -0.550079345703125, -0.46075439453125, -0.371429443359375, -0.2821044921875, -0.192779541015625, -0.10345458984375, -0.014129638671875, 0.0751953125, 0.164520263671875, 0.25384521484375, 0.343170166015625, 0.4324951171875, 0.521820068359375, 0.61114501953125, 0.700469970703125, 0.789794921875, 0.879119873046875, 0.96844482421875, 1.057769775390625, 1.1470947265625, 1.236419677734375, 1.32574462890625, 1.415069580078125, 1.50439453125, 1.593719482421875, 1.68304443359375, 1.772369384765625, 1.8616943359375, 1.951019287109375, 2.04034423828125, 2.129669189453125, 2.218994140625, 2.308319091796875, 2.39764404296875, 2.486968994140625, 2.5762939453125, 2.665618896484375, 2.75494384765625, 2.844268798828125, 2.93359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 9.0, 7.0, 16.0, 17.0, 15.0, 26.0, 29.0, 44.0, 58.0, 84.0, 212.0, 145.0, 80.0, 57.0, 35.0, 33.0, 27.0, 19.0, 16.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00118255615234375, -0.001147627830505371, -0.0011126995086669922, -0.0010777711868286133, -0.0010428428649902344, -0.0010079145431518555, -0.0009729862213134766, -0.0009380578994750977, -0.0009031295776367188, -0.0008682012557983398, -0.0008332729339599609, -0.000798344612121582, -0.0007634162902832031, -0.0007284879684448242, -0.0006935596466064453, -0.0006586313247680664, -0.0006237030029296875, -0.0005887746810913086, -0.0005538463592529297, -0.0005189180374145508, -0.0004839897155761719, -0.00044906139373779297, -0.00041413307189941406, -0.00037920475006103516, -0.00034427642822265625, -0.00030934810638427734, -0.00027441978454589844, -0.00023949146270751953, -0.00020456314086914062, -0.00016963481903076172, -0.0001347064971923828, -9.97781753540039e-05, -6.4849853515625e-05, -2.9921531677246094e-05, 5.0067901611328125e-06, 3.993511199951172e-05, 7.486343383789062e-05, 0.00010979175567626953, 0.00014472007751464844, 0.00017964839935302734, 0.00021457672119140625, 0.00024950504302978516, 0.00028443336486816406, 0.00031936168670654297, 0.0003542900085449219, 0.0003892183303833008, 0.0004241466522216797, 0.0004590749740600586, 0.0004940032958984375, 0.0005289316177368164, 0.0005638599395751953, 0.0005987882614135742, 0.0006337165832519531, 0.000668644905090332, 0.0007035732269287109, 0.0007385015487670898, 0.0007734298706054688, 0.0008083581924438477, 0.0008432865142822266, 0.0008782148361206055, 0.0009131431579589844, 0.0009480714797973633, 0.0009829998016357422, 0.001017928123474121, 0.0010528564453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 17.0, 23.0, 39.0, 47.0, 63.0, 125.0, 178.0, 321.0, 570.0, 1039.0, 2117.0, 5057.0, 15002.0, 62453.0, 599093.0, 297054.0, 45394.0, 11795.0, 4085.0, 1864.0, 931.0, 488.0, 279.0, 156.0, 113.0, 78.0, 43.0, 29.0, 17.0, 9.0, 17.0, 12.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.928253173828125, -2.82330322265625, -2.718353271484375, -2.6134033203125, -2.508453369140625, -2.40350341796875, -2.298553466796875, -2.193603515625, -2.088653564453125, -1.98370361328125, -1.878753662109375, -1.7738037109375, -1.668853759765625, -1.56390380859375, -1.458953857421875, -1.35400390625, -1.249053955078125, -1.14410400390625, -1.039154052734375, -0.9342041015625, -0.829254150390625, -0.72430419921875, -0.619354248046875, -0.514404296875, -0.409454345703125, -0.30450439453125, -0.199554443359375, -0.0946044921875, 0.010345458984375, 0.11529541015625, 0.220245361328125, 0.3251953125, 0.430145263671875, 0.53509521484375, 0.640045166015625, 0.7449951171875, 0.849945068359375, 0.95489501953125, 1.059844970703125, 1.164794921875, 1.269744873046875, 1.37469482421875, 1.479644775390625, 1.5845947265625, 1.689544677734375, 1.79449462890625, 1.899444580078125, 2.00439453125, 2.109344482421875, 2.21429443359375, 2.319244384765625, 2.4241943359375, 2.529144287109375, 2.63409423828125, 2.739044189453125, 2.843994140625, 2.948944091796875, 3.05389404296875, 3.158843994140625, 3.2637939453125, 3.368743896484375, 3.47369384765625, 3.578643798828125, 3.68359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 4.0, 4.0, 14.0, 8.0, 12.0, 18.0, 16.0, 18.0, 36.0, 28.0, 20.0, 38.0, 34.0, 58.0, 53.0, 75.0, 68.0, 79.0, 62.0, 50.0, 40.0, 29.0, 24.0, 26.0, 19.0, 19.0, 15.0, 12.0, 16.0, 14.0, 13.0, 11.0, 3.0, 7.0, 6.0, 5.0, 7.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.248046875, -2.178863525390625, -2.10968017578125, -2.040496826171875, -1.9713134765625, -1.902130126953125, -1.83294677734375, -1.763763427734375, -1.694580078125, -1.625396728515625, -1.55621337890625, -1.487030029296875, -1.4178466796875, -1.348663330078125, -1.27947998046875, -1.210296630859375, -1.14111328125, -1.071929931640625, -1.00274658203125, -0.933563232421875, -0.8643798828125, -0.795196533203125, -0.72601318359375, -0.656829833984375, -0.587646484375, -0.518463134765625, -0.44927978515625, -0.380096435546875, -0.3109130859375, -0.241729736328125, -0.17254638671875, -0.103363037109375, -0.0341796875, 0.035003662109375, 0.10418701171875, 0.173370361328125, 0.2425537109375, 0.311737060546875, 0.38092041015625, 0.450103759765625, 0.519287109375, 0.588470458984375, 0.65765380859375, 0.726837158203125, 0.7960205078125, 0.865203857421875, 0.93438720703125, 1.003570556640625, 1.07275390625, 1.141937255859375, 1.21112060546875, 1.280303955078125, 1.3494873046875, 1.418670654296875, 1.48785400390625, 1.557037353515625, 1.626220703125, 1.695404052734375, 1.76458740234375, 1.833770751953125, 1.9029541015625, 1.972137451171875, 2.04132080078125, 2.110504150390625, 2.1796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 9.0, 15.0, 49.0, 114.0, 217.0, 304.0, 157.0, 75.0, 17.0, 15.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-75.54513549804688, -72.65704345703125, -69.7689437866211, -66.88085174560547, -63.99275207519531, -61.10465621948242, -58.21656036376953, -55.328468322753906, -52.44036865234375, -49.55227279663086, -46.66417694091797, -43.77608108520508, -40.88798522949219, -37.9998893737793, -35.111793518066406, -32.22370147705078, -29.33560562133789, -26.447509765625, -23.55941390991211, -20.67131805419922, -17.783222198486328, -14.895127296447754, -12.00703239440918, -9.118936538696289, -6.230840682983398, -3.342745065689087, -0.4546494483947754, 2.433445930480957, 5.321541786193848, 8.209637641906738, 11.097732543945312, 13.985828399658203, 16.873924255371094, 19.762020111083984, 22.650115966796875, 25.538211822509766, 28.426307678222656, 31.314403533935547, 34.20249938964844, 37.09059143066406, 39.97869110107422, 42.86678695678711, 45.7548828125, 48.64297866821289, 51.53107452392578, 54.41917037963867, 57.30726623535156, 60.19535827636719, 63.08345413208008, 65.97154998779297, 68.8596420288086, 71.74774169921875, 74.63583374023438, 77.52393341064453, 80.41202545166016, 83.30012512207031, 86.18821716308594, 89.07630920410156, 91.96440887451172, 94.85250091552734, 97.7406005859375, 100.62869262695312, 103.51679229736328, 106.4048843383789, 109.29298400878906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 8.0, 9.0, 9.0, 11.0, 6.0, 15.0, 17.0, 18.0, 27.0, 29.0, 27.0, 34.0, 24.0, 29.0, 33.0, 48.0, 46.0, 48.0, 65.0, 42.0, 46.0, 38.0, 36.0, 45.0, 12.0, 29.0, 23.0, 32.0, 17.0, 22.0, 15.0, 15.0, 16.0, 21.0, 8.0, 9.0, 12.0, 5.0, 6.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.49323081970215, -22.629426956176758, -21.765621185302734, -20.901817321777344, -20.038013458251953, -19.17420768737793, -18.31040382385254, -17.446598052978516, -16.582794189453125, -15.718989372253418, -14.855184555053711, -13.99138069152832, -13.127575874328613, -12.263771057128906, -11.399967193603516, -10.536162376403809, -9.672357559204102, -8.808552742004395, -7.944748401641846, -7.080944061279297, -6.21713924407959, -5.353334426879883, -4.489530086517334, -3.625725746154785, -2.761920928955078, -1.8981163501739502, -1.0343117713928223, -0.17050719261169434, 0.6932973861694336, 1.5571022033691406, 2.4209065437316895, 3.2847108840942383, 4.148517608642578, 5.012322425842285, 5.876126766204834, 6.739931106567383, 7.60373592376709, 8.467540740966797, 9.331344604492188, 10.195149421691895, 11.058954238891602, 11.922759056091309, 12.786563873291016, 13.650367736816406, 14.514172554016113, 15.37797737121582, 16.24178123474121, 17.105587005615234, 17.969390869140625, 18.833194732666016, 19.69700050354004, 20.56080436706543, 21.424610137939453, 22.288414001464844, 23.152217864990234, 24.016021728515625, 24.87982749938965, 25.74363136291504, 26.607437133789062, 27.471240997314453, 28.335044860839844, 29.198850631713867, 30.062654495239258, 30.92646026611328, 31.790264129638672]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 9.0, 19.0, 25.0, 33.0, 40.0, 55.0, 78.0, 105.0, 184.0, 301.0, 450.0, 740.0, 1422.0, 2520.0, 5222.0, 11600.0, 29860.0, 99581.0, 577906.0, 2602619.0, 688151.0, 115385.0, 33306.0, 12867.0, 5518.0, 2714.0, 1467.0, 764.0, 447.0, 271.0, 200.0, 127.0, 81.0, 52.0, 36.0, 23.0, 20.0, 14.0, 13.0, 10.0, 1.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.86328125, -2.76953125, -2.67578125, -2.58203125, -2.48828125, -2.39453125, -2.30078125, -2.20703125, -2.11328125, -2.01953125, -1.92578125, -1.83203125, -1.73828125, -1.64453125, -1.55078125, -1.45703125, -1.36328125, -1.26953125, -1.17578125, -1.08203125, -0.98828125, -0.89453125, -0.80078125, -0.70703125, -0.61328125, -0.51953125, -0.42578125, -0.33203125, -0.23828125, -0.14453125, -0.05078125, 0.04296875, 0.13671875, 0.23046875, 0.32421875, 0.41796875, 0.51171875, 0.60546875, 0.69921875, 0.79296875, 0.88671875, 0.98046875, 1.07421875, 1.16796875, 1.26171875, 1.35546875, 1.44921875, 1.54296875, 1.63671875, 1.73046875, 1.82421875, 1.91796875, 2.01171875, 2.10546875, 2.19921875, 2.29296875, 2.38671875, 2.48046875, 2.57421875, 2.66796875, 2.76171875, 2.85546875, 2.94921875, 3.04296875, 3.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 2.0, 7.0, 10.0, 9.0, 8.0, 15.0, 17.0, 17.0, 32.0, 34.0, 35.0, 36.0, 41.0, 55.0, 50.0, 65.0, 59.0, 59.0, 71.0, 46.0, 41.0, 53.0, 38.0, 46.0, 33.0, 28.0, 28.0, 18.0, 18.0, 12.0, 7.0, 8.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.865234375, -2.7971343994140625, -2.729034423828125, -2.6609344482421875, -2.59283447265625, -2.5247344970703125, -2.456634521484375, -2.3885345458984375, -2.3204345703125, -2.2523345947265625, -2.184234619140625, -2.1161346435546875, -2.04803466796875, -1.9799346923828125, -1.911834716796875, -1.8437347412109375, -1.775634765625, -1.7075347900390625, -1.639434814453125, -1.5713348388671875, -1.50323486328125, -1.4351348876953125, -1.367034912109375, -1.2989349365234375, -1.2308349609375, -1.1627349853515625, -1.094635009765625, -1.0265350341796875, -0.95843505859375, -0.8903350830078125, -0.822235107421875, -0.7541351318359375, -0.68603515625, -0.6179351806640625, -0.549835205078125, -0.4817352294921875, -0.41363525390625, -0.3455352783203125, -0.277435302734375, -0.2093353271484375, -0.1412353515625, -0.0731353759765625, -0.005035400390625, 0.0630645751953125, 0.13116455078125, 0.1992645263671875, 0.267364501953125, 0.3354644775390625, 0.403564453125, 0.4716644287109375, 0.539764404296875, 0.6078643798828125, 0.67596435546875, 0.7440643310546875, 0.812164306640625, 0.8802642822265625, 0.9483642578125, 1.0164642333984375, 1.084564208984375, 1.1526641845703125, 1.22076416015625, 1.2888641357421875, 1.356964111328125, 1.4250640869140625, 1.4931640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 11.0, 9.0, 27.0, 45.0, 65.0, 137.0, 330.0, 825.0, 2479.0, 9527.0, 55307.0, 773655.0, 3185266.0, 140944.0, 18764.0, 4325.0, 1382.0, 591.0, 258.0, 145.0, 72.0, 40.0, 28.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.72650146484375, -4.5037841796875, -4.28106689453125, -4.058349609375, -3.83563232421875, -3.6129150390625, -3.39019775390625, -3.16748046875, -2.94476318359375, -2.7220458984375, -2.49932861328125, -2.276611328125, -2.05389404296875, -1.8311767578125, -1.60845947265625, -1.3857421875, -1.16302490234375, -0.9403076171875, -0.71759033203125, -0.494873046875, -0.27215576171875, -0.0494384765625, 0.17327880859375, 0.39599609375, 0.61871337890625, 0.8414306640625, 1.06414794921875, 1.286865234375, 1.50958251953125, 1.7322998046875, 1.95501708984375, 2.177734375, 2.40045166015625, 2.6231689453125, 2.84588623046875, 3.068603515625, 3.29132080078125, 3.5140380859375, 3.73675537109375, 3.95947265625, 4.18218994140625, 4.4049072265625, 4.62762451171875, 4.850341796875, 5.07305908203125, 5.2957763671875, 5.51849365234375, 5.7412109375, 5.96392822265625, 6.1866455078125, 6.40936279296875, 6.632080078125, 6.85479736328125, 7.0775146484375, 7.30023193359375, 7.52294921875, 7.74566650390625, 7.9683837890625, 8.19110107421875, 8.413818359375, 8.63653564453125, 8.8592529296875, 9.08197021484375, 9.3046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 7.0, 4.0, 15.0, 8.0, 36.0, 41.0, 57.0, 84.0, 115.0, 201.0, 368.0, 667.0, 948.0, 652.0, 316.0, 203.0, 107.0, 73.0, 54.0, 24.0, 30.0, 19.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.2088623046875, -4.995849609375, -4.7828369140625, -4.56982421875, -4.3568115234375, -4.143798828125, -3.9307861328125, -3.7177734375, -3.5047607421875, -3.291748046875, -3.0787353515625, -2.86572265625, -2.6527099609375, -2.439697265625, -2.2266845703125, -2.013671875, -1.8006591796875, -1.587646484375, -1.3746337890625, -1.16162109375, -0.9486083984375, -0.735595703125, -0.5225830078125, -0.3095703125, -0.0965576171875, 0.116455078125, 0.3294677734375, 0.54248046875, 0.7554931640625, 0.968505859375, 1.1815185546875, 1.39453125, 1.6075439453125, 1.820556640625, 2.0335693359375, 2.24658203125, 2.4595947265625, 2.672607421875, 2.8856201171875, 3.0986328125, 3.3116455078125, 3.524658203125, 3.7376708984375, 3.95068359375, 4.1636962890625, 4.376708984375, 4.5897216796875, 4.802734375, 5.0157470703125, 5.228759765625, 5.4417724609375, 5.65478515625, 5.8677978515625, 6.080810546875, 6.2938232421875, 6.5068359375, 6.7198486328125, 6.932861328125, 7.1458740234375, 7.35888671875, 7.5718994140625, 7.784912109375, 7.9979248046875, 8.2109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 9.0, 15.0, 100.0, 282.0, 404.0, 138.0, 35.0, 13.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.06217956542969, -76.85025024414062, -72.6383285522461, -68.42640686035156, -64.2144775390625, -60.0025520324707, -55.790626525878906, -51.57870101928711, -47.36677551269531, -43.154850006103516, -38.94292449951172, -34.73099899291992, -30.519073486328125, -26.307147979736328, -22.09522247314453, -17.883296966552734, -13.671371459960938, -9.45944595336914, -5.247520446777344, -1.0355949401855469, 3.17633056640625, 7.388256072998047, 11.600181579589844, 15.81210708618164, 20.024032592773438, 24.235958099365234, 28.44788360595703, 32.65980911254883, 36.871734619140625, 41.08366012573242, 45.29558563232422, 49.507511138916016, 53.719451904296875, 57.93137741088867, 62.14330291748047, 66.355224609375, 70.56715393066406, 74.77908325195312, 78.99100494384766, 83.20292663574219, 87.41485595703125, 91.62678527832031, 95.83870697021484, 100.05062866210938, 104.26255798339844, 108.4744873046875, 112.68640899658203, 116.89833068847656, 121.11026000976562, 125.32218933105469, 129.53411865234375, 133.74603271484375, 137.9579620361328, 142.16989135742188, 146.38180541992188, 150.59373474121094, 154.8056640625, 159.01759338378906, 163.22952270507812, 167.44143676757812, 171.6533660888672, 175.86529541015625, 180.07720947265625, 184.2891387939453, 188.50106811523438]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 16.0, 12.0, 29.0, 37.0, 52.0, 37.0, 50.0, 54.0, 77.0, 92.0, 68.0, 95.0, 65.0, 69.0, 59.0, 44.0, 38.0, 23.0, 21.0, 15.0, 8.0, 4.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.531421661376953, -20.19291114807129, -18.854402542114258, -17.515892028808594, -16.177383422851562, -14.838872909545898, -13.500362396240234, -12.161852836608887, -10.823343276977539, -9.484833717346191, -8.146324157714844, -6.80781364440918, -5.469304084777832, -4.130794525146484, -2.7922840118408203, -1.4537744522094727, -0.115264892578125, 1.2232449054718018, 2.5617547035217285, 3.9002647399902344, 5.238774299621582, 6.57728385925293, 7.915794372558594, 9.254303932189941, 10.592813491821289, 11.931323051452637, 13.269832611083984, 14.608343124389648, 15.946852684020996, 17.285362243652344, 18.623872756958008, 19.962383270263672, 21.30089569091797, 22.639406204223633, 23.977914810180664, 25.316425323486328, 26.65493392944336, 27.993444442749023, 29.331954956054688, 30.67046356201172, 32.00897216796875, 33.34748077392578, 34.68599319458008, 36.02450180053711, 37.36301040649414, 38.70152282714844, 40.04003143310547, 41.3785400390625, 42.7170524597168, 44.05556106567383, 45.394073486328125, 46.732582092285156, 48.07109069824219, 49.40959930419922, 50.748111724853516, 52.08662033081055, 53.425132751464844, 54.763641357421875, 56.10215377807617, 57.4406623840332, 58.779170989990234, 60.11768341064453, 61.45619201660156, 62.794700622558594, 64.13320922851562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 30.0, 49.0, 65.0, 111.0, 211.0, 308.0, 608.0, 1142.0, 2452.0, 5553.0, 14072.0, 43485.0, 221011.0, 594097.0, 117993.0, 29059.0, 10087.0, 4151.0, 1955.0, 906.0, 462.0, 274.0, 175.0, 93.0, 54.0, 37.0, 26.0, 18.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.53955078125, -4.3603515625, -4.18115234375, -4.001953125, -3.82275390625, -3.6435546875, -3.46435546875, -3.28515625, -3.10595703125, -2.9267578125, -2.74755859375, -2.568359375, -2.38916015625, -2.2099609375, -2.03076171875, -1.8515625, -1.67236328125, -1.4931640625, -1.31396484375, -1.134765625, -0.95556640625, -0.7763671875, -0.59716796875, -0.41796875, -0.23876953125, -0.0595703125, 0.11962890625, 0.298828125, 0.47802734375, 0.6572265625, 0.83642578125, 1.015625, 1.19482421875, 1.3740234375, 1.55322265625, 1.732421875, 1.91162109375, 2.0908203125, 2.27001953125, 2.44921875, 2.62841796875, 2.8076171875, 2.98681640625, 3.166015625, 3.34521484375, 3.5244140625, 3.70361328125, 3.8828125, 4.06201171875, 4.2412109375, 4.42041015625, 4.599609375, 4.77880859375, 4.9580078125, 5.13720703125, 5.31640625, 5.49560546875, 5.6748046875, 5.85400390625, 6.033203125, 6.21240234375, 6.3916015625, 6.57080078125, 6.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 17.0, 12.0, 15.0, 18.0, 27.0, 32.0, 27.0, 36.0, 34.0, 48.0, 38.0, 59.0, 62.0, 49.0, 54.0, 64.0, 52.0, 56.0, 53.0, 38.0, 39.0, 37.0, 21.0, 18.0, 22.0, 12.0, 13.0, 8.0, 5.0, 10.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.498046875, -2.4297943115234375, -2.361541748046875, -2.2932891845703125, -2.22503662109375, -2.1567840576171875, -2.088531494140625, -2.0202789306640625, -1.9520263671875, -1.8837738037109375, -1.815521240234375, -1.7472686767578125, -1.67901611328125, -1.6107635498046875, -1.542510986328125, -1.4742584228515625, -1.406005859375, -1.3377532958984375, -1.269500732421875, -1.2012481689453125, -1.13299560546875, -1.0647430419921875, -0.996490478515625, -0.9282379150390625, -0.8599853515625, -0.7917327880859375, -0.723480224609375, -0.6552276611328125, -0.58697509765625, -0.5187225341796875, -0.450469970703125, -0.3822174072265625, -0.31396484375, -0.2457122802734375, -0.177459716796875, -0.1092071533203125, -0.04095458984375, 0.0272979736328125, 0.095550537109375, 0.1638031005859375, 0.2320556640625, 0.3003082275390625, 0.368560791015625, 0.4368133544921875, 0.50506591796875, 0.5733184814453125, 0.641571044921875, 0.7098236083984375, 0.778076171875, 0.8463287353515625, 0.914581298828125, 0.9828338623046875, 1.05108642578125, 1.1193389892578125, 1.187591552734375, 1.2558441162109375, 1.3240966796875, 1.3923492431640625, 1.460601806640625, 1.5288543701171875, 1.59710693359375, 1.6653594970703125, 1.733612060546875, 1.8018646240234375, 1.8701171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 21.0, 20.0, 28.0, 40.0, 45.0, 68.0, 120.0, 168.0, 286.0, 490.0, 892.0, 1770.0, 4364.0, 14404.0, 79786.0, 809453.0, 109615.0, 17626.0, 5092.0, 1950.0, 926.0, 477.0, 313.0, 182.0, 119.0, 69.0, 63.0, 37.0, 28.0, 18.0, 14.0, 7.0, 9.0, 7.0, 5.0, 6.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7421875, -9.47576904296875, -9.2093505859375, -8.94293212890625, -8.676513671875, -8.41009521484375, -8.1436767578125, -7.87725830078125, -7.61083984375, -7.34442138671875, -7.0780029296875, -6.81158447265625, -6.545166015625, -6.27874755859375, -6.0123291015625, -5.74591064453125, -5.4794921875, -5.21307373046875, -4.9466552734375, -4.68023681640625, -4.413818359375, -4.14739990234375, -3.8809814453125, -3.61456298828125, -3.34814453125, -3.08172607421875, -2.8153076171875, -2.54888916015625, -2.282470703125, -2.01605224609375, -1.7496337890625, -1.48321533203125, -1.216796875, -0.95037841796875, -0.6839599609375, -0.41754150390625, -0.151123046875, 0.11529541015625, 0.3817138671875, 0.64813232421875, 0.91455078125, 1.18096923828125, 1.4473876953125, 1.71380615234375, 1.980224609375, 2.24664306640625, 2.5130615234375, 2.77947998046875, 3.0458984375, 3.31231689453125, 3.5787353515625, 3.84515380859375, 4.111572265625, 4.37799072265625, 4.6444091796875, 4.91082763671875, 5.17724609375, 5.44366455078125, 5.7100830078125, 5.97650146484375, 6.242919921875, 6.50933837890625, 6.7757568359375, 7.04217529296875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 18.0, 11.0, 12.0, 16.0, 23.0, 32.0, 40.0, 44.0, 51.0, 51.0, 53.0, 56.0, 62.0, 74.0, 59.0, 58.0, 50.0, 38.0, 28.0, 39.0, 27.0, 21.0, 17.0, 13.0, 14.0, 15.0, 14.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.8934326171875, -7.607177734375, -7.3209228515625, -7.03466796875, -6.7484130859375, -6.462158203125, -6.1759033203125, -5.8896484375, -5.6033935546875, -5.317138671875, -5.0308837890625, -4.74462890625, -4.4583740234375, -4.172119140625, -3.8858642578125, -3.599609375, -3.3133544921875, -3.027099609375, -2.7408447265625, -2.45458984375, -2.1683349609375, -1.882080078125, -1.5958251953125, -1.3095703125, -1.0233154296875, -0.737060546875, -0.4508056640625, -0.16455078125, 0.1217041015625, 0.407958984375, 0.6942138671875, 0.98046875, 1.2667236328125, 1.552978515625, 1.8392333984375, 2.12548828125, 2.4117431640625, 2.697998046875, 2.9842529296875, 3.2705078125, 3.5567626953125, 3.843017578125, 4.1292724609375, 4.41552734375, 4.7017822265625, 4.988037109375, 5.2742919921875, 5.560546875, 5.8468017578125, 6.133056640625, 6.4193115234375, 6.70556640625, 6.9918212890625, 7.278076171875, 7.5643310546875, 7.8505859375, 8.1368408203125, 8.423095703125, 8.7093505859375, 8.99560546875, 9.2818603515625, 9.568115234375, 9.8543701171875, 10.140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 18.0, 28.0, 35.0, 69.0, 79.0, 161.0, 311.0, 546.0, 1159.0, 2636.0, 6806.0, 20439.0, 80486.0, 645501.0, 228415.0, 41815.0, 12162.0, 4241.0, 1797.0, 767.0, 379.0, 222.0, 148.0, 87.0, 54.0, 38.0, 27.0, 18.0, 15.0, 13.0, 13.0, 2.0, 2.0, 10.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.31451416015625, -2.2247314453125, -2.13494873046875, -2.045166015625, -1.95538330078125, -1.8656005859375, -1.77581787109375, -1.68603515625, -1.59625244140625, -1.5064697265625, -1.41668701171875, -1.326904296875, -1.23712158203125, -1.1473388671875, -1.05755615234375, -0.9677734375, -0.87799072265625, -0.7882080078125, -0.69842529296875, -0.608642578125, -0.51885986328125, -0.4290771484375, -0.33929443359375, -0.24951171875, -0.15972900390625, -0.0699462890625, 0.01983642578125, 0.109619140625, 0.19940185546875, 0.2891845703125, 0.37896728515625, 0.46875, 0.55853271484375, 0.6483154296875, 0.73809814453125, 0.827880859375, 0.91766357421875, 1.0074462890625, 1.09722900390625, 1.18701171875, 1.27679443359375, 1.3665771484375, 1.45635986328125, 1.546142578125, 1.63592529296875, 1.7257080078125, 1.81549072265625, 1.9052734375, 1.99505615234375, 2.0848388671875, 2.17462158203125, 2.264404296875, 2.35418701171875, 2.4439697265625, 2.53375244140625, 2.62353515625, 2.71331787109375, 2.8031005859375, 2.89288330078125, 2.982666015625, 3.07244873046875, 3.1622314453125, 3.25201416015625, 3.341796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 7.0, 19.0, 21.0, 24.0, 43.0, 57.0, 101.0, 134.0, 158.0, 118.0, 67.0, 55.0, 42.0, 28.0, 18.0, 21.0, 18.0, 6.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006933212280273438, -0.0006669163703918457, -0.0006405115127563477, -0.0006141066551208496, -0.0005877017974853516, -0.0005612969398498535, -0.0005348920822143555, -0.0005084872245788574, -0.0004820823669433594, -0.00045567750930786133, -0.0004292726516723633, -0.00040286779403686523, -0.0003764629364013672, -0.00035005807876586914, -0.0003236532211303711, -0.00029724836349487305, -0.000270843505859375, -0.00024443864822387695, -0.0002180337905883789, -0.00019162893295288086, -0.0001652240753173828, -0.00013881921768188477, -0.00011241436004638672, -8.600950241088867e-05, -5.9604644775390625e-05, -3.319978713989258e-05, -6.794929504394531e-06, 1.9609928131103516e-05, 4.601478576660156e-05, 7.241964340209961e-05, 9.882450103759766e-05, 0.0001252293586730957, 0.00015163421630859375, 0.0001780390739440918, 0.00020444393157958984, 0.0002308487892150879, 0.00025725364685058594, 0.000283658504486084, 0.00031006336212158203, 0.0003364682197570801, 0.0003628730773925781, 0.00038927793502807617, 0.0004156827926635742, 0.00044208765029907227, 0.0004684925079345703, 0.0004948973655700684, 0.0005213022232055664, 0.0005477070808410645, 0.0005741119384765625, 0.0006005167961120605, 0.0006269216537475586, 0.0006533265113830566, 0.0006797313690185547, 0.0007061362266540527, 0.0007325410842895508, 0.0007589459419250488, 0.0007853507995605469, 0.0008117556571960449, 0.000838160514831543, 0.000864565372467041, 0.0008909702301025391, 0.0009173750877380371, 0.0009437799453735352, 0.0009701848030090332, 0.0009965896606445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 3.0, 12.0, 14.0, 8.0, 14.0, 17.0, 27.0, 33.0, 62.0, 83.0, 121.0, 160.0, 221.0, 330.0, 567.0, 950.0, 1804.0, 3617.0, 8204.0, 21249.0, 65794.0, 289415.0, 527231.0, 84303.0, 25588.0, 9734.0, 4136.0, 1947.0, 1119.0, 623.0, 377.0, 244.0, 160.0, 95.0, 92.0, 57.0, 27.0, 29.0, 21.0, 20.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.176422119140625, -2.11065673828125, -2.044891357421875, -1.9791259765625, -1.913360595703125, -1.84759521484375, -1.781829833984375, -1.716064453125, -1.650299072265625, -1.58453369140625, -1.518768310546875, -1.4530029296875, -1.387237548828125, -1.32147216796875, -1.255706787109375, -1.18994140625, -1.124176025390625, -1.05841064453125, -0.992645263671875, -0.9268798828125, -0.861114501953125, -0.79534912109375, -0.729583740234375, -0.663818359375, -0.598052978515625, -0.53228759765625, -0.466522216796875, -0.4007568359375, -0.334991455078125, -0.26922607421875, -0.203460693359375, -0.1376953125, -0.071929931640625, -0.00616455078125, 0.059600830078125, 0.1253662109375, 0.191131591796875, 0.25689697265625, 0.322662353515625, 0.388427734375, 0.454193115234375, 0.51995849609375, 0.585723876953125, 0.6514892578125, 0.717254638671875, 0.78302001953125, 0.848785400390625, 0.91455078125, 0.980316162109375, 1.04608154296875, 1.111846923828125, 1.1776123046875, 1.243377685546875, 1.30914306640625, 1.374908447265625, 1.440673828125, 1.506439208984375, 1.57220458984375, 1.637969970703125, 1.7037353515625, 1.769500732421875, 1.83526611328125, 1.901031494140625, 1.966796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 11.0, 6.0, 15.0, 8.0, 12.0, 14.0, 20.0, 39.0, 35.0, 42.0, 64.0, 74.0, 80.0, 107.0, 105.0, 83.0, 43.0, 37.0, 41.0, 38.0, 22.0, 21.0, 11.0, 15.0, 13.0, 8.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.38739013671875, -2.3099365234375, -2.23248291015625, -2.155029296875, -2.07757568359375, -2.0001220703125, -1.92266845703125, -1.84521484375, -1.76776123046875, -1.6903076171875, -1.61285400390625, -1.535400390625, -1.45794677734375, -1.3804931640625, -1.30303955078125, -1.2255859375, -1.14813232421875, -1.0706787109375, -0.99322509765625, -0.915771484375, -0.83831787109375, -0.7608642578125, -0.68341064453125, -0.60595703125, -0.52850341796875, -0.4510498046875, -0.37359619140625, -0.296142578125, -0.21868896484375, -0.1412353515625, -0.06378173828125, 0.013671875, 0.09112548828125, 0.1685791015625, 0.24603271484375, 0.323486328125, 0.40093994140625, 0.4783935546875, 0.55584716796875, 0.63330078125, 0.71075439453125, 0.7882080078125, 0.86566162109375, 0.943115234375, 1.02056884765625, 1.0980224609375, 1.17547607421875, 1.2529296875, 1.33038330078125, 1.4078369140625, 1.48529052734375, 1.562744140625, 1.64019775390625, 1.7176513671875, 1.79510498046875, 1.87255859375, 1.95001220703125, 2.0274658203125, 2.10491943359375, 2.182373046875, 2.25982666015625, 2.3372802734375, 2.41473388671875, 2.4921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 11.0, 31.0, 63.0, 133.0, 217.0, 209.0, 133.0, 91.0, 53.0, 20.0, 7.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.09856414794922, -53.26109313964844, -51.42361831665039, -49.58614730834961, -47.74867630004883, -45.91120147705078, -44.07373046875, -42.23625946044922, -40.39878845214844, -38.561317443847656, -36.72384262084961, -34.88637161254883, -33.04890060424805, -31.211427688598633, -29.37395477294922, -27.536483764648438, -25.699010848999023, -23.86153793334961, -22.024066925048828, -20.186594009399414, -18.349123001098633, -16.51165008544922, -14.674178123474121, -12.836706161499023, -10.999234199523926, -9.161762237548828, -7.3242902755737305, -5.486817836761475, -3.649345874786377, -1.811873435974121, 0.025598526000976562, 1.8630704879760742, 3.700542449951172, 5.5380144119262695, 7.375486373901367, 9.212959289550781, 11.050430297851562, 12.887903213500977, 14.725375175476074, 16.562847137451172, 18.400318145751953, 20.237791061401367, 22.07526206970215, 23.912734985351562, 25.750205993652344, 27.587678909301758, 29.425151824951172, 31.262622833251953, 33.10009765625, 34.93756866455078, 36.77504348754883, 38.61251449584961, 40.44998550415039, 42.28746032714844, 44.12493133544922, 45.96240234375, 47.79987335205078, 49.63734436035156, 51.47481918334961, 53.31229019165039, 55.14976119995117, 56.98723602294922, 58.82470703125, 60.66217803955078, 62.49964904785156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 2.0, 19.0, 16.0, 19.0, 17.0, 14.0, 21.0, 27.0, 31.0, 29.0, 44.0, 50.0, 47.0, 77.0, 75.0, 62.0, 58.0, 76.0, 36.0, 37.0, 42.0, 27.0, 27.0, 31.0, 18.0, 13.0, 13.0, 10.0, 7.0, 10.0, 4.0, 9.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.8331413269043, -34.77885818481445, -33.72457504272461, -32.67029571533203, -31.616012573242188, -30.561729431152344, -29.5074462890625, -28.453163146972656, -27.398881912231445, -26.3445987701416, -25.29031753540039, -24.236034393310547, -23.181751251220703, -22.127470016479492, -21.07318687438965, -20.018905639648438, -18.964622497558594, -17.91033935546875, -16.85605812072754, -15.801774978637695, -14.747492790222168, -13.69321060180664, -12.638927459716797, -11.58464527130127, -10.530363082885742, -9.476080894470215, -8.421798706054688, -7.367515563964844, -6.313233375549316, -5.258951187133789, -4.2046685218811035, -3.150385856628418, -2.096101760864258, -1.0418193340301514, 0.012463092803955078, 1.0667455196380615, 2.121027946472168, 3.1753101348876953, 4.229592800140381, 5.283875465393066, 6.338157653808594, 7.392439842224121, 8.446722030639648, 9.501005172729492, 10.55528736114502, 11.609569549560547, 12.66385269165039, 13.718134880065918, 14.772417068481445, 15.826699256896973, 16.8809814453125, 17.935264587402344, 18.989547729492188, 20.0438289642334, 21.098112106323242, 22.152393341064453, 23.206676483154297, 24.26095962524414, 25.31524085998535, 26.369524002075195, 27.423805236816406, 28.47808837890625, 29.532371520996094, 30.586654663085938, 31.64093589782715]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 5.0, 5.0, 15.0, 7.0, 16.0, 22.0, 31.0, 36.0, 77.0, 103.0, 186.0, 328.0, 646.0, 1432.0, 3471.0, 9644.0, 32890.0, 186602.0, 2523138.0, 1294798.0, 104330.0, 23444.0, 7708.0, 2893.0, 1252.0, 558.0, 270.0, 149.0, 71.0, 37.0, 33.0, 28.0, 15.0, 9.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0], "bins": [-5.25, -5.12750244140625, -5.0050048828125, -4.88250732421875, -4.760009765625, -4.63751220703125, -4.5150146484375, -4.39251708984375, -4.27001953125, -4.14752197265625, -4.0250244140625, -3.90252685546875, -3.780029296875, -3.65753173828125, -3.5350341796875, -3.41253662109375, -3.2900390625, -3.16754150390625, -3.0450439453125, -2.92254638671875, -2.800048828125, -2.67755126953125, -2.5550537109375, -2.43255615234375, -2.31005859375, -2.18756103515625, -2.0650634765625, -1.94256591796875, -1.820068359375, -1.69757080078125, -1.5750732421875, -1.45257568359375, -1.330078125, -1.20758056640625, -1.0850830078125, -0.96258544921875, -0.840087890625, -0.71759033203125, -0.5950927734375, -0.47259521484375, -0.35009765625, -0.22760009765625, -0.1051025390625, 0.01739501953125, 0.139892578125, 0.26239013671875, 0.3848876953125, 0.50738525390625, 0.6298828125, 0.75238037109375, 0.8748779296875, 0.99737548828125, 1.119873046875, 1.24237060546875, 1.3648681640625, 1.48736572265625, 1.60986328125, 1.73236083984375, 1.8548583984375, 1.97735595703125, 2.099853515625, 2.22235107421875, 2.3448486328125, 2.46734619140625, 2.58984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 7.0, 16.0, 12.0, 14.0, 20.0, 21.0, 25.0, 35.0, 37.0, 52.0, 47.0, 50.0, 67.0, 62.0, 53.0, 59.0, 55.0, 51.0, 61.0, 60.0, 41.0, 33.0, 22.0, 25.0, 23.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.904144287109375, -2.83172607421875, -2.759307861328125, -2.6868896484375, -2.614471435546875, -2.54205322265625, -2.469635009765625, -2.397216796875, -2.324798583984375, -2.25238037109375, -2.179962158203125, -2.1075439453125, -2.035125732421875, -1.96270751953125, -1.890289306640625, -1.81787109375, -1.745452880859375, -1.67303466796875, -1.600616455078125, -1.5281982421875, -1.455780029296875, -1.38336181640625, -1.310943603515625, -1.238525390625, -1.166107177734375, -1.09368896484375, -1.021270751953125, -0.9488525390625, -0.876434326171875, -0.80401611328125, -0.731597900390625, -0.6591796875, -0.586761474609375, -0.51434326171875, -0.441925048828125, -0.3695068359375, -0.297088623046875, -0.22467041015625, -0.152252197265625, -0.079833984375, -0.007415771484375, 0.06500244140625, 0.137420654296875, 0.2098388671875, 0.282257080078125, 0.35467529296875, 0.427093505859375, 0.49951171875, 0.571929931640625, 0.64434814453125, 0.716766357421875, 0.7891845703125, 0.861602783203125, 0.93402099609375, 1.006439208984375, 1.078857421875, 1.151275634765625, 1.22369384765625, 1.296112060546875, 1.3685302734375, 1.440948486328125, 1.51336669921875, 1.585784912109375, 1.658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 9.0, 5.0, 5.0, 12.0, 13.0, 26.0, 33.0, 55.0, 106.0, 170.0, 346.0, 683.0, 1426.0, 3606.0, 9987.0, 32886.0, 170092.0, 2864419.0, 996518.0, 82217.0, 19958.0, 6637.0, 2547.0, 1156.0, 562.0, 304.0, 183.0, 105.0, 52.0, 44.0, 36.0, 14.0, 14.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.8037109375, -4.642578125, -4.4814453125, -4.3203125, -4.1591796875, -3.998046875, -3.8369140625, -3.67578125, -3.5146484375, -3.353515625, -3.1923828125, -3.03125, -2.8701171875, -2.708984375, -2.5478515625, -2.38671875, -2.2255859375, -2.064453125, -1.9033203125, -1.7421875, -1.5810546875, -1.419921875, -1.2587890625, -1.09765625, -0.9365234375, -0.775390625, -0.6142578125, -0.453125, -0.2919921875, -0.130859375, 0.0302734375, 0.19140625, 0.3525390625, 0.513671875, 0.6748046875, 0.8359375, 0.9970703125, 1.158203125, 1.3193359375, 1.48046875, 1.6416015625, 1.802734375, 1.9638671875, 2.125, 2.2861328125, 2.447265625, 2.6083984375, 2.76953125, 2.9306640625, 3.091796875, 3.2529296875, 3.4140625, 3.5751953125, 3.736328125, 3.8974609375, 4.05859375, 4.2197265625, 4.380859375, 4.5419921875, 4.703125, 4.8642578125, 5.025390625, 5.1865234375, 5.34765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 18.0, 16.0, 21.0, 25.0, 38.0, 57.0, 78.0, 113.0, 182.0, 365.0, 704.0, 850.0, 638.0, 385.0, 205.0, 127.0, 63.0, 43.0, 36.0, 19.0, 14.0, 18.0, 7.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.99029541015625, -3.8126220703125, -3.63494873046875, -3.457275390625, -3.27960205078125, -3.1019287109375, -2.92425537109375, -2.74658203125, -2.56890869140625, -2.3912353515625, -2.21356201171875, -2.035888671875, -1.85821533203125, -1.6805419921875, -1.50286865234375, -1.3251953125, -1.14752197265625, -0.9698486328125, -0.79217529296875, -0.614501953125, -0.43682861328125, -0.2591552734375, -0.08148193359375, 0.09619140625, 0.27386474609375, 0.4515380859375, 0.62921142578125, 0.806884765625, 0.98455810546875, 1.1622314453125, 1.33990478515625, 1.517578125, 1.69525146484375, 1.8729248046875, 2.05059814453125, 2.228271484375, 2.40594482421875, 2.5836181640625, 2.76129150390625, 2.93896484375, 3.11663818359375, 3.2943115234375, 3.47198486328125, 3.649658203125, 3.82733154296875, 4.0050048828125, 4.18267822265625, 4.3603515625, 4.53802490234375, 4.7156982421875, 4.89337158203125, 5.071044921875, 5.24871826171875, 5.4263916015625, 5.60406494140625, 5.78173828125, 5.95941162109375, 6.1370849609375, 6.31475830078125, 6.492431640625, 6.67010498046875, 6.8477783203125, 7.02545166015625, 7.203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 12.0, 23.0, 79.0, 150.0, 251.0, 245.0, 140.0, 50.0, 18.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.43997192382812, -87.19168853759766, -84.94339752197266, -82.69511413574219, -80.44683074951172, -78.19854736328125, -75.95025634765625, -73.70197296142578, -71.45368957519531, -69.20540618896484, -66.95711517333984, -64.70883178710938, -62.460548400878906, -60.21226119995117, -57.96397399902344, -55.71569061279297, -53.467403411865234, -51.2191162109375, -48.97083282470703, -46.7225456237793, -44.47426223754883, -42.225975036621094, -39.977691650390625, -37.72940444946289, -35.481117248535156, -33.23283004760742, -30.984546661376953, -28.73625946044922, -26.48797607421875, -24.239688873291016, -21.991403579711914, -19.743118286132812, -17.494834899902344, -15.246549606323242, -12.99826431274414, -10.749978065490723, -8.501692771911621, -6.2534074783325195, -4.005121231079102, -1.7568359375, 0.49144935607910156, 2.7397348880767822, 4.988020420074463, 7.236306190490723, 9.484591484069824, 11.732876777648926, 13.981163024902344, 16.229448318481445, 18.477733612060547, 20.72601890563965, 22.97430419921875, 25.222591400146484, 27.470874786376953, 29.719161987304688, 31.96744728088379, 34.21573257446289, 36.464019775390625, 38.71230697631836, 40.96059036254883, 43.20887756347656, 45.45716094970703, 47.705448150634766, 49.9537353515625, 52.20201873779297, 54.45030212402344]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 13.0, 9.0, 15.0, 21.0, 24.0, 19.0, 18.0, 19.0, 20.0, 35.0, 46.0, 30.0, 38.0, 48.0, 57.0, 53.0, 37.0, 48.0, 52.0, 34.0, 44.0, 32.0, 44.0, 21.0, 25.0, 25.0, 27.0, 27.0, 20.0, 12.0, 17.0, 16.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.417434692382812, -21.777280807495117, -21.137126922607422, -20.49697494506836, -19.856821060180664, -19.21666717529297, -18.576513290405273, -17.936359405517578, -17.296207427978516, -16.65605354309082, -16.015899658203125, -15.375746726989746, -14.735593795776367, -14.095439910888672, -13.455286026000977, -12.815133094787598, -12.174979209899902, -11.534825325012207, -10.894672393798828, -10.254518508911133, -9.614365577697754, -8.974211692810059, -8.33405876159668, -7.693904876708984, -7.053751468658447, -6.41359806060791, -5.773444652557373, -5.133291244506836, -4.493137359619141, -3.8529841899871826, -3.2128305435180664, -2.5726771354675293, -1.9325237274169922, -1.292370319366455, -0.6522167921066284, -0.012063264846801758, 0.6280901432037354, 1.2682435512542725, 1.9083971977233887, 2.548550605773926, 3.188704013824463, 3.828857421875, 4.469010829925537, 5.109164237976074, 5.7493181228637695, 6.389471054077148, 7.029624938964844, 7.669778347015381, 8.309931755065918, 8.950085639953613, 9.590238571166992, 10.230392456054688, 10.870545387268066, 11.510699272155762, 12.15085220336914, 12.791006088256836, 13.431159973144531, 14.071313858032227, 14.711466789245605, 15.3516206741333, 15.99177360534668, 16.631927490234375, 17.27208137512207, 17.912235260009766, 18.552387237548828]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 24.0, 17.0, 40.0, 46.0, 57.0, 106.0, 156.0, 239.0, 387.0, 573.0, 951.0, 1729.0, 3391.0, 7068.0, 18173.0, 64472.0, 289377.0, 467499.0, 139740.0, 33015.0, 10933.0, 4843.0, 2380.0, 1259.0, 738.0, 455.0, 294.0, 184.0, 106.0, 96.0, 62.0, 38.0, 27.0, 22.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.09173583984375, -2.9822998046875, -2.87286376953125, -2.763427734375, -2.65399169921875, -2.5445556640625, -2.43511962890625, -2.32568359375, -2.21624755859375, -2.1068115234375, -1.99737548828125, -1.887939453125, -1.77850341796875, -1.6690673828125, -1.55963134765625, -1.4501953125, -1.34075927734375, -1.2313232421875, -1.12188720703125, -1.012451171875, -0.90301513671875, -0.7935791015625, -0.68414306640625, -0.57470703125, -0.46527099609375, -0.3558349609375, -0.24639892578125, -0.136962890625, -0.02752685546875, 0.0819091796875, 0.19134521484375, 0.30078125, 0.41021728515625, 0.5196533203125, 0.62908935546875, 0.738525390625, 0.84796142578125, 0.9573974609375, 1.06683349609375, 1.17626953125, 1.28570556640625, 1.3951416015625, 1.50457763671875, 1.614013671875, 1.72344970703125, 1.8328857421875, 1.94232177734375, 2.0517578125, 2.16119384765625, 2.2706298828125, 2.38006591796875, 2.489501953125, 2.59893798828125, 2.7083740234375, 2.81781005859375, 2.92724609375, 3.03668212890625, 3.1461181640625, 3.25555419921875, 3.364990234375, 3.47442626953125, 3.5838623046875, 3.69329833984375, 3.802734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 17.0, 16.0, 21.0, 27.0, 18.0, 29.0, 46.0, 42.0, 44.0, 61.0, 50.0, 57.0, 53.0, 64.0, 66.0, 57.0, 46.0, 36.0, 36.0, 31.0, 32.0, 24.0, 21.0, 12.0, 16.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.869140625, -2.7957916259765625, -2.722442626953125, -2.6490936279296875, -2.57574462890625, -2.5023956298828125, -2.429046630859375, -2.3556976318359375, -2.2823486328125, -2.2089996337890625, -2.135650634765625, -2.0623016357421875, -1.98895263671875, -1.9156036376953125, -1.842254638671875, -1.7689056396484375, -1.695556640625, -1.6222076416015625, -1.548858642578125, -1.4755096435546875, -1.40216064453125, -1.3288116455078125, -1.255462646484375, -1.1821136474609375, -1.1087646484375, -1.0354156494140625, -0.962066650390625, -0.8887176513671875, -0.81536865234375, -0.7420196533203125, -0.668670654296875, -0.5953216552734375, -0.52197265625, -0.4486236572265625, -0.375274658203125, -0.3019256591796875, -0.22857666015625, -0.1552276611328125, -0.081878662109375, -0.0085296630859375, 0.0648193359375, 0.1381683349609375, 0.211517333984375, 0.2848663330078125, 0.35821533203125, 0.4315643310546875, 0.504913330078125, 0.5782623291015625, 0.651611328125, 0.7249603271484375, 0.798309326171875, 0.8716583251953125, 0.94500732421875, 1.0183563232421875, 1.091705322265625, 1.1650543212890625, 1.2384033203125, 1.3117523193359375, 1.385101318359375, 1.4584503173828125, 1.53179931640625, 1.6051483154296875, 1.678497314453125, 1.7518463134765625, 1.8251953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 10.0, 20.0, 25.0, 39.0, 62.0, 93.0, 128.0, 279.0, 615.0, 1414.0, 3743.0, 15811.0, 161969.0, 778769.0, 71215.0, 9423.0, 2776.0, 1057.0, 477.0, 261.0, 139.0, 73.0, 46.0, 33.0, 21.0, 13.0, 9.0, 9.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.2042236328125, -5.013916015625, -4.8236083984375, -4.63330078125, -4.4429931640625, -4.252685546875, -4.0623779296875, -3.8720703125, -3.6817626953125, -3.491455078125, -3.3011474609375, -3.11083984375, -2.9205322265625, -2.730224609375, -2.5399169921875, -2.349609375, -2.1593017578125, -1.968994140625, -1.7786865234375, -1.58837890625, -1.3980712890625, -1.207763671875, -1.0174560546875, -0.8271484375, -0.6368408203125, -0.446533203125, -0.2562255859375, -0.06591796875, 0.1243896484375, 0.314697265625, 0.5050048828125, 0.6953125, 0.8856201171875, 1.075927734375, 1.2662353515625, 1.45654296875, 1.6468505859375, 1.837158203125, 2.0274658203125, 2.2177734375, 2.4080810546875, 2.598388671875, 2.7886962890625, 2.97900390625, 3.1693115234375, 3.359619140625, 3.5499267578125, 3.740234375, 3.9305419921875, 4.120849609375, 4.3111572265625, 4.50146484375, 4.6917724609375, 4.882080078125, 5.0723876953125, 5.2626953125, 5.4530029296875, 5.643310546875, 5.8336181640625, 6.02392578125, 6.2142333984375, 6.404541015625, 6.5948486328125, 6.78515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 11.0, 15.0, 23.0, 13.0, 18.0, 19.0, 24.0, 42.0, 51.0, 37.0, 41.0, 41.0, 45.0, 50.0, 57.0, 59.0, 39.0, 51.0, 36.0, 45.0, 30.0, 25.0, 28.0, 25.0, 31.0, 24.0, 26.0, 12.0, 13.0, 17.0, 2.0, 3.0, 8.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.63671875, -7.4022216796875, -7.167724609375, -6.9332275390625, -6.69873046875, -6.4642333984375, -6.229736328125, -5.9952392578125, -5.7607421875, -5.5262451171875, -5.291748046875, -5.0572509765625, -4.82275390625, -4.5882568359375, -4.353759765625, -4.1192626953125, -3.884765625, -3.6502685546875, -3.415771484375, -3.1812744140625, -2.94677734375, -2.7122802734375, -2.477783203125, -2.2432861328125, -2.0087890625, -1.7742919921875, -1.539794921875, -1.3052978515625, -1.07080078125, -0.8363037109375, -0.601806640625, -0.3673095703125, -0.1328125, 0.1016845703125, 0.336181640625, 0.5706787109375, 0.80517578125, 1.0396728515625, 1.274169921875, 1.5086669921875, 1.7431640625, 1.9776611328125, 2.212158203125, 2.4466552734375, 2.68115234375, 2.9156494140625, 3.150146484375, 3.3846435546875, 3.619140625, 3.8536376953125, 4.088134765625, 4.3226318359375, 4.55712890625, 4.7916259765625, 5.026123046875, 5.2606201171875, 5.4951171875, 5.7296142578125, 5.964111328125, 6.1986083984375, 6.43310546875, 6.6676025390625, 6.902099609375, 7.1365966796875, 7.37109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 14.0, 13.0, 36.0, 78.0, 126.0, 246.0, 513.0, 1099.0, 2867.0, 10215.0, 48258.0, 349253.0, 563153.0, 55687.0, 11370.0, 3415.0, 1171.0, 498.0, 251.0, 112.0, 82.0, 36.0, 16.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.229400634765625, -2.16192626953125, -2.094451904296875, -2.0269775390625, -1.959503173828125, -1.89202880859375, -1.824554443359375, -1.757080078125, -1.689605712890625, -1.62213134765625, -1.554656982421875, -1.4871826171875, -1.419708251953125, -1.35223388671875, -1.284759521484375, -1.21728515625, -1.149810791015625, -1.08233642578125, -1.014862060546875, -0.9473876953125, -0.879913330078125, -0.81243896484375, -0.744964599609375, -0.677490234375, -0.610015869140625, -0.54254150390625, -0.475067138671875, -0.4075927734375, -0.340118408203125, -0.27264404296875, -0.205169677734375, -0.1376953125, -0.070220947265625, -0.00274658203125, 0.064727783203125, 0.1322021484375, 0.199676513671875, 0.26715087890625, 0.334625244140625, 0.402099609375, 0.469573974609375, 0.53704833984375, 0.604522705078125, 0.6719970703125, 0.739471435546875, 0.80694580078125, 0.874420166015625, 0.94189453125, 1.009368896484375, 1.07684326171875, 1.144317626953125, 1.2117919921875, 1.279266357421875, 1.34674072265625, 1.414215087890625, 1.481689453125, 1.549163818359375, 1.61663818359375, 1.684112548828125, 1.7515869140625, 1.819061279296875, 1.88653564453125, 1.954010009765625, 2.021484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 11.0, 5.0, 16.0, 13.0, 15.0, 29.0, 47.0, 52.0, 70.0, 111.0, 112.0, 125.0, 117.0, 81.0, 67.0, 25.0, 30.0, 16.0, 15.0, 10.0, 3.0, 6.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038123130798339844, -0.00036537274718284607, -0.0003495141863822937, -0.00033365562558174133, -0.00031779706478118896, -0.0003019385039806366, -0.00028607994318008423, -0.00027022138237953186, -0.0002543628215789795, -0.00023850426077842712, -0.00022264569997787476, -0.0002067871391773224, -0.00019092857837677002, -0.00017507001757621765, -0.00015921145677566528, -0.00014335289597511292, -0.00012749433517456055, -0.00011163577437400818, -9.577721357345581e-05, -7.991865277290344e-05, -6.406009197235107e-05, -4.8201531171798706e-05, -3.234297037124634e-05, -1.648440957069397e-05, -6.258487701416016e-07, 1.5232712030410767e-05, 3.1091272830963135e-05, 4.69498336315155e-05, 6.280839443206787e-05, 7.866695523262024e-05, 9.452551603317261e-05, 0.00011038407683372498, 0.00012624263763427734, 0.0001421011984348297, 0.00015795975923538208, 0.00017381832003593445, 0.00018967688083648682, 0.00020553544163703918, 0.00022139400243759155, 0.00023725256323814392, 0.0002531111240386963, 0.00026896968483924866, 0.000284828245639801, 0.0003006868064403534, 0.00031654536724090576, 0.00033240392804145813, 0.0003482624888420105, 0.00036412104964256287, 0.00037997961044311523, 0.0003958381712436676, 0.00041169673204421997, 0.00042755529284477234, 0.0004434138536453247, 0.0004592724144458771, 0.00047513097524642944, 0.0004909895360469818, 0.0005068480968475342, 0.0005227066576480865, 0.0005385652184486389, 0.0005544237792491913, 0.0005702823400497437, 0.000586140900850296, 0.0006019994616508484, 0.0006178580224514008, 0.0006337165832519531]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 12.0, 30.0, 45.0, 80.0, 151.0, 346.0, 1132.0, 5459.0, 60354.0, 884139.0, 87844.0, 6841.0, 1349.0, 406.0, 155.0, 99.0, 38.0, 24.0, 11.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.938812255859375, -4.80731201171875, -4.675811767578125, -4.5443115234375, -4.412811279296875, -4.28131103515625, -4.149810791015625, -4.018310546875, -3.886810302734375, -3.75531005859375, -3.623809814453125, -3.4923095703125, -3.360809326171875, -3.22930908203125, -3.097808837890625, -2.96630859375, -2.834808349609375, -2.70330810546875, -2.571807861328125, -2.4403076171875, -2.308807373046875, -2.17730712890625, -2.045806884765625, -1.914306640625, -1.782806396484375, -1.65130615234375, -1.519805908203125, -1.3883056640625, -1.256805419921875, -1.12530517578125, -0.993804931640625, -0.8623046875, -0.730804443359375, -0.59930419921875, -0.467803955078125, -0.3363037109375, -0.204803466796875, -0.07330322265625, 0.058197021484375, 0.189697265625, 0.321197509765625, 0.45269775390625, 0.584197998046875, 0.7156982421875, 0.847198486328125, 0.97869873046875, 1.110198974609375, 1.24169921875, 1.373199462890625, 1.50469970703125, 1.636199951171875, 1.7677001953125, 1.899200439453125, 2.03070068359375, 2.162200927734375, 2.293701171875, 2.425201416015625, 2.55670166015625, 2.688201904296875, 2.8197021484375, 2.951202392578125, 3.08270263671875, 3.214202880859375, 3.345703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 11.0, 7.0, 12.0, 22.0, 19.0, 38.0, 39.0, 57.0, 65.0, 84.0, 86.0, 80.0, 98.0, 87.0, 75.0, 45.0, 32.0, 33.0, 18.0, 22.0, 11.0, 12.0, 5.0, 7.0, 9.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.35791015625, -2.2958984375, -2.23388671875, -2.171875, -2.10986328125, -2.0478515625, -1.98583984375, -1.923828125, -1.86181640625, -1.7998046875, -1.73779296875, -1.67578125, -1.61376953125, -1.5517578125, -1.48974609375, -1.427734375, -1.36572265625, -1.3037109375, -1.24169921875, -1.1796875, -1.11767578125, -1.0556640625, -0.99365234375, -0.931640625, -0.86962890625, -0.8076171875, -0.74560546875, -0.68359375, -0.62158203125, -0.5595703125, -0.49755859375, -0.435546875, -0.37353515625, -0.3115234375, -0.24951171875, -0.1875, -0.12548828125, -0.0634765625, -0.00146484375, 0.060546875, 0.12255859375, 0.1845703125, 0.24658203125, 0.30859375, 0.37060546875, 0.4326171875, 0.49462890625, 0.556640625, 0.61865234375, 0.6806640625, 0.74267578125, 0.8046875, 0.86669921875, 0.9287109375, 0.99072265625, 1.052734375, 1.11474609375, 1.1767578125, 1.23876953125, 1.30078125, 1.36279296875, 1.4248046875, 1.48681640625, 1.548828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 8.0, 16.0, 19.0, 32.0, 78.0, 144.0, 247.0, 228.0, 116.0, 55.0, 24.0, 8.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.43402862548828, -44.93017578125, -43.42632293701172, -41.9224739074707, -40.41862106323242, -38.91476821899414, -37.410919189453125, -35.907066345214844, -34.40321350097656, -32.89936065673828, -31.395509719848633, -29.891658782958984, -28.387805938720703, -26.883953094482422, -25.380102157592773, -23.876251220703125, -22.372398376464844, -20.868545532226562, -19.364694595336914, -17.860843658447266, -16.356990814208984, -14.85313892364502, -13.349287033081055, -11.84543514251709, -10.341583251953125, -8.83773136138916, -7.333879470825195, -5.8300275802612305, -4.326175689697266, -2.822323799133301, -1.318471908569336, 0.1853799819946289, 1.6892318725585938, 3.1930837631225586, 4.696935653686523, 6.200787544250488, 7.704639434814453, 9.208491325378418, 10.712343215942383, 12.216195106506348, 13.720046997070312, 15.223898887634277, 16.727750778198242, 18.23160171508789, 19.735454559326172, 21.239307403564453, 22.7431583404541, 24.24700927734375, 25.75086212158203, 27.254714965820312, 28.75856590270996, 30.26241683959961, 31.76626968383789, 33.27012252807617, 34.77397155761719, 36.27782440185547, 37.78167724609375, 39.28553009033203, 40.78938293457031, 42.29323196411133, 43.79708480834961, 45.30093765258789, 46.804786682128906, 48.30863952636719, 49.81249237060547]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 4.0, 12.0, 10.0, 11.0, 17.0, 12.0, 18.0, 27.0, 16.0, 27.0, 33.0, 28.0, 39.0, 34.0, 60.0, 68.0, 80.0, 63.0, 73.0, 56.0, 42.0, 30.0, 32.0, 27.0, 20.0, 19.0, 31.0, 14.0, 10.0, 15.0, 10.0, 9.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.821874618530273, -29.876317977905273, -28.930763244628906, -27.985206604003906, -27.039649963378906, -26.094093322753906, -25.148536682128906, -24.20298194885254, -23.25742530822754, -22.31186866760254, -21.366313934326172, -20.420757293701172, -19.475200653076172, -18.529644012451172, -17.584087371826172, -16.638532638549805, -15.692975997924805, -14.747419357299805, -13.801863670349121, -12.856307983398438, -11.910751342773438, -10.965194702148438, -10.019639015197754, -9.07408332824707, -8.12852668762207, -7.1829705238342285, -6.237414360046387, -5.291858196258545, -4.346302032470703, -3.4007458686828613, -2.4551897048950195, -1.5096335411071777, -0.5640754699707031, 0.38148069381713867, 1.3270368576049805, 2.2725930213928223, 3.218149185180664, 4.163705348968506, 5.109261512756348, 6.0548176765441895, 7.000373840332031, 7.945930004119873, 8.891486167907715, 9.837041854858398, 10.782598495483398, 11.728155136108398, 12.673710823059082, 13.619266510009766, 14.564823150634766, 15.510379791259766, 16.455936431884766, 17.401491165161133, 18.347047805786133, 19.292604446411133, 20.2381591796875, 21.1837158203125, 22.1292724609375, 23.0748291015625, 24.0203857421875, 24.965940475463867, 25.911497116088867, 26.857053756713867, 27.802608489990234, 28.748165130615234, 29.693721771240234]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 16.0, 18.0, 46.0, 55.0, 97.0, 180.0, 334.0, 557.0, 1181.0, 2680.0, 6723.0, 20845.0, 100576.0, 1197512.0, 2591532.0, 220243.0, 34329.0, 9964.0, 3914.0, 1664.0, 814.0, 432.0, 211.0, 131.0, 65.0, 50.0, 29.0, 22.0, 9.0, 11.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.244293212890625, -3.13311767578125, -3.021942138671875, -2.9107666015625, -2.799591064453125, -2.68841552734375, -2.577239990234375, -2.466064453125, -2.354888916015625, -2.24371337890625, -2.132537841796875, -2.0213623046875, -1.910186767578125, -1.79901123046875, -1.687835693359375, -1.57666015625, -1.465484619140625, -1.35430908203125, -1.243133544921875, -1.1319580078125, -1.020782470703125, -0.90960693359375, -0.798431396484375, -0.687255859375, -0.576080322265625, -0.46490478515625, -0.353729248046875, -0.2425537109375, -0.131378173828125, -0.02020263671875, 0.090972900390625, 0.2021484375, 0.313323974609375, 0.42449951171875, 0.535675048828125, 0.6468505859375, 0.758026123046875, 0.86920166015625, 0.980377197265625, 1.091552734375, 1.202728271484375, 1.31390380859375, 1.425079345703125, 1.5362548828125, 1.647430419921875, 1.75860595703125, 1.869781494140625, 1.98095703125, 2.092132568359375, 2.20330810546875, 2.314483642578125, 2.4256591796875, 2.536834716796875, 2.64801025390625, 2.759185791015625, 2.870361328125, 2.981536865234375, 3.09271240234375, 3.203887939453125, 3.3150634765625, 3.426239013671875, 3.53741455078125, 3.648590087890625, 3.759765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 8.0, 10.0, 16.0, 9.0, 23.0, 21.0, 20.0, 37.0, 33.0, 46.0, 39.0, 47.0, 43.0, 47.0, 46.0, 54.0, 50.0, 47.0, 47.0, 43.0, 47.0, 50.0, 34.0, 35.0, 23.0, 18.0, 24.0, 17.0, 11.0, 15.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3984375, -2.33551025390625, -2.2725830078125, -2.20965576171875, -2.146728515625, -2.08380126953125, -2.0208740234375, -1.95794677734375, -1.89501953125, -1.83209228515625, -1.7691650390625, -1.70623779296875, -1.643310546875, -1.58038330078125, -1.5174560546875, -1.45452880859375, -1.3916015625, -1.32867431640625, -1.2657470703125, -1.20281982421875, -1.139892578125, -1.07696533203125, -1.0140380859375, -0.95111083984375, -0.88818359375, -0.82525634765625, -0.7623291015625, -0.69940185546875, -0.636474609375, -0.57354736328125, -0.5106201171875, -0.44769287109375, -0.384765625, -0.32183837890625, -0.2589111328125, -0.19598388671875, -0.133056640625, -0.07012939453125, -0.0072021484375, 0.05572509765625, 0.11865234375, 0.18157958984375, 0.2445068359375, 0.30743408203125, 0.370361328125, 0.43328857421875, 0.4962158203125, 0.55914306640625, 0.6220703125, 0.68499755859375, 0.7479248046875, 0.81085205078125, 0.873779296875, 0.93670654296875, 0.9996337890625, 1.06256103515625, 1.12548828125, 1.18841552734375, 1.2513427734375, 1.31427001953125, 1.377197265625, 1.44012451171875, 1.5030517578125, 1.56597900390625, 1.62890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 17.0, 13.0, 20.0, 29.0, 52.0, 100.0, 202.0, 512.0, 1536.0, 5289.0, 26583.0, 329817.0, 3647591.0, 159001.0, 17471.0, 3883.0, 1223.0, 463.0, 201.0, 112.0, 55.0, 29.0, 20.0, 18.0, 9.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.06951904296875, -6.8577880859375, -6.64605712890625, -6.434326171875, -6.22259521484375, -6.0108642578125, -5.79913330078125, -5.58740234375, -5.37567138671875, -5.1639404296875, -4.95220947265625, -4.740478515625, -4.52874755859375, -4.3170166015625, -4.10528564453125, -3.8935546875, -3.68182373046875, -3.4700927734375, -3.25836181640625, -3.046630859375, -2.83489990234375, -2.6231689453125, -2.41143798828125, -2.19970703125, -1.98797607421875, -1.7762451171875, -1.56451416015625, -1.352783203125, -1.14105224609375, -0.9293212890625, -0.71759033203125, -0.505859375, -0.29412841796875, -0.0823974609375, 0.12933349609375, 0.341064453125, 0.55279541015625, 0.7645263671875, 0.97625732421875, 1.18798828125, 1.39971923828125, 1.6114501953125, 1.82318115234375, 2.034912109375, 2.24664306640625, 2.4583740234375, 2.67010498046875, 2.8818359375, 3.09356689453125, 3.3052978515625, 3.51702880859375, 3.728759765625, 3.94049072265625, 4.1522216796875, 4.36395263671875, 4.57568359375, 4.78741455078125, 4.9991455078125, 5.21087646484375, 5.422607421875, 5.63433837890625, 5.8460693359375, 6.05780029296875, 6.26953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 9.0, 12.0, 6.0, 9.0, 15.0, 16.0, 25.0, 36.0, 63.0, 61.0, 97.0, 182.0, 320.0, 528.0, 822.0, 693.0, 427.0, 265.0, 159.0, 95.0, 70.0, 37.0, 26.0, 28.0, 18.0, 10.0, 9.0, 5.0, 4.0, 11.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.380615234375, -4.23388671875, -4.087158203125, -3.9404296875, -3.793701171875, -3.64697265625, -3.500244140625, -3.353515625, -3.206787109375, -3.06005859375, -2.913330078125, -2.7666015625, -2.619873046875, -2.47314453125, -2.326416015625, -2.1796875, -2.032958984375, -1.88623046875, -1.739501953125, -1.5927734375, -1.446044921875, -1.29931640625, -1.152587890625, -1.005859375, -0.859130859375, -0.71240234375, -0.565673828125, -0.4189453125, -0.272216796875, -0.12548828125, 0.021240234375, 0.16796875, 0.314697265625, 0.46142578125, 0.608154296875, 0.7548828125, 0.901611328125, 1.04833984375, 1.195068359375, 1.341796875, 1.488525390625, 1.63525390625, 1.781982421875, 1.9287109375, 2.075439453125, 2.22216796875, 2.368896484375, 2.515625, 2.662353515625, 2.80908203125, 2.955810546875, 3.1025390625, 3.249267578125, 3.39599609375, 3.542724609375, 3.689453125, 3.836181640625, 3.98291015625, 4.129638671875, 4.2763671875, 4.423095703125, 4.56982421875, 4.716552734375, 4.86328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 27.0, 56.0, 70.0, 104.0, 138.0, 125.0, 128.0, 96.0, 81.0, 44.0, 34.0, 25.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59521484375, -39.510807037353516, -38.42639923095703, -37.34198760986328, -36.2575798034668, -35.17317199707031, -34.08876037597656, -33.00435256958008, -31.919944763183594, -30.83553695678711, -29.751127243041992, -28.666717529296875, -27.58230972290039, -26.497901916503906, -25.41349220275879, -24.329082489013672, -23.244674682617188, -22.160266876220703, -21.075857162475586, -19.99144744873047, -18.907039642333984, -17.8226318359375, -16.738222122192383, -15.653813362121582, -14.569404602050781, -13.48499584197998, -12.40058708190918, -11.316178321838379, -10.231769561767578, -9.147360801696777, -8.062952041625977, -6.978543281555176, -5.894136428833008, -4.809727668762207, -3.7253189086914062, -2.6409101486206055, -1.5565013885498047, -0.4720926284790039, 0.6123161315917969, 1.6967248916625977, 2.7811336517333984, 3.865542411804199, 4.949951171875, 6.034359931945801, 7.118768692016602, 8.203177452087402, 9.287586212158203, 10.371994972229004, 11.456403732299805, 12.540812492370605, 13.625221252441406, 14.709630012512207, 15.794038772583008, 16.878448486328125, 17.96285629272461, 19.047264099121094, 20.13167381286621, 21.216083526611328, 22.300491333007812, 23.384899139404297, 24.469308853149414, 25.55371856689453, 26.638126373291016, 27.7225341796875, 28.806943893432617]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 14.0, 23.0, 18.0, 20.0, 37.0, 37.0, 35.0, 51.0, 55.0, 46.0, 55.0, 69.0, 88.0, 66.0, 63.0, 47.0, 35.0, 40.0, 34.0, 33.0, 20.0, 21.0, 20.0, 21.0, 5.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-29.58866310119629, -28.84001922607422, -28.09137535095215, -27.342731475830078, -26.59408950805664, -25.84544563293457, -25.0968017578125, -24.34815788269043, -23.59951400756836, -22.85087013244629, -22.10222625732422, -21.35358428955078, -20.60494041442871, -19.85629653930664, -19.10765266418457, -18.3590087890625, -17.610366821289062, -16.861722946166992, -16.113079071044922, -15.364436149597168, -14.615793228149414, -13.867149353027344, -13.118505477905273, -12.369861602783203, -11.62121868133545, -10.872574806213379, -10.123931884765625, -9.375288009643555, -8.626644134521484, -7.8780012130737305, -7.12935733795166, -6.380713939666748, -5.632072448730469, -4.883429050445557, -4.1347856521606445, -3.386141777038574, -2.637498378753662, -1.88885498046875, -1.1402111053466797, -0.3915677070617676, 0.35707569122314453, 1.1057192087173462, 1.8543627262115479, 2.603006362915039, 3.351649761199951, 4.100293159484863, 4.848937034606934, 5.597580432891846, 6.346223831176758, 7.09486722946167, 7.843510627746582, 8.592154502868652, 9.340797424316406, 10.089441299438477, 10.838085174560547, 11.586729049682617, 12.335371971130371, 13.084015846252441, 13.832658767700195, 14.581302642822266, 15.329946517944336, 16.078590393066406, 16.827232360839844, 17.575876235961914, 18.324520111083984]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 10.0, 14.0, 27.0, 28.0, 79.0, 94.0, 196.0, 332.0, 592.0, 1227.0, 2710.0, 7500.0, 27449.0, 171932.0, 638496.0, 159553.0, 25979.0, 7050.0, 2723.0, 1142.0, 574.0, 334.0, 205.0, 125.0, 62.0, 34.0, 27.0, 18.0, 17.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.02423095703125, -3.8922119140625, -3.76019287109375, -3.628173828125, -3.49615478515625, -3.3641357421875, -3.23211669921875, -3.10009765625, -2.96807861328125, -2.8360595703125, -2.70404052734375, -2.572021484375, -2.44000244140625, -2.3079833984375, -2.17596435546875, -2.0439453125, -1.91192626953125, -1.7799072265625, -1.64788818359375, -1.515869140625, -1.38385009765625, -1.2518310546875, -1.11981201171875, -0.98779296875, -0.85577392578125, -0.7237548828125, -0.59173583984375, -0.459716796875, -0.32769775390625, -0.1956787109375, -0.06365966796875, 0.068359375, 0.20037841796875, 0.3323974609375, 0.46441650390625, 0.596435546875, 0.72845458984375, 0.8604736328125, 0.99249267578125, 1.12451171875, 1.25653076171875, 1.3885498046875, 1.52056884765625, 1.652587890625, 1.78460693359375, 1.9166259765625, 2.04864501953125, 2.1806640625, 2.31268310546875, 2.4447021484375, 2.57672119140625, 2.708740234375, 2.84075927734375, 2.9727783203125, 3.10479736328125, 3.23681640625, 3.36883544921875, 3.5008544921875, 3.63287353515625, 3.764892578125, 3.89691162109375, 4.0289306640625, 4.16094970703125, 4.29296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 15.0, 8.0, 10.0, 12.0, 17.0, 21.0, 18.0, 22.0, 28.0, 34.0, 41.0, 46.0, 58.0, 57.0, 57.0, 50.0, 58.0, 41.0, 52.0, 54.0, 56.0, 42.0, 30.0, 33.0, 28.0, 16.0, 24.0, 20.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.158233642578125, -2.08599853515625, -2.013763427734375, -1.9415283203125, -1.869293212890625, -1.79705810546875, -1.724822998046875, -1.652587890625, -1.580352783203125, -1.50811767578125, -1.435882568359375, -1.3636474609375, -1.291412353515625, -1.21917724609375, -1.146942138671875, -1.07470703125, -1.002471923828125, -0.93023681640625, -0.858001708984375, -0.7857666015625, -0.713531494140625, -0.64129638671875, -0.569061279296875, -0.496826171875, -0.424591064453125, -0.35235595703125, -0.280120849609375, -0.2078857421875, -0.135650634765625, -0.06341552734375, 0.008819580078125, 0.0810546875, 0.153289794921875, 0.22552490234375, 0.297760009765625, 0.3699951171875, 0.442230224609375, 0.51446533203125, 0.586700439453125, 0.658935546875, 0.731170654296875, 0.80340576171875, 0.875640869140625, 0.9478759765625, 1.020111083984375, 1.09234619140625, 1.164581298828125, 1.23681640625, 1.309051513671875, 1.38128662109375, 1.453521728515625, 1.5257568359375, 1.597991943359375, 1.67022705078125, 1.742462158203125, 1.814697265625, 1.886932373046875, 1.95916748046875, 2.031402587890625, 2.1036376953125, 2.175872802734375, 2.24810791015625, 2.320343017578125, 2.392578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 4.0, 10.0, 10.0, 13.0, 19.0, 30.0, 36.0, 56.0, 79.0, 83.0, 140.0, 213.0, 334.0, 656.0, 1234.0, 2831.0, 8809.0, 43177.0, 517772.0, 417327.0, 41492.0, 8501.0, 2835.0, 1239.0, 601.0, 348.0, 207.0, 152.0, 93.0, 61.0, 50.0, 53.0, 19.0, 14.0, 13.0, 12.0, 8.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.046875, -4.906646728515625, -4.76641845703125, -4.626190185546875, -4.4859619140625, -4.345733642578125, -4.20550537109375, -4.065277099609375, -3.925048828125, -3.784820556640625, -3.64459228515625, -3.504364013671875, -3.3641357421875, -3.223907470703125, -3.08367919921875, -2.943450927734375, -2.80322265625, -2.662994384765625, -2.52276611328125, -2.382537841796875, -2.2423095703125, -2.102081298828125, -1.96185302734375, -1.821624755859375, -1.681396484375, -1.541168212890625, -1.40093994140625, -1.260711669921875, -1.1204833984375, -0.980255126953125, -0.84002685546875, -0.699798583984375, -0.5595703125, -0.419342041015625, -0.27911376953125, -0.138885498046875, 0.0013427734375, 0.141571044921875, 0.28179931640625, 0.422027587890625, 0.562255859375, 0.702484130859375, 0.84271240234375, 0.982940673828125, 1.1231689453125, 1.263397216796875, 1.40362548828125, 1.543853759765625, 1.68408203125, 1.824310302734375, 1.96453857421875, 2.104766845703125, 2.2449951171875, 2.385223388671875, 2.52545166015625, 2.665679931640625, 2.805908203125, 2.946136474609375, 3.08636474609375, 3.226593017578125, 3.3668212890625, 3.507049560546875, 3.64727783203125, 3.787506103515625, 3.927734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 15.0, 14.0, 13.0, 25.0, 26.0, 34.0, 35.0, 52.0, 53.0, 44.0, 65.0, 64.0, 52.0, 64.0, 54.0, 76.0, 49.0, 53.0, 37.0, 27.0, 23.0, 26.0, 16.0, 11.0, 9.0, 7.0, 6.0, 6.0, 6.0, 0.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8187255859375, -8.535888671875, -8.2530517578125, -7.97021484375, -7.6873779296875, -7.404541015625, -7.1217041015625, -6.8388671875, -6.5560302734375, -6.273193359375, -5.9903564453125, -5.70751953125, -5.4246826171875, -5.141845703125, -4.8590087890625, -4.576171875, -4.2933349609375, -4.010498046875, -3.7276611328125, -3.44482421875, -3.1619873046875, -2.879150390625, -2.5963134765625, -2.3134765625, -2.0306396484375, -1.747802734375, -1.4649658203125, -1.18212890625, -0.8992919921875, -0.616455078125, -0.3336181640625, -0.05078125, 0.2320556640625, 0.514892578125, 0.7977294921875, 1.08056640625, 1.3634033203125, 1.646240234375, 1.9290771484375, 2.2119140625, 2.4947509765625, 2.777587890625, 3.0604248046875, 3.34326171875, 3.6260986328125, 3.908935546875, 4.1917724609375, 4.474609375, 4.7574462890625, 5.040283203125, 5.3231201171875, 5.60595703125, 5.8887939453125, 6.171630859375, 6.4544677734375, 6.7373046875, 7.0201416015625, 7.302978515625, 7.5858154296875, 7.86865234375, 8.1514892578125, 8.434326171875, 8.7171630859375, 9.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 17.0, 24.0, 22.0, 62.0, 82.0, 129.0, 199.0, 323.0, 570.0, 1057.0, 2388.0, 5594.0, 15649.0, 58456.0, 627585.0, 271626.0, 43318.0, 12552.0, 4659.0, 1962.0, 1023.0, 493.0, 280.0, 179.0, 87.0, 56.0, 42.0, 36.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7517242431640625, -1.696807861328125, -1.6418914794921875, -1.58697509765625, -1.5320587158203125, -1.477142333984375, -1.4222259521484375, -1.3673095703125, -1.3123931884765625, -1.257476806640625, -1.2025604248046875, -1.14764404296875, -1.0927276611328125, -1.037811279296875, -0.9828948974609375, -0.927978515625, -0.8730621337890625, -0.818145751953125, -0.7632293701171875, -0.70831298828125, -0.6533966064453125, -0.598480224609375, -0.5435638427734375, -0.4886474609375, -0.4337310791015625, -0.378814697265625, -0.3238983154296875, -0.26898193359375, -0.2140655517578125, -0.159149169921875, -0.1042327880859375, -0.04931640625, 0.0055999755859375, 0.060516357421875, 0.1154327392578125, 0.17034912109375, 0.2252655029296875, 0.280181884765625, 0.3350982666015625, 0.3900146484375, 0.4449310302734375, 0.499847412109375, 0.5547637939453125, 0.60968017578125, 0.6645965576171875, 0.719512939453125, 0.7744293212890625, 0.829345703125, 0.8842620849609375, 0.939178466796875, 0.9940948486328125, 1.04901123046875, 1.1039276123046875, 1.158843994140625, 1.2137603759765625, 1.2686767578125, 1.3235931396484375, 1.378509521484375, 1.4334259033203125, 1.48834228515625, 1.5432586669921875, 1.598175048828125, 1.6530914306640625, 1.7080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 4.0, 13.0, 20.0, 32.0, 46.0, 58.0, 80.0, 122.0, 150.0, 146.0, 74.0, 67.0, 47.0, 26.0, 23.0, 16.0, 10.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005035400390625, -0.0004870593547821045, -0.000470578670501709, -0.0004540979862213135, -0.00043761730194091797, -0.00042113661766052246, -0.00040465593338012695, -0.00038817524909973145, -0.00037169456481933594, -0.00035521388053894043, -0.0003387331962585449, -0.0003222525119781494, -0.0003057718276977539, -0.0002892911434173584, -0.0002728104591369629, -0.0002563297748565674, -0.00023984909057617188, -0.00022336840629577637, -0.00020688772201538086, -0.00019040703773498535, -0.00017392635345458984, -0.00015744566917419434, -0.00014096498489379883, -0.00012448430061340332, -0.00010800361633300781, -9.15229320526123e-05, -7.50422477722168e-05, -5.856156349182129e-05, -4.208087921142578e-05, -2.5600194931030273e-05, -9.119510650634766e-06, 7.361173629760742e-06, 2.384185791015625e-05, 4.032254219055176e-05, 5.6803226470947266e-05, 7.328391075134277e-05, 8.976459503173828e-05, 0.00010624527931213379, 0.0001227259635925293, 0.0001392066478729248, 0.0001556873321533203, 0.00017216801643371582, 0.00018864870071411133, 0.00020512938499450684, 0.00022161006927490234, 0.00023809075355529785, 0.00025457143783569336, 0.00027105212211608887, 0.0002875328063964844, 0.0003040134906768799, 0.0003204941749572754, 0.0003369748592376709, 0.0003534555435180664, 0.0003699362277984619, 0.0003864169120788574, 0.00040289759635925293, 0.00041937828063964844, 0.00043585896492004395, 0.00045233964920043945, 0.00046882033348083496, 0.00048530101776123047, 0.000501781702041626, 0.0005182623863220215, 0.000534743070602417, 0.0005512237548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 6.0, 8.0, 20.0, 29.0, 51.0, 64.0, 116.0, 279.0, 622.0, 1682.0, 5975.0, 35047.0, 746901.0, 231614.0, 19796.0, 4080.0, 1262.0, 472.0, 231.0, 87.0, 51.0, 52.0, 26.0, 14.0, 20.0, 10.0, 11.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.059234619140625, -2.96612548828125, -2.873016357421875, -2.7799072265625, -2.686798095703125, -2.59368896484375, -2.500579833984375, -2.407470703125, -2.314361572265625, -2.22125244140625, -2.128143310546875, -2.0350341796875, -1.941925048828125, -1.84881591796875, -1.755706787109375, -1.66259765625, -1.569488525390625, -1.47637939453125, -1.383270263671875, -1.2901611328125, -1.197052001953125, -1.10394287109375, -1.010833740234375, -0.917724609375, -0.824615478515625, -0.73150634765625, -0.638397216796875, -0.5452880859375, -0.452178955078125, -0.35906982421875, -0.265960693359375, -0.1728515625, -0.079742431640625, 0.01336669921875, 0.106475830078125, 0.1995849609375, 0.292694091796875, 0.38580322265625, 0.478912353515625, 0.572021484375, 0.665130615234375, 0.75823974609375, 0.851348876953125, 0.9444580078125, 1.037567138671875, 1.13067626953125, 1.223785400390625, 1.31689453125, 1.410003662109375, 1.50311279296875, 1.596221923828125, 1.6893310546875, 1.782440185546875, 1.87554931640625, 1.968658447265625, 2.061767578125, 2.154876708984375, 2.24798583984375, 2.341094970703125, 2.4342041015625, 2.527313232421875, 2.62042236328125, 2.713531494140625, 2.806640625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 14.0, 21.0, 27.0, 45.0, 69.0, 114.0, 178.0, 173.0, 119.0, 69.0, 54.0, 30.0, 24.0, 15.0, 11.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-4.16015625, -4.0716552734375, -3.983154296875, -3.8946533203125, -3.80615234375, -3.7176513671875, -3.629150390625, -3.5406494140625, -3.4521484375, -3.3636474609375, -3.275146484375, -3.1866455078125, -3.09814453125, -3.0096435546875, -2.921142578125, -2.8326416015625, -2.744140625, -2.6556396484375, -2.567138671875, -2.4786376953125, -2.39013671875, -2.3016357421875, -2.213134765625, -2.1246337890625, -2.0361328125, -1.9476318359375, -1.859130859375, -1.7706298828125, -1.68212890625, -1.5936279296875, -1.505126953125, -1.4166259765625, -1.328125, -1.2396240234375, -1.151123046875, -1.0626220703125, -0.97412109375, -0.8856201171875, -0.797119140625, -0.7086181640625, -0.6201171875, -0.5316162109375, -0.443115234375, -0.3546142578125, -0.26611328125, -0.1776123046875, -0.089111328125, -0.0006103515625, 0.087890625, 0.1763916015625, 0.264892578125, 0.3533935546875, 0.44189453125, 0.5303955078125, 0.618896484375, 0.7073974609375, 0.7958984375, 0.8843994140625, 0.972900390625, 1.0614013671875, 1.14990234375, 1.2384033203125, 1.326904296875, 1.4154052734375, 1.50390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 7.0, 15.0, 26.0, 63.0, 175.0, 430.0, 187.0, 64.0, 16.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.28250122070312, -78.20263671875, -76.12277221679688, -74.04290771484375, -71.96304321289062, -69.8831787109375, -67.80331420898438, -65.72344970703125, -63.64358139038086, -61.563716888427734, -59.48385238647461, -57.403987884521484, -55.324119567871094, -53.24425506591797, -51.164390563964844, -49.08452606201172, -47.004661560058594, -44.92479705810547, -42.844932556152344, -40.76506805419922, -38.685203552246094, -36.60533905029297, -34.52547073364258, -32.44560623168945, -30.365741729736328, -28.285877227783203, -26.206012725830078, -24.12614631652832, -22.046281814575195, -19.96641731262207, -17.886550903320312, -15.806686401367188, -13.726829528808594, -11.646965026855469, -9.567099571228027, -7.487234592437744, -5.407369613647461, -3.327505111694336, -1.2476396560668945, 0.8322257995605469, 2.912090301513672, 4.991955280303955, 7.071820259094238, 9.15168571472168, 11.231550216674805, 13.31141471862793, 15.391280174255371, 17.471145629882812, 19.551010131835938, 21.630874633789062, 23.710739135742188, 25.790605545043945, 27.87047004699707, 29.950334548950195, 32.03020095825195, 34.11006546020508, 36.1899299621582, 38.26979446411133, 40.34965896606445, 42.42952346801758, 44.50939178466797, 46.589256286621094, 48.66912078857422, 50.748985290527344, 52.82884979248047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 14.0, 14.0, 10.0, 30.0, 30.0, 19.0, 24.0, 32.0, 40.0, 53.0, 62.0, 82.0, 98.0, 84.0, 57.0, 54.0, 41.0, 35.0, 30.0, 30.0, 19.0, 18.0, 17.0, 18.0, 11.0, 16.0, 7.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.24529266357422, -29.26091194152832, -28.276531219482422, -27.29214859008789, -26.307767868041992, -25.323387145996094, -24.339006423950195, -23.354625701904297, -22.370243072509766, -21.385862350463867, -20.40148162841797, -19.417098999023438, -18.43271827697754, -17.44833755493164, -16.463956832885742, -15.479575157165527, -14.495194435119629, -13.51081371307373, -12.526432037353516, -11.542051315307617, -10.557669639587402, -9.573288917541504, -8.588907241821289, -7.604526519775391, -6.620145320892334, -5.635764122009277, -4.651382923126221, -3.667001962661743, -2.6826207637786865, -1.698239803314209, -0.7138586044311523, 0.2705225944519043, 1.254903793334961, 2.2392849922180176, 3.223666191101074, 4.208046913146973, 5.1924285888671875, 6.176809310913086, 7.161190509796143, 8.1455717086792, 9.129953384399414, 10.114334106445312, 11.098715782165527, 12.083096504211426, 13.06747817993164, 14.051858901977539, 15.036239624023438, 16.02062225341797, 17.005001068115234, 17.989381790161133, 18.97376251220703, 19.958145141601562, 20.94252586364746, 21.92690658569336, 22.911287307739258, 23.895668029785156, 24.880050659179688, 25.864431381225586, 26.848812103271484, 27.833194732666016, 28.817575454711914, 29.801956176757812, 30.78633689880371, 31.77071762084961, 32.75510025024414]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 5.0, 13.0, 14.0, 15.0, 29.0, 49.0, 75.0, 136.0, 217.0, 367.0, 789.0, 1715.0, 4001.0, 11012.0, 38705.0, 256075.0, 2713143.0, 1038481.0, 95883.0, 21038.0, 6984.0, 2829.0, 1307.0, 608.0, 312.0, 184.0, 93.0, 67.0, 46.0, 24.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.03515625, -3.915679931640625, -3.79620361328125, -3.676727294921875, -3.5572509765625, -3.437774658203125, -3.31829833984375, -3.198822021484375, -3.079345703125, -2.959869384765625, -2.84039306640625, -2.720916748046875, -2.6014404296875, -2.481964111328125, -2.36248779296875, -2.243011474609375, -2.12353515625, -2.004058837890625, -1.88458251953125, -1.765106201171875, -1.6456298828125, -1.526153564453125, -1.40667724609375, -1.287200927734375, -1.167724609375, -1.048248291015625, -0.92877197265625, -0.809295654296875, -0.6898193359375, -0.570343017578125, -0.45086669921875, -0.331390380859375, -0.2119140625, -0.092437744140625, 0.02703857421875, 0.146514892578125, 0.2659912109375, 0.385467529296875, 0.50494384765625, 0.624420166015625, 0.743896484375, 0.863372802734375, 0.98284912109375, 1.102325439453125, 1.2218017578125, 1.341278076171875, 1.46075439453125, 1.580230712890625, 1.69970703125, 1.819183349609375, 1.93865966796875, 2.058135986328125, 2.1776123046875, 2.297088623046875, 2.41656494140625, 2.536041259765625, 2.655517578125, 2.774993896484375, 2.89447021484375, 3.013946533203125, 3.1334228515625, 3.252899169921875, 3.37237548828125, 3.491851806640625, 3.611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 12.0, 11.0, 13.0, 19.0, 16.0, 31.0, 23.0, 32.0, 40.0, 38.0, 44.0, 52.0, 55.0, 52.0, 64.0, 69.0, 63.0, 48.0, 44.0, 48.0, 50.0, 29.0, 27.0, 24.0, 13.0, 19.0, 15.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.939453125, -2.8662872314453125, -2.793121337890625, -2.7199554443359375, -2.64678955078125, -2.5736236572265625, -2.500457763671875, -2.4272918701171875, -2.3541259765625, -2.2809600830078125, -2.207794189453125, -2.1346282958984375, -2.06146240234375, -1.9882965087890625, -1.915130615234375, -1.8419647216796875, -1.768798828125, -1.6956329345703125, -1.622467041015625, -1.5493011474609375, -1.47613525390625, -1.4029693603515625, -1.329803466796875, -1.2566375732421875, -1.1834716796875, -1.1103057861328125, -1.037139892578125, -0.9639739990234375, -0.89080810546875, -0.8176422119140625, -0.744476318359375, -0.6713104248046875, -0.59814453125, -0.5249786376953125, -0.451812744140625, -0.3786468505859375, -0.30548095703125, -0.2323150634765625, -0.159149169921875, -0.0859832763671875, -0.0128173828125, 0.0603485107421875, 0.133514404296875, 0.2066802978515625, 0.27984619140625, 0.3530120849609375, 0.426177978515625, 0.4993438720703125, 0.572509765625, 0.6456756591796875, 0.718841552734375, 0.7920074462890625, 0.86517333984375, 0.9383392333984375, 1.011505126953125, 1.0846710205078125, 1.1578369140625, 1.2310028076171875, 1.304168701171875, 1.3773345947265625, 1.45050048828125, 1.5236663818359375, 1.596832275390625, 1.6699981689453125, 1.7431640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 19.0, 25.0, 27.0, 43.0, 59.0, 128.0, 246.0, 587.0, 1479.0, 4560.0, 18414.0, 121670.0, 3057645.0, 915305.0, 57896.0, 11114.0, 3040.0, 1072.0, 430.0, 198.0, 114.0, 61.0, 37.0, 21.0, 26.0, 13.0, 13.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.1484375, -5.97186279296875, -5.7952880859375, -5.61871337890625, -5.442138671875, -5.26556396484375, -5.0889892578125, -4.91241455078125, -4.73583984375, -4.55926513671875, -4.3826904296875, -4.20611572265625, -4.029541015625, -3.85296630859375, -3.6763916015625, -3.49981689453125, -3.3232421875, -3.14666748046875, -2.9700927734375, -2.79351806640625, -2.616943359375, -2.44036865234375, -2.2637939453125, -2.08721923828125, -1.91064453125, -1.73406982421875, -1.5574951171875, -1.38092041015625, -1.204345703125, -1.02777099609375, -0.8511962890625, -0.67462158203125, -0.498046875, -0.32147216796875, -0.1448974609375, 0.03167724609375, 0.208251953125, 0.38482666015625, 0.5614013671875, 0.73797607421875, 0.91455078125, 1.09112548828125, 1.2677001953125, 1.44427490234375, 1.620849609375, 1.79742431640625, 1.9739990234375, 2.15057373046875, 2.3271484375, 2.50372314453125, 2.6802978515625, 2.85687255859375, 3.033447265625, 3.21002197265625, 3.3865966796875, 3.56317138671875, 3.73974609375, 3.91632080078125, 4.0928955078125, 4.26947021484375, 4.446044921875, 4.62261962890625, 4.7991943359375, 4.97576904296875, 5.15234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 12.0, 9.0, 13.0, 23.0, 42.0, 51.0, 60.0, 86.0, 129.0, 222.0, 376.0, 597.0, 772.0, 580.0, 340.0, 226.0, 128.0, 97.0, 68.0, 49.0, 37.0, 33.0, 27.0, 15.0, 11.0, 6.0, 13.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.9659423828125, -3.826416015625, -3.6868896484375, -3.54736328125, -3.4078369140625, -3.268310546875, -3.1287841796875, -2.9892578125, -2.8497314453125, -2.710205078125, -2.5706787109375, -2.43115234375, -2.2916259765625, -2.152099609375, -2.0125732421875, -1.873046875, -1.7335205078125, -1.593994140625, -1.4544677734375, -1.31494140625, -1.1754150390625, -1.035888671875, -0.8963623046875, -0.7568359375, -0.6173095703125, -0.477783203125, -0.3382568359375, -0.19873046875, -0.0592041015625, 0.080322265625, 0.2198486328125, 0.359375, 0.4989013671875, 0.638427734375, 0.7779541015625, 0.91748046875, 1.0570068359375, 1.196533203125, 1.3360595703125, 1.4755859375, 1.6151123046875, 1.754638671875, 1.8941650390625, 2.03369140625, 2.1732177734375, 2.312744140625, 2.4522705078125, 2.591796875, 2.7313232421875, 2.870849609375, 3.0103759765625, 3.14990234375, 3.2894287109375, 3.428955078125, 3.5684814453125, 3.7080078125, 3.8475341796875, 3.987060546875, 4.1265869140625, 4.26611328125, 4.4056396484375, 4.545166015625, 4.6846923828125, 4.82421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 7.0, 25.0, 63.0, 162.0, 278.0, 252.0, 128.0, 54.0, 13.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.43502426147461, -17.206241607666016, -14.977458953857422, -12.748676300048828, -10.519893646240234, -8.29111099243164, -6.062328338623047, -3.833545684814453, -1.6047630310058594, 0.6240196228027344, 2.852802276611328, 5.081584930419922, 7.310367584228516, 9.53915023803711, 11.767932891845703, 13.996715545654297, 16.22549819946289, 18.454280853271484, 20.683063507080078, 22.911846160888672, 25.140628814697266, 27.36941146850586, 29.598194122314453, 31.826976776123047, 34.05575942993164, 36.284542083740234, 38.51332473754883, 40.74210739135742, 42.970890045166016, 45.19967269897461, 47.4284553527832, 49.6572380065918, 51.886016845703125, 54.11479949951172, 56.34358215332031, 58.572364807128906, 60.8011474609375, 63.029930114746094, 65.25871276855469, 67.48749542236328, 69.71627807617188, 71.94506072998047, 74.17384338378906, 76.40262603759766, 78.63140869140625, 80.86019134521484, 83.08897399902344, 85.31775665283203, 87.54653930664062, 89.77532196044922, 92.00410461425781, 94.2328872680664, 96.461669921875, 98.6904525756836, 100.91923522949219, 103.14801788330078, 105.37680053710938, 107.60558319091797, 109.83436584472656, 112.06314849853516, 114.29193115234375, 116.52071380615234, 118.74949645996094, 120.97827911376953, 123.20706176757812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 6.0, 10.0, 14.0, 10.0, 12.0, 19.0, 21.0, 14.0, 25.0, 27.0, 23.0, 23.0, 33.0, 37.0, 48.0, 39.0, 41.0, 39.0, 44.0, 43.0, 39.0, 42.0, 52.0, 45.0, 38.0, 29.0, 31.0, 31.0, 27.0, 14.0, 16.0, 14.0, 13.0, 9.0, 10.0, 11.0, 15.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.35088539123535, -17.808513641357422, -17.266143798828125, -16.723772048950195, -16.181400299072266, -15.639029502868652, -15.096658706665039, -14.55428695678711, -14.011916160583496, -13.469545364379883, -12.927173614501953, -12.38480281829834, -11.842432022094727, -11.300060272216797, -10.757689476013184, -10.21531867980957, -9.67294692993164, -9.130576133728027, -8.588204383850098, -8.045833587646484, -7.503462314605713, -6.961091041564941, -6.418720245361328, -5.876348972320557, -5.333977699279785, -4.791606426239014, -4.249235153198242, -3.706864356994629, -3.1644930839538574, -2.622121810913086, -2.0797507762908936, -1.5373797416687012, -0.9950065612792969, -0.45263540744781494, 0.08973574638366699, 0.6321069002151489, 1.1744780540466309, 1.7168493270874023, 2.2592203617095947, 2.801591396331787, 3.3439626693725586, 3.88633394241333, 4.428705215454102, 4.971076011657715, 5.513447284698486, 6.055818557739258, 6.598189353942871, 7.140560626983643, 7.682931900024414, 8.225302696228027, 8.767674446105957, 9.31004524230957, 9.8524169921875, 10.394787788391113, 10.937158584594727, 11.479530334472656, 12.02190113067627, 12.564271926879883, 13.106643676757812, 13.649014472961426, 14.191385269165039, 14.733757019042969, 15.276127815246582, 15.818498611450195, 16.360870361328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 13.0, 15.0, 34.0, 35.0, 88.0, 121.0, 172.0, 292.0, 459.0, 934.0, 1989.0, 4221.0, 10510.0, 28967.0, 96860.0, 385302.0, 376936.0, 94628.0, 28222.0, 10400.0, 4260.0, 1910.0, 952.0, 490.0, 269.0, 171.0, 94.0, 75.0, 56.0, 23.0, 24.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.33447265625, -3.2333984375, -3.13232421875, -3.03125, -2.93017578125, -2.8291015625, -2.72802734375, -2.626953125, -2.52587890625, -2.4248046875, -2.32373046875, -2.22265625, -2.12158203125, -2.0205078125, -1.91943359375, -1.818359375, -1.71728515625, -1.6162109375, -1.51513671875, -1.4140625, -1.31298828125, -1.2119140625, -1.11083984375, -1.009765625, -0.90869140625, -0.8076171875, -0.70654296875, -0.60546875, -0.50439453125, -0.4033203125, -0.30224609375, -0.201171875, -0.10009765625, 0.0009765625, 0.10205078125, 0.203125, 0.30419921875, 0.4052734375, 0.50634765625, 0.607421875, 0.70849609375, 0.8095703125, 0.91064453125, 1.01171875, 1.11279296875, 1.2138671875, 1.31494140625, 1.416015625, 1.51708984375, 1.6181640625, 1.71923828125, 1.8203125, 1.92138671875, 2.0224609375, 2.12353515625, 2.224609375, 2.32568359375, 2.4267578125, 2.52783203125, 2.62890625, 2.72998046875, 2.8310546875, 2.93212890625, 3.033203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 10.0, 10.0, 9.0, 14.0, 12.0, 16.0, 29.0, 25.0, 31.0, 29.0, 24.0, 34.0, 27.0, 31.0, 37.0, 42.0, 36.0, 55.0, 47.0, 46.0, 51.0, 32.0, 47.0, 35.0, 34.0, 31.0, 28.0, 34.0, 21.0, 19.0, 13.0, 17.0, 6.0, 9.0, 10.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.0382843017578125, -1.976959228515625, -1.9156341552734375, -1.85430908203125, -1.7929840087890625, -1.731658935546875, -1.6703338623046875, -1.6090087890625, -1.5476837158203125, -1.486358642578125, -1.4250335693359375, -1.36370849609375, -1.3023834228515625, -1.241058349609375, -1.1797332763671875, -1.118408203125, -1.0570831298828125, -0.995758056640625, -0.9344329833984375, -0.87310791015625, -0.8117828369140625, -0.750457763671875, -0.6891326904296875, -0.6278076171875, -0.5664825439453125, -0.505157470703125, -0.4438323974609375, -0.38250732421875, -0.3211822509765625, -0.259857177734375, -0.1985321044921875, -0.13720703125, -0.0758819580078125, -0.014556884765625, 0.0467681884765625, 0.10809326171875, 0.1694183349609375, 0.230743408203125, 0.2920684814453125, 0.3533935546875, 0.4147186279296875, 0.476043701171875, 0.5373687744140625, 0.59869384765625, 0.6600189208984375, 0.721343994140625, 0.7826690673828125, 0.843994140625, 0.9053192138671875, 0.966644287109375, 1.0279693603515625, 1.08929443359375, 1.1506195068359375, 1.211944580078125, 1.2732696533203125, 1.3345947265625, 1.3959197998046875, 1.457244873046875, 1.5185699462890625, 1.57989501953125, 1.6412200927734375, 1.702545166015625, 1.7638702392578125, 1.8251953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 15.0, 15.0, 16.0, 20.0, 34.0, 37.0, 43.0, 63.0, 94.0, 155.0, 254.0, 386.0, 634.0, 1092.0, 2358.0, 5917.0, 20900.0, 129893.0, 771564.0, 89035.0, 16307.0, 5061.0, 2083.0, 934.0, 518.0, 360.0, 253.0, 134.0, 111.0, 65.0, 57.0, 41.0, 22.0, 24.0, 11.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.1494140625, -3.998046875, -3.8466796875, -3.6953125, -3.5439453125, -3.392578125, -3.2412109375, -3.08984375, -2.9384765625, -2.787109375, -2.6357421875, -2.484375, -2.3330078125, -2.181640625, -2.0302734375, -1.87890625, -1.7275390625, -1.576171875, -1.4248046875, -1.2734375, -1.1220703125, -0.970703125, -0.8193359375, -0.66796875, -0.5166015625, -0.365234375, -0.2138671875, -0.0625, 0.0888671875, 0.240234375, 0.3916015625, 0.54296875, 0.6943359375, 0.845703125, 0.9970703125, 1.1484375, 1.2998046875, 1.451171875, 1.6025390625, 1.75390625, 1.9052734375, 2.056640625, 2.2080078125, 2.359375, 2.5107421875, 2.662109375, 2.8134765625, 2.96484375, 3.1162109375, 3.267578125, 3.4189453125, 3.5703125, 3.7216796875, 3.873046875, 4.0244140625, 4.17578125, 4.3271484375, 4.478515625, 4.6298828125, 4.78125, 4.9326171875, 5.083984375, 5.2353515625, 5.38671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 6.0, 6.0, 6.0, 9.0, 8.0, 25.0, 15.0, 21.0, 35.0, 33.0, 44.0, 63.0, 55.0, 56.0, 74.0, 68.0, 67.0, 68.0, 64.0, 57.0, 50.0, 31.0, 27.0, 21.0, 16.0, 24.0, 14.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.0960693359375, -8.778076171875, -8.4600830078125, -8.14208984375, -7.8240966796875, -7.506103515625, -7.1881103515625, -6.8701171875, -6.5521240234375, -6.234130859375, -5.9161376953125, -5.59814453125, -5.2801513671875, -4.962158203125, -4.6441650390625, -4.326171875, -4.0081787109375, -3.690185546875, -3.3721923828125, -3.05419921875, -2.7362060546875, -2.418212890625, -2.1002197265625, -1.7822265625, -1.4642333984375, -1.146240234375, -0.8282470703125, -0.51025390625, -0.1922607421875, 0.125732421875, 0.4437255859375, 0.76171875, 1.0797119140625, 1.397705078125, 1.7156982421875, 2.03369140625, 2.3516845703125, 2.669677734375, 2.9876708984375, 3.3056640625, 3.6236572265625, 3.941650390625, 4.2596435546875, 4.57763671875, 4.8956298828125, 5.213623046875, 5.5316162109375, 5.849609375, 6.1676025390625, 6.485595703125, 6.8035888671875, 7.12158203125, 7.4395751953125, 7.757568359375, 8.0755615234375, 8.3935546875, 8.7115478515625, 9.029541015625, 9.3475341796875, 9.66552734375, 9.9835205078125, 10.301513671875, 10.6195068359375, 10.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 12.0, 13.0, 18.0, 26.0, 60.0, 91.0, 122.0, 184.0, 285.0, 470.0, 814.0, 1447.0, 3127.0, 7910.0, 32942.0, 332038.0, 617047.0, 36446.0, 8571.0, 3200.0, 1511.0, 867.0, 497.0, 259.0, 183.0, 145.0, 83.0, 50.0, 45.0, 27.0, 18.0, 6.0, 11.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.7038726806640625, -1.648956298828125, -1.5940399169921875, -1.53912353515625, -1.4842071533203125, -1.429290771484375, -1.3743743896484375, -1.3194580078125, -1.2645416259765625, -1.209625244140625, -1.1547088623046875, -1.09979248046875, -1.0448760986328125, -0.989959716796875, -0.9350433349609375, -0.880126953125, -0.8252105712890625, -0.770294189453125, -0.7153778076171875, -0.66046142578125, -0.6055450439453125, -0.550628662109375, -0.4957122802734375, -0.4407958984375, -0.3858795166015625, -0.330963134765625, -0.2760467529296875, -0.22113037109375, -0.1662139892578125, -0.111297607421875, -0.0563812255859375, -0.00146484375, 0.0534515380859375, 0.108367919921875, 0.1632843017578125, 0.21820068359375, 0.2731170654296875, 0.328033447265625, 0.3829498291015625, 0.4378662109375, 0.4927825927734375, 0.547698974609375, 0.6026153564453125, 0.65753173828125, 0.7124481201171875, 0.767364501953125, 0.8222808837890625, 0.877197265625, 0.9321136474609375, 0.987030029296875, 1.0419464111328125, 1.09686279296875, 1.1517791748046875, 1.206695556640625, 1.2616119384765625, 1.3165283203125, 1.3714447021484375, 1.426361083984375, 1.4812774658203125, 1.53619384765625, 1.5911102294921875, 1.646026611328125, 1.7009429931640625, 1.755859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 9.0, 14.0, 17.0, 28.0, 46.0, 101.0, 153.0, 270.0, 168.0, 74.0, 44.0, 19.0, 16.0, 9.0, 6.0, 3.0, 8.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006971359252929688, -0.0006707906723022461, -0.0006444454193115234, -0.0006181001663208008, -0.0005917549133300781, -0.0005654096603393555, -0.0005390644073486328, -0.0005127191543579102, -0.0004863739013671875, -0.00046002864837646484, -0.0004336833953857422, -0.00040733814239501953, -0.0003809928894042969, -0.0003546476364135742, -0.00032830238342285156, -0.0003019571304321289, -0.00027561187744140625, -0.0002492666244506836, -0.00022292137145996094, -0.00019657611846923828, -0.00017023086547851562, -0.00014388561248779297, -0.00011754035949707031, -9.119510650634766e-05, -6.4849853515625e-05, -3.8504600524902344e-05, -1.2159347534179688e-05, 1.4185905456542969e-05, 4.0531158447265625e-05, 6.687641143798828e-05, 9.322166442871094e-05, 0.0001195669174194336, 0.00014591217041015625, 0.0001722574234008789, 0.00019860267639160156, 0.00022494792938232422, 0.0002512931823730469, 0.00027763843536376953, 0.0003039836883544922, 0.00033032894134521484, 0.0003566741943359375, 0.00038301944732666016, 0.0004093647003173828, 0.00043570995330810547, 0.0004620552062988281, 0.0004884004592895508, 0.0005147457122802734, 0.0005410909652709961, 0.0005674362182617188, 0.0005937814712524414, 0.0006201267242431641, 0.0006464719772338867, 0.0006728172302246094, 0.000699162483215332, 0.0007255077362060547, 0.0007518529891967773, 0.0007781982421875, 0.0008045434951782227, 0.0008308887481689453, 0.000857234001159668, 0.0008835792541503906, 0.0009099245071411133, 0.0009362697601318359, 0.0009626150131225586, 0.0009889602661132812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 10.0, 6.0, 10.0, 16.0, 24.0, 41.0, 63.0, 102.0, 190.0, 306.0, 615.0, 1319.0, 3072.0, 8589.0, 31210.0, 187497.0, 718816.0, 71877.0, 15744.0, 5047.0, 2010.0, 897.0, 453.0, 278.0, 112.0, 84.0, 60.0, 39.0, 23.0, 20.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.357421875, -1.3076171875, -1.2578125, -1.2080078125, -1.158203125, -1.1083984375, -1.05859375, -1.0087890625, -0.958984375, -0.9091796875, -0.859375, -0.8095703125, -0.759765625, -0.7099609375, -0.66015625, -0.6103515625, -0.560546875, -0.5107421875, -0.4609375, -0.4111328125, -0.361328125, -0.3115234375, -0.26171875, -0.2119140625, -0.162109375, -0.1123046875, -0.0625, -0.0126953125, 0.037109375, 0.0869140625, 0.13671875, 0.1865234375, 0.236328125, 0.2861328125, 0.3359375, 0.3857421875, 0.435546875, 0.4853515625, 0.53515625, 0.5849609375, 0.634765625, 0.6845703125, 0.734375, 0.7841796875, 0.833984375, 0.8837890625, 0.93359375, 0.9833984375, 1.033203125, 1.0830078125, 1.1328125, 1.1826171875, 1.232421875, 1.2822265625, 1.33203125, 1.3818359375, 1.431640625, 1.4814453125, 1.53125, 1.5810546875, 1.630859375, 1.6806640625, 1.73046875, 1.7802734375, 1.830078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 19.0, 24.0, 15.0, 48.0, 39.0, 53.0, 88.0, 117.0, 117.0, 127.0, 78.0, 55.0, 41.0, 47.0, 28.0, 27.0, 11.0, 13.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.919921875, -1.865875244140625, -1.81182861328125, -1.757781982421875, -1.7037353515625, -1.649688720703125, -1.59564208984375, -1.541595458984375, -1.487548828125, -1.433502197265625, -1.37945556640625, -1.325408935546875, -1.2713623046875, -1.217315673828125, -1.16326904296875, -1.109222412109375, -1.05517578125, -1.001129150390625, -0.94708251953125, -0.893035888671875, -0.8389892578125, -0.784942626953125, -0.73089599609375, -0.676849365234375, -0.622802734375, -0.568756103515625, -0.51470947265625, -0.460662841796875, -0.4066162109375, -0.352569580078125, -0.29852294921875, -0.244476318359375, -0.1904296875, -0.136383056640625, -0.08233642578125, -0.028289794921875, 0.0257568359375, 0.079803466796875, 0.13385009765625, 0.187896728515625, 0.241943359375, 0.295989990234375, 0.35003662109375, 0.404083251953125, 0.4581298828125, 0.512176513671875, 0.56622314453125, 0.620269775390625, 0.67431640625, 0.728363037109375, 0.78240966796875, 0.836456298828125, 0.8905029296875, 0.944549560546875, 0.99859619140625, 1.052642822265625, 1.106689453125, 1.160736083984375, 1.21478271484375, 1.268829345703125, 1.3228759765625, 1.376922607421875, 1.43096923828125, 1.485015869140625, 1.5390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 8.0, 30.0, 126.0, 594.0, 177.0, 39.0, 12.0, 9.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.8374786376953, -169.2025604248047, -165.567626953125, -161.93270874023438, -158.2977752685547, -154.66285705566406, -151.02792358398438, -147.39300537109375, -143.75808715820312, -140.1231689453125, -136.4882354736328, -132.8533172607422, -129.2183837890625, -125.58346557617188, -121.94853973388672, -118.31361389160156, -114.67868041992188, -111.04375457763672, -107.40882873535156, -103.77391052246094, -100.13898468017578, -96.50405883789062, -92.86913299560547, -89.23420715332031, -85.59928894042969, -81.96436309814453, -78.32943725585938, -74.69451904296875, -71.0595932006836, -67.42466735839844, -63.78974151611328, -60.154815673828125, -56.51988983154297, -52.88496398925781, -49.25004196166992, -45.615116119384766, -41.98019027709961, -38.34526824951172, -34.71034240722656, -31.075416564941406, -27.440492630004883, -23.80556869506836, -20.170642852783203, -16.53571891784668, -12.90079402923584, -9.265869140625, -5.630945205688477, -1.9960193634033203, 1.6389045715332031, 5.273829460144043, 8.908754348754883, 12.543678283691406, 16.178604125976562, 19.813528060913086, 23.44845199584961, 27.083377838134766, 30.71830177307129, 34.35322570800781, 37.98815155029297, 41.623077392578125, 45.257999420166016, 48.89292526245117, 52.52784729003906, 56.16277313232422, 59.797698974609375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 13.0, 7.0, 20.0, 14.0, 21.0, 24.0, 33.0, 34.0, 27.0, 28.0, 35.0, 51.0, 85.0, 96.0, 104.0, 86.0, 35.0, 33.0, 34.0, 18.0, 32.0, 19.0, 13.0, 16.0, 9.0, 15.0, 13.0, 3.0, 18.0, 7.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31207275390625, -28.33296012878418, -27.35384750366211, -26.374736785888672, -25.3956241607666, -24.41651153564453, -23.43739891052246, -22.45828628540039, -21.479175567626953, -20.500062942504883, -19.520950317382812, -18.541839599609375, -17.562726974487305, -16.583614349365234, -15.604501724243164, -14.625389099121094, -13.646276473999023, -12.667163848876953, -11.6880521774292, -10.708939552307129, -9.729827880859375, -8.750715255737305, -7.771602630615234, -6.792490482330322, -5.81337833404541, -4.834266185760498, -3.855153799057007, -2.8760414123535156, -1.8969292640686035, -0.9178171157836914, 0.061295509338378906, 1.040407657623291, 2.019519805908203, 2.9986319541931152, 3.9777443408966064, 4.956856727600098, 5.93596887588501, 6.915081024169922, 7.894193649291992, 8.873306274414062, 9.852417945861816, 10.831530570983887, 11.81064224243164, 12.789754867553711, 13.768867492675781, 14.747979164123535, 15.727091789245605, 16.70620346069336, 17.68531608581543, 18.6644287109375, 19.64354133605957, 20.62265396118164, 21.601764678955078, 22.58087730407715, 23.55998992919922, 24.53910255432129, 25.51821517944336, 26.49732780456543, 27.4764404296875, 28.455551147460938, 29.434663772583008, 30.413776397705078, 31.39288902282715, 32.37200164794922, 33.351112365722656]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 6.0, 5.0, 14.0, 23.0, 19.0, 39.0, 71.0, 101.0, 175.0, 357.0, 616.0, 1278.0, 2654.0, 6734.0, 20048.0, 74674.0, 457703.0, 2455829.0, 986113.0, 138410.0, 31940.0, 10056.0, 3806.0, 1770.0, 842.0, 428.0, 219.0, 150.0, 85.0, 41.0, 29.0, 21.0, 9.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.19921875, -6.046844482421875, -5.89447021484375, -5.742095947265625, -5.5897216796875, -5.437347412109375, -5.28497314453125, -5.132598876953125, -4.980224609375, -4.827850341796875, -4.67547607421875, -4.523101806640625, -4.3707275390625, -4.218353271484375, -4.06597900390625, -3.913604736328125, -3.76123046875, -3.608856201171875, -3.45648193359375, -3.304107666015625, -3.1517333984375, -2.999359130859375, -2.84698486328125, -2.694610595703125, -2.542236328125, -2.389862060546875, -2.23748779296875, -2.085113525390625, -1.9327392578125, -1.780364990234375, -1.62799072265625, -1.475616455078125, -1.3232421875, -1.170867919921875, -1.01849365234375, -0.866119384765625, -0.7137451171875, -0.561370849609375, -0.40899658203125, -0.256622314453125, -0.104248046875, 0.048126220703125, 0.20050048828125, 0.352874755859375, 0.5052490234375, 0.657623291015625, 0.80999755859375, 0.962371826171875, 1.11474609375, 1.267120361328125, 1.41949462890625, 1.571868896484375, 1.7242431640625, 1.876617431640625, 2.02899169921875, 2.181365966796875, 2.333740234375, 2.486114501953125, 2.63848876953125, 2.790863037109375, 2.9432373046875, 3.095611572265625, 3.24798583984375, 3.400360107421875, 3.552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 11.0, 12.0, 12.0, 15.0, 26.0, 25.0, 15.0, 28.0, 26.0, 30.0, 29.0, 32.0, 43.0, 39.0, 38.0, 41.0, 43.0, 62.0, 42.0, 50.0, 50.0, 43.0, 43.0, 45.0, 27.0, 24.0, 25.0, 9.0, 20.0, 15.0, 15.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-2.37890625, -2.315155029296875, -2.25140380859375, -2.187652587890625, -2.1239013671875, -2.060150146484375, -1.99639892578125, -1.932647705078125, -1.868896484375, -1.805145263671875, -1.74139404296875, -1.677642822265625, -1.6138916015625, -1.550140380859375, -1.48638916015625, -1.422637939453125, -1.35888671875, -1.295135498046875, -1.23138427734375, -1.167633056640625, -1.1038818359375, -1.040130615234375, -0.97637939453125, -0.912628173828125, -0.848876953125, -0.785125732421875, -0.72137451171875, -0.657623291015625, -0.5938720703125, -0.530120849609375, -0.46636962890625, -0.402618408203125, -0.3388671875, -0.275115966796875, -0.21136474609375, -0.147613525390625, -0.0838623046875, -0.020111083984375, 0.04364013671875, 0.107391357421875, 0.171142578125, 0.234893798828125, 0.29864501953125, 0.362396240234375, 0.4261474609375, 0.489898681640625, 0.55364990234375, 0.617401123046875, 0.68115234375, 0.744903564453125, 0.80865478515625, 0.872406005859375, 0.9361572265625, 0.999908447265625, 1.06365966796875, 1.127410888671875, 1.191162109375, 1.254913330078125, 1.31866455078125, 1.382415771484375, 1.4461669921875, 1.509918212890625, 1.57366943359375, 1.637420654296875, 1.701171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 15.0, 28.0, 17.0, 35.0, 49.0, 88.0, 122.0, 171.0, 317.0, 704.0, 1785.0, 7203.0, 100886.0, 3958150.0, 113907.0, 7537.0, 1754.0, 648.0, 323.0, 195.0, 122.0, 64.0, 39.0, 34.0, 20.0, 14.0, 8.0, 7.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.9920654296875, -16.499755859375, -16.0074462890625, -15.51513671875, -15.0228271484375, -14.530517578125, -14.0382080078125, -13.5458984375, -13.0535888671875, -12.561279296875, -12.0689697265625, -11.57666015625, -11.0843505859375, -10.592041015625, -10.0997314453125, -9.607421875, -9.1151123046875, -8.622802734375, -8.1304931640625, -7.63818359375, -7.1458740234375, -6.653564453125, -6.1612548828125, -5.6689453125, -5.1766357421875, -4.684326171875, -4.1920166015625, -3.69970703125, -3.2073974609375, -2.715087890625, -2.2227783203125, -1.73046875, -1.2381591796875, -0.745849609375, -0.2535400390625, 0.23876953125, 0.7310791015625, 1.223388671875, 1.7156982421875, 2.2080078125, 2.7003173828125, 3.192626953125, 3.6849365234375, 4.17724609375, 4.6695556640625, 5.161865234375, 5.6541748046875, 6.146484375, 6.6387939453125, 7.131103515625, 7.6234130859375, 8.11572265625, 8.6080322265625, 9.100341796875, 9.5926513671875, 10.0849609375, 10.5772705078125, 11.069580078125, 11.5618896484375, 12.05419921875, 12.5465087890625, 13.038818359375, 13.5311279296875, 14.0234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 5.0, 9.0, 10.0, 21.0, 23.0, 34.0, 45.0, 75.0, 88.0, 151.0, 220.0, 343.0, 528.0, 774.0, 611.0, 388.0, 250.0, 140.0, 120.0, 67.0, 52.0, 40.0, 33.0, 15.0, 11.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.671875, -9.392333984375, -9.11279296875, -8.833251953125, -8.5537109375, -8.274169921875, -7.99462890625, -7.715087890625, -7.435546875, -7.156005859375, -6.87646484375, -6.596923828125, -6.3173828125, -6.037841796875, -5.75830078125, -5.478759765625, -5.19921875, -4.919677734375, -4.64013671875, -4.360595703125, -4.0810546875, -3.801513671875, -3.52197265625, -3.242431640625, -2.962890625, -2.683349609375, -2.40380859375, -2.124267578125, -1.8447265625, -1.565185546875, -1.28564453125, -1.006103515625, -0.7265625, -0.447021484375, -0.16748046875, 0.112060546875, 0.3916015625, 0.671142578125, 0.95068359375, 1.230224609375, 1.509765625, 1.789306640625, 2.06884765625, 2.348388671875, 2.6279296875, 2.907470703125, 3.18701171875, 3.466552734375, 3.74609375, 4.025634765625, 4.30517578125, 4.584716796875, 4.8642578125, 5.143798828125, 5.42333984375, 5.702880859375, 5.982421875, 6.261962890625, 6.54150390625, 6.821044921875, 7.1005859375, 7.380126953125, 7.65966796875, 7.939208984375, 8.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 16.0, 15.0, 41.0, 64.0, 104.0, 153.0, 179.0, 163.0, 95.0, 59.0, 29.0, 25.0, 18.0, 7.0, 2.0, 8.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.10050964355469, -82.2998046875, -79.49910736083984, -76.69840240478516, -73.897705078125, -71.09700012207031, -68.29629516601562, -65.49559020996094, -62.69489288330078, -59.89419174194336, -57.09349060058594, -54.29278564453125, -51.49208450317383, -48.691383361816406, -45.89067840576172, -43.0899772644043, -40.289276123046875, -37.48857498168945, -34.68787384033203, -31.887168884277344, -29.086467742919922, -26.2857666015625, -23.485063552856445, -20.68436050415039, -17.88365936279297, -15.08295726776123, -12.282255172729492, -9.481553077697754, -6.680850982666016, -3.8801488876342773, -1.079446792602539, 1.7212562561035156, 4.521949768066406, 7.3226518630981445, 10.123353958129883, 12.924056053161621, 15.72475814819336, 18.52545928955078, 21.326162338256836, 24.12686538696289, 26.927566528320312, 29.728267669677734, 32.528968811035156, 35.329673767089844, 38.130374908447266, 40.93107604980469, 43.731781005859375, 46.5324821472168, 49.33318328857422, 52.13388442993164, 54.93458557128906, 57.73529052734375, 60.53599166870117, 63.336692810058594, 66.13739776611328, 68.93809509277344, 71.73880004882812, 74.53950500488281, 77.34020233154297, 80.14090728759766, 82.94160461425781, 85.7423095703125, 88.54301452636719, 91.34371948242188, 94.14441680908203]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 13.0, 11.0, 17.0, 17.0, 21.0, 17.0, 28.0, 28.0, 26.0, 38.0, 35.0, 43.0, 42.0, 31.0, 63.0, 54.0, 77.0, 65.0, 48.0, 35.0, 42.0, 33.0, 34.0, 29.0, 31.0, 24.0, 21.0, 15.0, 10.0, 13.0, 11.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.560752868652344, -41.1661262512207, -39.77149963378906, -38.37687301635742, -36.98224639892578, -35.587623596191406, -34.1929931640625, -32.798370361328125, -31.403743743896484, -30.009117126464844, -28.614490509033203, -27.219863891601562, -25.825239181518555, -24.430612564086914, -23.035985946655273, -21.641361236572266, -20.246732711791992, -18.85210609436035, -17.45747947692871, -16.062854766845703, -14.668228149414062, -13.273601531982422, -11.878974914550781, -10.484349250793457, -9.089722633361816, -7.695096492767334, -6.300470352172852, -4.905843734741211, -3.5112175941467285, -2.116591453552246, -0.7219648361206055, 0.6726608276367188, 2.0672874450683594, 3.461913585662842, 4.856539726257324, 6.251166343688965, 7.645792484283447, 9.04041862487793, 10.43504524230957, 11.829670906066895, 13.224297523498535, 14.618924140930176, 16.0135498046875, 17.40817642211914, 18.80280303955078, 20.197429656982422, 21.592056274414062, 22.98668098449707, 24.38130760192871, 25.77593421936035, 27.170560836791992, 28.565185546875, 29.95981216430664, 31.35443878173828, 32.74906539916992, 34.14369201660156, 35.5383186340332, 36.932945251464844, 38.327571868896484, 39.722198486328125, 41.116825103759766, 42.511451721191406, 43.90607452392578, 45.30070114135742, 46.69532775878906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 12.0, 21.0, 23.0, 47.0, 80.0, 149.0, 296.0, 627.0, 1335.0, 3488.0, 11567.0, 52423.0, 503832.0, 411947.0, 46219.0, 10639.0, 3328.0, 1276.0, 603.0, 288.0, 162.0, 84.0, 39.0, 33.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.48828125, -6.3173828125, -6.146484375, -5.9755859375, -5.8046875, -5.6337890625, -5.462890625, -5.2919921875, -5.12109375, -4.9501953125, -4.779296875, -4.6083984375, -4.4375, -4.2666015625, -4.095703125, -3.9248046875, -3.75390625, -3.5830078125, -3.412109375, -3.2412109375, -3.0703125, -2.8994140625, -2.728515625, -2.5576171875, -2.38671875, -2.2158203125, -2.044921875, -1.8740234375, -1.703125, -1.5322265625, -1.361328125, -1.1904296875, -1.01953125, -0.8486328125, -0.677734375, -0.5068359375, -0.3359375, -0.1650390625, 0.005859375, 0.1767578125, 0.34765625, 0.5185546875, 0.689453125, 0.8603515625, 1.03125, 1.2021484375, 1.373046875, 1.5439453125, 1.71484375, 1.8857421875, 2.056640625, 2.2275390625, 2.3984375, 2.5693359375, 2.740234375, 2.9111328125, 3.08203125, 3.2529296875, 3.423828125, 3.5947265625, 3.765625, 3.9365234375, 4.107421875, 4.2783203125, 4.44921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 6.0, 10.0, 6.0, 9.0, 26.0, 19.0, 20.0, 36.0, 33.0, 37.0, 37.0, 65.0, 51.0, 58.0, 54.0, 53.0, 89.0, 58.0, 58.0, 50.0, 42.0, 37.0, 33.0, 31.0, 16.0, 21.0, 9.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.49609375, -3.37030029296875, -3.2445068359375, -3.11871337890625, -2.992919921875, -2.86712646484375, -2.7413330078125, -2.61553955078125, -2.48974609375, -2.36395263671875, -2.2381591796875, -2.11236572265625, -1.986572265625, -1.86077880859375, -1.7349853515625, -1.60919189453125, -1.4833984375, -1.35760498046875, -1.2318115234375, -1.10601806640625, -0.980224609375, -0.85443115234375, -0.7286376953125, -0.60284423828125, -0.47705078125, -0.35125732421875, -0.2254638671875, -0.09967041015625, 0.026123046875, 0.15191650390625, 0.2777099609375, 0.40350341796875, 0.529296875, 0.65509033203125, 0.7808837890625, 0.90667724609375, 1.032470703125, 1.15826416015625, 1.2840576171875, 1.40985107421875, 1.53564453125, 1.66143798828125, 1.7872314453125, 1.91302490234375, 2.038818359375, 2.16461181640625, 2.2904052734375, 2.41619873046875, 2.5419921875, 2.66778564453125, 2.7935791015625, 2.91937255859375, 3.045166015625, 3.17095947265625, 3.2967529296875, 3.42254638671875, 3.54833984375, 3.67413330078125, 3.7999267578125, 3.92572021484375, 4.051513671875, 4.17730712890625, 4.3031005859375, 4.42889404296875, 4.5546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 10.0, 7.0, 21.0, 26.0, 37.0, 40.0, 71.0, 113.0, 185.0, 304.0, 533.0, 1169.0, 3408.0, 12334.0, 75402.0, 879342.0, 59583.0, 10544.0, 3002.0, 1111.0, 509.0, 272.0, 159.0, 92.0, 79.0, 61.0, 31.0, 22.0, 23.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0078125, -4.8377685546875, -4.667724609375, -4.4976806640625, -4.32763671875, -4.1575927734375, -3.987548828125, -3.8175048828125, -3.6474609375, -3.4774169921875, -3.307373046875, -3.1373291015625, -2.96728515625, -2.7972412109375, -2.627197265625, -2.4571533203125, -2.287109375, -2.1170654296875, -1.947021484375, -1.7769775390625, -1.60693359375, -1.4368896484375, -1.266845703125, -1.0968017578125, -0.9267578125, -0.7567138671875, -0.586669921875, -0.4166259765625, -0.24658203125, -0.0765380859375, 0.093505859375, 0.2635498046875, 0.43359375, 0.6036376953125, 0.773681640625, 0.9437255859375, 1.11376953125, 1.2838134765625, 1.453857421875, 1.6239013671875, 1.7939453125, 1.9639892578125, 2.134033203125, 2.3040771484375, 2.47412109375, 2.6441650390625, 2.814208984375, 2.9842529296875, 3.154296875, 3.3243408203125, 3.494384765625, 3.6644287109375, 3.83447265625, 4.0045166015625, 4.174560546875, 4.3446044921875, 4.5146484375, 4.6846923828125, 4.854736328125, 5.0247802734375, 5.19482421875, 5.3648681640625, 5.534912109375, 5.7049560546875, 5.875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 8.0, 8.0, 13.0, 14.0, 16.0, 18.0, 26.0, 31.0, 31.0, 33.0, 35.0, 55.0, 67.0, 73.0, 70.0, 67.0, 62.0, 61.0, 51.0, 41.0, 24.0, 22.0, 27.0, 9.0, 19.0, 18.0, 9.0, 6.0, 9.0, 8.0, 10.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-12.546875, -12.176513671875, -11.80615234375, -11.435791015625, -11.0654296875, -10.695068359375, -10.32470703125, -9.954345703125, -9.583984375, -9.213623046875, -8.84326171875, -8.472900390625, -8.1025390625, -7.732177734375, -7.36181640625, -6.991455078125, -6.62109375, -6.250732421875, -5.88037109375, -5.510009765625, -5.1396484375, -4.769287109375, -4.39892578125, -4.028564453125, -3.658203125, -3.287841796875, -2.91748046875, -2.547119140625, -2.1767578125, -1.806396484375, -1.43603515625, -1.065673828125, -0.6953125, -0.324951171875, 0.04541015625, 0.415771484375, 0.7861328125, 1.156494140625, 1.52685546875, 1.897216796875, 2.267578125, 2.637939453125, 3.00830078125, 3.378662109375, 3.7490234375, 4.119384765625, 4.48974609375, 4.860107421875, 5.23046875, 5.600830078125, 5.97119140625, 6.341552734375, 6.7119140625, 7.082275390625, 7.45263671875, 7.822998046875, 8.193359375, 8.563720703125, 8.93408203125, 9.304443359375, 9.6748046875, 10.045166015625, 10.41552734375, 10.785888671875, 11.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 4.0, 11.0, 12.0, 14.0, 22.0, 32.0, 31.0, 56.0, 70.0, 132.0, 197.0, 270.0, 503.0, 791.0, 1644.0, 3586.0, 8334.0, 23900.0, 105355.0, 796972.0, 74370.0, 18964.0, 7000.0, 2948.0, 1421.0, 703.0, 431.0, 256.0, 153.0, 112.0, 70.0, 49.0, 36.0, 24.0, 24.0, 14.0, 11.0, 9.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.82568359375, -0.8023605346679688, -0.7790374755859375, -0.7557144165039062, -0.732391357421875, -0.7090682983398438, -0.6857452392578125, -0.6624221801757812, -0.63909912109375, -0.6157760620117188, -0.5924530029296875, -0.5691299438476562, -0.545806884765625, -0.5224838256835938, -0.4991607666015625, -0.47583770751953125, -0.4525146484375, -0.42919158935546875, -0.4058685302734375, -0.38254547119140625, -0.359222412109375, -0.33589935302734375, -0.3125762939453125, -0.28925323486328125, -0.26593017578125, -0.24260711669921875, -0.2192840576171875, -0.19596099853515625, -0.172637939453125, -0.14931488037109375, -0.1259918212890625, -0.10266876220703125, -0.079345703125, -0.05602264404296875, -0.0326995849609375, -0.00937652587890625, 0.013946533203125, 0.03726959228515625, 0.0605926513671875, 0.08391571044921875, 0.10723876953125, 0.13056182861328125, 0.1538848876953125, 0.17720794677734375, 0.200531005859375, 0.22385406494140625, 0.2471771240234375, 0.27050018310546875, 0.2938232421875, 0.31714630126953125, 0.3404693603515625, 0.36379241943359375, 0.387115478515625, 0.41043853759765625, 0.4337615966796875, 0.45708465576171875, 0.48040771484375, 0.5037307739257812, 0.5270538330078125, 0.5503768920898438, 0.573699951171875, 0.5970230102539062, 0.6203460693359375, 0.6436691284179688, 0.6669921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 7.0, 6.0, 14.0, 25.0, 15.0, 42.0, 41.0, 48.0, 88.0, 102.0, 114.0, 109.0, 108.0, 66.0, 38.0, 40.0, 27.0, 21.0, 14.0, 15.0, 5.0, 8.0, 5.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002675056457519531, -0.0002602245658636093, -0.0002529434859752655, -0.0002456624060869217, -0.00023838132619857788, -0.00023110024631023407, -0.00022381916642189026, -0.00021653808653354645, -0.00020925700664520264, -0.00020197592675685883, -0.00019469484686851501, -0.0001874137669801712, -0.0001801326870918274, -0.00017285160720348358, -0.00016557052731513977, -0.00015828944742679596, -0.00015100836753845215, -0.00014372728765010834, -0.00013644620776176453, -0.00012916512787342072, -0.0001218840479850769, -0.0001146029680967331, -0.00010732188820838928, -0.00010004080832004547, -9.275972843170166e-05, -8.547864854335785e-05, -7.819756865501404e-05, -7.091648876667023e-05, -6.363540887832642e-05, -5.6354328989982605e-05, -4.9073249101638794e-05, -4.179216921329498e-05, -3.451108932495117e-05, -2.723000943660736e-05, -1.994892954826355e-05, -1.2667849659919739e-05, -5.386769771575928e-06, 1.8943101167678833e-06, 9.175390005111694e-06, 1.6456469893455505e-05, 2.3737549781799316e-05, 3.101862967014313e-05, 3.829970955848694e-05, 4.558078944683075e-05, 5.286186933517456e-05, 6.014294922351837e-05, 6.742402911186218e-05, 7.4705109000206e-05, 8.19861888885498e-05, 8.926726877689362e-05, 9.654834866523743e-05, 0.00010382942855358124, 0.00011111050844192505, 0.00011839158833026886, 0.00012567266821861267, 0.00013295374810695648, 0.0001402348279953003, 0.0001475159078836441, 0.00015479698777198792, 0.00016207806766033173, 0.00016935914754867554, 0.00017664022743701935, 0.00018392130732536316, 0.00019120238721370697, 0.00019848346710205078]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 16.0, 7.0, 12.0, 18.0, 26.0, 46.0, 76.0, 85.0, 128.0, 212.0, 328.0, 585.0, 991.0, 2026.0, 4190.0, 10450.0, 30537.0, 161880.0, 761164.0, 49798.0, 14657.0, 5631.0, 2503.0, 1313.0, 744.0, 403.0, 270.0, 157.0, 95.0, 65.0, 48.0, 38.0, 17.0, 14.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.86279296875, -0.8310546875, -0.79931640625, -0.767578125, -0.73583984375, -0.7041015625, -0.67236328125, -0.640625, -0.60888671875, -0.5771484375, -0.54541015625, -0.513671875, -0.48193359375, -0.4501953125, -0.41845703125, -0.38671875, -0.35498046875, -0.3232421875, -0.29150390625, -0.259765625, -0.22802734375, -0.1962890625, -0.16455078125, -0.1328125, -0.10107421875, -0.0693359375, -0.03759765625, -0.005859375, 0.02587890625, 0.0576171875, 0.08935546875, 0.12109375, 0.15283203125, 0.1845703125, 0.21630859375, 0.248046875, 0.27978515625, 0.3115234375, 0.34326171875, 0.375, 0.40673828125, 0.4384765625, 0.47021484375, 0.501953125, 0.53369140625, 0.5654296875, 0.59716796875, 0.62890625, 0.66064453125, 0.6923828125, 0.72412109375, 0.755859375, 0.78759765625, 0.8193359375, 0.85107421875, 0.8828125, 0.91455078125, 0.9462890625, 0.97802734375, 1.009765625, 1.04150390625, 1.0732421875, 1.10498046875, 1.13671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 10.0, 8.0, 9.0, 9.0, 15.0, 10.0, 9.0, 13.0, 18.0, 17.0, 23.0, 34.0, 45.0, 51.0, 65.0, 82.0, 100.0, 97.0, 89.0, 62.0, 45.0, 32.0, 24.0, 21.0, 15.0, 10.0, 13.0, 14.0, 10.0, 8.0, 11.0, 7.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.961090087890625, -0.93096923828125, -0.900848388671875, -0.8707275390625, -0.840606689453125, -0.81048583984375, -0.780364990234375, -0.750244140625, -0.720123291015625, -0.69000244140625, -0.659881591796875, -0.6297607421875, -0.599639892578125, -0.56951904296875, -0.539398193359375, -0.50927734375, -0.479156494140625, -0.44903564453125, -0.418914794921875, -0.3887939453125, -0.358673095703125, -0.32855224609375, -0.298431396484375, -0.268310546875, -0.238189697265625, -0.20806884765625, -0.177947998046875, -0.1478271484375, -0.117706298828125, -0.08758544921875, -0.057464599609375, -0.02734375, 0.002777099609375, 0.03289794921875, 0.063018798828125, 0.0931396484375, 0.123260498046875, 0.15338134765625, 0.183502197265625, 0.213623046875, 0.243743896484375, 0.27386474609375, 0.303985595703125, 0.3341064453125, 0.364227294921875, 0.39434814453125, 0.424468994140625, 0.45458984375, 0.484710693359375, 0.51483154296875, 0.544952392578125, 0.5750732421875, 0.605194091796875, 0.63531494140625, 0.665435791015625, 0.695556640625, 0.725677490234375, 0.75579833984375, 0.785919189453125, 0.8160400390625, 0.846160888671875, 0.87628173828125, 0.906402587890625, 0.9365234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 10.0, 4.0, 3.0, 9.0, 13.0, 17.0, 26.0, 46.0, 89.0, 322.0, 225.0, 96.0, 46.0, 40.0, 18.0, 16.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.705677032470703, -15.398041725158691, -14.09040641784668, -12.782772064208984, -11.475136756896973, -10.167501449584961, -8.859867095947266, -7.552231788635254, -6.244596481323242, -4.9369611740112305, -3.629326343536377, -2.3216912746429443, -1.0140562057495117, 0.2935791015625, 1.6012139320373535, 2.908848762512207, 4.216484069824219, 5.5241193771362305, 6.831754207611084, 8.139389038085938, 9.44702434539795, 10.754659652709961, 12.062294006347656, 13.369929313659668, 14.67756462097168, 15.985199928283691, 17.292835235595703, 18.6004695892334, 19.908103942871094, 21.215740203857422, 22.523374557495117, 23.831008911132812, 25.138648986816406, 26.4462833404541, 27.75391960144043, 29.061553955078125, 30.369190216064453, 31.67682456970215, 32.984458923339844, 34.29209518432617, 35.5997314453125, 36.90736770629883, 38.21500015258789, 39.52263641357422, 40.83027267456055, 42.137908935546875, 43.44554138183594, 44.753177642822266, 46.06081008911133, 47.368446350097656, 48.67607879638672, 49.98371505737305, 51.291351318359375, 52.59898376464844, 53.906620025634766, 55.214256286621094, 56.521888732910156, 57.829524993896484, 59.13715744018555, 60.444793701171875, 61.7524299621582, 63.06006622314453, 64.3676986694336, 65.67533111572266, 66.98297119140625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 7.0, 10.0, 6.0, 10.0, 6.0, 8.0, 9.0, 14.0, 27.0, 15.0, 21.0, 27.0, 41.0, 41.0, 77.0, 102.0, 128.0, 114.0, 76.0, 45.0, 19.0, 31.0, 14.0, 13.0, 14.0, 14.0, 12.0, 15.0, 12.0, 11.0, 7.0, 6.0, 7.0, 4.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.786760330200195, -30.809301376342773, -29.83184051513672, -28.854381561279297, -27.876920700073242, -26.89946174621582, -25.922000885009766, -24.944541931152344, -23.967082977294922, -22.9896240234375, -22.012163162231445, -21.034704208374023, -20.05724334716797, -19.079784393310547, -18.102325439453125, -17.12486457824707, -16.147403717041016, -15.169943809509277, -14.192483901977539, -13.215024948120117, -12.237564086914062, -11.26010513305664, -10.282645225524902, -9.305185317993164, -8.327725410461426, -7.3502655029296875, -6.372805595397949, -5.395346164703369, -4.417886257171631, -3.4404263496398926, -2.4629669189453125, -1.4855070114135742, -0.5080451965332031, 0.4694145917892456, 1.4468743801116943, 2.4243340492248535, 3.401793956756592, 4.37925386428833, 5.35671329498291, 6.334173202514648, 7.311633110046387, 8.289093017578125, 9.266552925109863, 10.244012832641602, 11.221471786499023, 12.198932647705078, 13.1763916015625, 14.153851509094238, 15.131311416625977, 16.1087703704834, 17.086231231689453, 18.063690185546875, 19.04115104675293, 20.01861000061035, 20.996070861816406, 21.973529815673828, 22.95098876953125, 23.928447723388672, 24.905908584594727, 25.88336753845215, 26.860828399658203, 27.838287353515625, 28.815746307373047, 29.7932071685791, 30.770668029785156]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 8.0, 13.0, 14.0, 19.0, 29.0, 29.0, 35.0, 32.0, 43.0, 52.0, 88.0, 220.0, 107.0, 61.0, 40.0, 36.0, 29.0, 19.0, 25.0, 15.0, 22.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.235137939453125, -3.10894775390625, -2.982757568359375, -2.8565673828125, -2.730377197265625, -2.60418701171875, -2.477996826171875, -2.351806640625, -2.225616455078125, -2.09942626953125, -1.973236083984375, -1.8470458984375, -1.720855712890625, -1.59466552734375, -1.468475341796875, -1.34228515625, -1.216094970703125, -1.08990478515625, -0.963714599609375, -0.8375244140625, -0.711334228515625, -0.58514404296875, -0.458953857421875, -0.332763671875, -0.206573486328125, -0.08038330078125, 0.045806884765625, 0.1719970703125, 0.298187255859375, 0.42437744140625, 0.550567626953125, 0.6767578125, 0.802947998046875, 0.92913818359375, 1.055328369140625, 1.1815185546875, 1.307708740234375, 1.43389892578125, 1.560089111328125, 1.686279296875, 1.812469482421875, 1.93865966796875, 2.064849853515625, 2.1910400390625, 2.317230224609375, 2.44342041015625, 2.569610595703125, 2.69580078125, 2.821990966796875, 2.94818115234375, 3.074371337890625, 3.2005615234375, 3.326751708984375, 3.45294189453125, 3.579132080078125, 3.705322265625, 3.831512451171875, 3.95770263671875, 4.083892822265625, 4.2100830078125, 4.336273193359375, 4.46246337890625, 4.588653564453125, 4.71484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 11.0, 13.0, 16.0, 37.0, 39.0, 72.0, 114.0, 248.0, 555.0, 1634.0, 5896.0, 59546.0, 8302411.0, 13253.0, 2926.0, 944.0, 384.0, 158.0, 73.0, 53.0, 41.0, 31.0, 26.0, 20.0, 8.0, 7.0, 12.0, 11.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 0.0, 1.0], "bins": [-23.040096282958984, -22.346797943115234, -21.653501510620117, -20.960203170776367, -20.266904830932617, -19.573606491088867, -18.88031005859375, -18.18701171875, -17.49371337890625, -16.8004150390625, -16.107118606567383, -15.413820266723633, -14.720521926879883, -14.02722454071045, -13.333927154541016, -12.640628814697266, -11.947331428527832, -11.254034042358398, -10.560735702514648, -9.867438316345215, -9.174139976501465, -8.480842590332031, -7.7875447273254395, -7.094246864318848, -6.400949001312256, -5.707651138305664, -5.014353275299072, -4.3210554122924805, -3.6277577877044678, -2.934459924697876, -2.2411623001098633, -1.5478644371032715, -0.8545665740966797, -0.16126877069473267, 0.5320290327072144, 1.2253267765045166, 1.9186246395111084, 2.6119225025177, 3.305220127105713, 3.9985179901123047, 4.6918158531188965, 5.385113716125488, 6.07841157913208, 6.771709442138672, 7.4650068283081055, 8.158305168151855, 8.851602554321289, 9.544900894165039, 10.238198280334473, 10.931495666503906, 11.624794006347656, 12.31809139251709, 13.01138973236084, 13.704687118530273, 14.397985458374023, 15.091282844543457, 15.78458023071289, 16.47787857055664, 17.171175003051758, 17.864473342895508, 18.557771682739258, 19.251070022583008, 19.944366455078125, 20.637664794921875, 21.330963134765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-37.35580062866211, -36.37879180908203, -35.40178298950195, -34.42477798461914, -33.44776916503906, -32.470760345458984, -31.493751525878906, -30.51674461364746, -29.539735794067383, -28.562726974487305, -27.58572006225586, -26.60871124267578, -25.631704330444336, -24.654695510864258, -23.677688598632812, -22.700679779052734, -21.723670959472656, -20.746662139892578, -19.769655227661133, -18.792646408081055, -17.81563949584961, -16.83863067626953, -15.86162281036377, -14.884614944458008, -13.907608032226562, -12.9306001663208, -11.953592300415039, -10.976583480834961, -9.9995756149292, -9.022567749023438, -8.045559883117676, -7.068551540374756, -6.091543197631836, -5.114535331726074, -4.137526988983154, -3.1605191230773926, -2.1835110187530518, -1.206502914428711, -0.22949504852294922, 0.7475132942199707, 1.7245211601257324, 2.7015292644500732, 3.678537368774414, 4.655545234680176, 5.6325531005859375, 6.609561443328857, 7.586569309234619, 8.563577651977539, 9.5405855178833, 10.517593383789062, 11.494601249694824, 12.471609115600586, 13.448617935180664, 14.425625801086426, 15.402633666992188, 16.379642486572266, 17.35664939880371, 18.33365821838379, 19.310665130615234, 20.287673950195312, 21.264680862426758, 22.241689682006836, 23.21869659423828, 24.19570541381836, 25.172714233398438]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 19.0, 16.0, 26.0, 34.0, 27.0, 45.0, 50.0, 56.0, 69.0, 65.0, 84.0, 61.0, 76.0, 54.0, 54.0, 52.0, 36.0, 37.0, 29.0, 24.0, 20.0, 12.0, 12.0, 12.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.942779541015625, -3.83477783203125, -3.726776123046875, -3.6187744140625, -3.510772705078125, -3.40277099609375, -3.294769287109375, -3.186767578125, -3.078765869140625, -2.97076416015625, -2.862762451171875, -2.7547607421875, -2.646759033203125, -2.53875732421875, -2.430755615234375, -2.32275390625, -2.214752197265625, -2.10675048828125, -1.998748779296875, -1.8907470703125, -1.782745361328125, -1.67474365234375, -1.566741943359375, -1.458740234375, -1.350738525390625, -1.24273681640625, -1.134735107421875, -1.0267333984375, -0.918731689453125, -0.81072998046875, -0.702728271484375, -0.5947265625, -0.486724853515625, -0.37872314453125, -0.270721435546875, -0.1627197265625, -0.054718017578125, 0.05328369140625, 0.161285400390625, 0.269287109375, 0.377288818359375, 0.48529052734375, 0.593292236328125, 0.7012939453125, 0.809295654296875, 0.91729736328125, 1.025299072265625, 1.13330078125, 1.241302490234375, 1.34930419921875, 1.457305908203125, 1.5653076171875, 1.673309326171875, 1.78131103515625, 1.889312744140625, 1.997314453125, 2.105316162109375, 2.21331787109375, 2.321319580078125, 2.4293212890625, 2.537322998046875, 2.64532470703125, 2.753326416015625, 2.861328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 6.0, 7.0, 19.0, 11.0, 26.0, 51.0, 77.0, 151.0, 297.0, 638.0, 1459.0, 3924.0, 11169.0, 35279.0, 114885.0, 211167.0, 98864.0, 30260.0, 9929.0, 3456.0, 1392.0, 586.0, 244.0, 142.0, 60.0, 47.0, 30.0, 21.0, 15.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.453125, -18.76904296875, -18.0849609375, -17.40087890625, -16.716796875, -16.03271484375, -15.3486328125, -14.66455078125, -13.98046875, -13.29638671875, -12.6123046875, -11.92822265625, -11.244140625, -10.56005859375, -9.8759765625, -9.19189453125, -8.5078125, -7.82373046875, -7.1396484375, -6.45556640625, -5.771484375, -5.08740234375, -4.4033203125, -3.71923828125, -3.03515625, -2.35107421875, -1.6669921875, -0.98291015625, -0.298828125, 0.38525390625, 1.0693359375, 1.75341796875, 2.4375, 3.12158203125, 3.8056640625, 4.48974609375, 5.173828125, 5.85791015625, 6.5419921875, 7.22607421875, 7.91015625, 8.59423828125, 9.2783203125, 9.96240234375, 10.646484375, 11.33056640625, 12.0146484375, 12.69873046875, 13.3828125, 14.06689453125, 14.7509765625, 15.43505859375, 16.119140625, 16.80322265625, 17.4873046875, 18.17138671875, 18.85546875, 19.53955078125, 20.2236328125, 20.90771484375, 21.591796875, 22.27587890625, 22.9599609375, 23.64404296875, 24.328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 8.0, 6.0, 11.0, 17.0, 28.0, 26.0, 37.0, 43.0, 58.0, 41.0, 60.0, 56.0, 60.0, 73.0, 63.0, 70.0, 55.0, 62.0, 34.0, 33.0, 34.0, 30.0, 22.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.452789306640625, -3.34893798828125, -3.245086669921875, -3.1412353515625, -3.037384033203125, -2.93353271484375, -2.829681396484375, -2.725830078125, -2.621978759765625, -2.51812744140625, -2.414276123046875, -2.3104248046875, -2.206573486328125, -2.10272216796875, -1.998870849609375, -1.89501953125, -1.791168212890625, -1.68731689453125, -1.583465576171875, -1.4796142578125, -1.375762939453125, -1.27191162109375, -1.168060302734375, -1.064208984375, -0.960357666015625, -0.85650634765625, -0.752655029296875, -0.6488037109375, -0.544952392578125, -0.44110107421875, -0.337249755859375, -0.2333984375, -0.129547119140625, -0.02569580078125, 0.078155517578125, 0.1820068359375, 0.285858154296875, 0.38970947265625, 0.493560791015625, 0.597412109375, 0.701263427734375, 0.80511474609375, 0.908966064453125, 1.0128173828125, 1.116668701171875, 1.22052001953125, 1.324371337890625, 1.42822265625, 1.532073974609375, 1.63592529296875, 1.739776611328125, 1.8436279296875, 1.947479248046875, 2.05133056640625, 2.155181884765625, 2.259033203125, 2.362884521484375, 2.46673583984375, 2.570587158203125, 2.6744384765625, 2.778289794921875, 2.88214111328125, 2.985992431640625, 3.08984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 7.0, 4.0, 6.0, 13.0, 17.0, 38.0, 75.0, 106.0, 96.0, 46.0, 25.0, 10.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.659618377685547, -29.742244720458984, -28.82486915588379, -27.907495498657227, -26.990121841430664, -26.07274627685547, -25.155372619628906, -24.237998962402344, -23.32062339782715, -22.403249740600586, -21.48587417602539, -20.568500518798828, -19.651126861572266, -18.73375129699707, -17.816377639770508, -16.899002075195312, -15.981629371643066, -15.064254760742188, -14.146881103515625, -13.229506492614746, -12.312131881713867, -11.394758224487305, -10.477383613586426, -9.560009002685547, -8.642635345458984, -7.725261211395264, -6.807886600494385, -5.890512466430664, -4.973137855529785, -4.0557637214660645, -3.1383895874023438, -2.221014976501465, -1.303640365600586, -0.3862660527229309, 0.5311082601547241, 1.4484825134277344, 2.365856885910034, 3.283231258392334, 4.200605392456055, 5.117980003356934, 6.035354137420654, 6.952728271484375, 7.870102882385254, 8.787477493286133, 9.704851150512695, 10.622225761413574, 11.539600372314453, 12.456974029541016, 13.374348640441895, 14.291723251342773, 15.209096908569336, 16.12647247314453, 17.043846130371094, 17.961219787597656, 18.87859344482422, 19.795969009399414, 20.713342666625977, 21.63071632385254, 22.548091888427734, 23.465465545654297, 24.38283920288086, 25.300214767456055, 26.217588424682617, 27.134963989257812, 28.052337646484375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 9.0, 2.0, 5.0, 27.0, 54.0, 132.0, 121.0, 59.0, 20.0, 8.0, 9.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.553199768066406, -24.54115104675293, -23.52910041809082, -22.517051696777344, -21.505001068115234, -20.492952346801758, -19.48090362548828, -18.468852996826172, -17.456804275512695, -16.44475555419922, -15.43270492553711, -14.420656204223633, -13.40860652923584, -12.396556854248047, -11.38450813293457, -10.372458457946777, -9.360408782958984, -8.348359107971191, -7.336309909820557, -6.324260711669922, -5.312211036682129, -4.300161361694336, -3.288112163543701, -2.2760629653930664, -1.2640132904052734, -0.25196385383605957, 0.7600855827331543, 1.7721350193023682, 2.784184455871582, 3.796234130859375, 4.80828332901001, 5.8203325271606445, 6.832378387451172, 7.844428062438965, 8.856477737426758, 9.868526458740234, 10.880576133728027, 11.89262580871582, 12.904674530029297, 13.91672420501709, 14.928773880004883, 15.940823554992676, 16.95287322998047, 17.964921951293945, 18.976970672607422, 19.98902130126953, 21.001070022583008, 22.013118743896484, 23.025169372558594, 24.03721809387207, 25.04926872253418, 26.061317443847656, 27.073368072509766, 28.085416793823242, 29.09746551513672, 30.109516143798828, 31.121564865112305, 32.13361358642578, 33.14566421508789, 34.15771484375, 35.169761657714844, 36.18181228637695, 37.19386291503906, 38.205909729003906, 39.217960357666016]}, "eval/loss": 1.85287344455719, "eval/wer": 0.9976993256644189, "eval/runtime": 896.1552, "eval/samples_per_second": 2.948, "eval/steps_per_second": 0.369, "train/train_runtime": 114528.9287, "train/train_samples_per_second": 4.984, "train/train_steps_per_second": 0.156, "train/total_flos": 0.0, "train/train_loss": 0.9826719127995244} \ No newline at end of file