diff --git "a/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" --- "a/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" +++ "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.3634, "train/learning_rate": 4.750593824228029e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 115954, "_timestamp": 1647709832, "_step": 17847, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [3.0, 6.0, 11.0, 43.0, 105.0, 198.0, 326.0, 195.0, 91.0, 29.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845430850982666, -4.951228618621826, -4.057026386260986, -3.1628243923187256, -2.2686221599578857, -1.374420166015625, -0.48021793365478516, 0.4139842987060547, 1.3081865310668945, 2.2023887634277344, 3.096590995788574, 3.990792989730835, 4.884995460510254, 5.7791972160339355, 6.673399448394775, 7.567601680755615, 8.461803436279297, 9.356005668640137, 10.250207901000977, 11.144410133361816, 12.038612365722656, 12.93281364440918, 13.827016830444336, 14.72121810913086, 15.615421295166016, 16.50962257385254, 17.403825759887695, 18.29802703857422, 19.192230224609375, 20.0864315032959, 20.980634689331055, 21.874835968017578, 22.7690372467041, 23.663238525390625, 24.55744171142578, 25.451642990112305, 26.34584617614746, 27.240047454833984, 28.13425064086914, 29.028451919555664, 29.92265510559082, 30.816856384277344, 31.7110595703125, 32.605262756347656, 33.49946212768555, 34.3936653137207, 35.28786849975586, 36.182071685791016, 37.076271057128906, 37.97047424316406, 38.86467361450195, 39.75887680053711, 40.653079986572266, 41.54728317260742, 42.44148254394531, 43.33568572998047, 44.229888916015625, 45.12409210205078, 46.01829147338867, 46.91249465942383, 47.806697845458984, 48.70090103149414, 49.59510040283203, 50.48930358886719, 51.383506774902344]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 8.0, 12.0, 8.0, 8.0, 12.0, 17.0, 12.0, 24.0, 21.0, 22.0, 31.0, 34.0, 24.0, 27.0, 36.0, 42.0, 46.0, 40.0, 40.0, 44.0, 61.0, 46.0, 41.0, 33.0, 29.0, 41.0, 28.0, 30.0, 15.0, 24.0, 28.0, 18.0, 17.0, 17.0, 7.0, 6.0, 8.0, 8.0, 8.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.530182838439941, -5.347039222717285, -5.163896083831787, -4.980752468109131, -4.797609329223633, -4.614465713500977, -4.43132209777832, -4.248178482055664, -4.065035343170166, -3.881891965866089, -3.6987485885620117, -3.5156049728393555, -3.3324615955352783, -3.149318218231201, -2.966174602508545, -2.7830312252044678, -2.5998878479003906, -2.4167444705963135, -2.2336010932922363, -2.05045747756958, -1.867314100265503, -1.6841707229614258, -1.501027226448059, -1.3178837299346924, -1.1347403526306152, -0.9515969157218933, -0.7684534788131714, -0.5853100419044495, -0.40216660499572754, -0.21902316808700562, -0.03587973117828369, 0.147263765335083, 0.33040761947631836, 0.5135510563850403, 0.6966944932937622, 0.8798379302024841, 1.062981367111206, 1.2461247444152832, 1.42926824092865, 1.6124117374420166, 1.7955551147460938, 1.978698492050171, 2.161841869354248, 2.3449854850769043, 2.5281288623809814, 2.7112722396850586, 2.894415855407715, 3.077559232711792, 3.260702610015869, 3.4438459873199463, 3.6269893646240234, 3.8101329803466797, 3.993276357650757, 4.176419734954834, 4.35956335067749, 4.542706489562988, 4.7258501052856445, 4.908993721008301, 5.092136859893799, 5.275280475616455, 5.458423614501953, 5.641567230224609, 5.824710845947266, 6.007854461669922, 6.19099760055542]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 7.0, 7.0, 10.0, 18.0, 23.0, 18.0, 21.0, 34.0, 36.0, 37.0, 48.0, 45.0, 43.0, 57.0, 65.0, 69.0, 63.0, 51.0, 45.0, 33.0, 39.0, 39.0, 36.0, 28.0, 19.0, 23.0, 15.0, 17.0, 6.0, 6.0, 7.0, 7.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.7312545776367188, -0.7090911865234375, -0.6869277954101562, -0.664764404296875, -0.6426010131835938, -0.6204376220703125, -0.5982742309570312, -0.57611083984375, -0.5539474487304688, -0.5317840576171875, -0.5096206665039062, -0.487457275390625, -0.46529388427734375, -0.4431304931640625, -0.42096710205078125, -0.3988037109375, -0.37664031982421875, -0.3544769287109375, -0.33231353759765625, -0.310150146484375, -0.28798675537109375, -0.2658233642578125, -0.24365997314453125, -0.22149658203125, -0.19933319091796875, -0.1771697998046875, -0.15500640869140625, -0.132843017578125, -0.11067962646484375, -0.0885162353515625, -0.06635284423828125, -0.044189453125, -0.02202606201171875, 0.0001373291015625, 0.02230072021484375, 0.044464111328125, 0.06662750244140625, 0.0887908935546875, 0.11095428466796875, 0.13311767578125, 0.15528106689453125, 0.1774444580078125, 0.19960784912109375, 0.221771240234375, 0.24393463134765625, 0.2660980224609375, 0.28826141357421875, 0.3104248046875, 0.33258819580078125, 0.3547515869140625, 0.37691497802734375, 0.399078369140625, 0.42124176025390625, 0.4434051513671875, 0.46556854248046875, 0.48773193359375, 0.5098953247070312, 0.5320587158203125, 0.5542221069335938, 0.576385498046875, 0.5985488891601562, 0.6207122802734375, 0.6428756713867188, 0.6650390625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 14.0, 19.0, 32.0, 32.0, 49.0, 83.0, 100.0, 146.0, 196.0, 298.0, 475.0, 1167.0, 3939.0, 19260.0, 189804.0, 3827644.0, 128776.0, 16054.0, 3656.0, 1094.0, 489.0, 289.0, 178.0, 127.0, 81.0, 69.0, 61.0, 38.0, 39.0, 18.0, 21.0, 7.0, 8.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.26849365234375, -8.0135498046875, -7.75860595703125, -7.503662109375, -7.24871826171875, -6.9937744140625, -6.73883056640625, -6.48388671875, -6.22894287109375, -5.9739990234375, -5.71905517578125, -5.464111328125, -5.20916748046875, -4.9542236328125, -4.69927978515625, -4.4443359375, -4.18939208984375, -3.9344482421875, -3.67950439453125, -3.424560546875, -3.16961669921875, -2.9146728515625, -2.65972900390625, -2.40478515625, -2.14984130859375, -1.8948974609375, -1.63995361328125, -1.385009765625, -1.13006591796875, -0.8751220703125, -0.62017822265625, -0.365234375, -0.11029052734375, 0.1446533203125, 0.39959716796875, 0.654541015625, 0.90948486328125, 1.1644287109375, 1.41937255859375, 1.67431640625, 1.92926025390625, 2.1842041015625, 2.43914794921875, 2.694091796875, 2.94903564453125, 3.2039794921875, 3.45892333984375, 3.7138671875, 3.96881103515625, 4.2237548828125, 4.47869873046875, 4.733642578125, 4.98858642578125, 5.2435302734375, 5.49847412109375, 5.75341796875, 6.00836181640625, 6.2633056640625, 6.51824951171875, 6.773193359375, 7.02813720703125, 7.2830810546875, 7.53802490234375, 7.79296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 23.0, 63.0, 99.0, 194.0, 527.0, 1662.0, 903.0, 322.0, 141.0, 70.0, 39.0, 19.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.46923828125, -9.2666015625, -9.06396484375, -8.861328125, -8.65869140625, -8.4560546875, -8.25341796875, -8.05078125, -7.84814453125, -7.6455078125, -7.44287109375, -7.240234375, -7.03759765625, -6.8349609375, -6.63232421875, -6.4296875, -6.22705078125, -6.0244140625, -5.82177734375, -5.619140625, -5.41650390625, -5.2138671875, -5.01123046875, -4.80859375, -4.60595703125, -4.4033203125, -4.20068359375, -3.998046875, -3.79541015625, -3.5927734375, -3.39013671875, -3.1875, -2.98486328125, -2.7822265625, -2.57958984375, -2.376953125, -2.17431640625, -1.9716796875, -1.76904296875, -1.56640625, -1.36376953125, -1.1611328125, -0.95849609375, -0.755859375, -0.55322265625, -0.3505859375, -0.14794921875, 0.0546875, 0.25732421875, 0.4599609375, 0.66259765625, 0.865234375, 1.06787109375, 1.2705078125, 1.47314453125, 1.67578125, 1.87841796875, 2.0810546875, 2.28369140625, 2.486328125, 2.68896484375, 2.8916015625, 3.09423828125, 3.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 8.0, 15.0, 31.0, 41.0, 81.0, 160.0, 586.0, 4736.0, 195360.0, 3961587.0, 29464.0, 1617.0, 330.0, 111.0, 62.0, 45.0, 19.0, 15.0, 9.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.904541015625, -34.05908203125, -33.213623046875, -32.3681640625, -31.522705078125, -30.67724609375, -29.831787109375, -28.986328125, -28.140869140625, -27.29541015625, -26.449951171875, -25.6044921875, -24.759033203125, -23.91357421875, -23.068115234375, -22.22265625, -21.377197265625, -20.53173828125, -19.686279296875, -18.8408203125, -17.995361328125, -17.14990234375, -16.304443359375, -15.458984375, -14.613525390625, -13.76806640625, -12.922607421875, -12.0771484375, -11.231689453125, -10.38623046875, -9.540771484375, -8.6953125, -7.849853515625, -7.00439453125, -6.158935546875, -5.3134765625, -4.468017578125, -3.62255859375, -2.777099609375, -1.931640625, -1.086181640625, -0.24072265625, 0.604736328125, 1.4501953125, 2.295654296875, 3.14111328125, 3.986572265625, 4.83203125, 5.677490234375, 6.52294921875, 7.368408203125, 8.2138671875, 9.059326171875, 9.90478515625, 10.750244140625, 11.595703125, 12.441162109375, 13.28662109375, 14.132080078125, 14.9775390625, 15.822998046875, 16.66845703125, 17.513916015625, 18.359375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 12.0, 8.0, 27.0, 35.0, 57.0, 100.0, 99.0, 148.0, 125.0, 134.0, 95.0, 62.0, 49.0, 27.0, 9.0, 10.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.54487419128418, -23.042083740234375, -22.53929328918457, -22.036502838134766, -21.53371238708496, -21.030921936035156, -20.52813148498535, -20.025341033935547, -19.522550582885742, -19.019760131835938, -18.516969680786133, -18.014179229736328, -17.511388778686523, -17.00859832763672, -16.505807876586914, -16.00301742553711, -15.500226020812988, -14.997435569763184, -14.494645118713379, -13.991854667663574, -13.48906421661377, -12.986273765563965, -12.483482360839844, -11.980691909790039, -11.477901458740234, -10.97511100769043, -10.472320556640625, -9.96953010559082, -9.466739654541016, -8.963949203491211, -8.461158752441406, -7.958367824554443, -7.455578804016113, -6.952788352966309, -6.449997901916504, -5.947207450866699, -5.4444169998168945, -4.94162654876709, -4.438835620880127, -3.9360451698303223, -3.4332547187805176, -2.930464267730713, -2.427673816680908, -1.9248831272125244, -1.4220926761627197, -0.919302225112915, -0.41651153564453125, 0.08627891540527344, 0.5890693664550781, 1.0918598175048828, 1.594650387763977, 2.0974409580230713, 2.600231409072876, 3.1030218601226807, 3.6058125495910645, 4.108603000640869, 4.611393451690674, 5.1141839027404785, 5.616974353790283, 6.119765281677246, 6.622555732727051, 7.1253461837768555, 7.62813663482666, 8.130927085876465, 8.63371753692627]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 10.0, 7.0, 7.0, 10.0, 12.0, 9.0, 19.0, 21.0, 25.0, 35.0, 31.0, 45.0, 30.0, 30.0, 34.0, 50.0, 34.0, 47.0, 38.0, 49.0, 44.0, 32.0, 32.0, 35.0, 40.0, 36.0, 24.0, 34.0, 29.0, 30.0, 12.0, 20.0, 10.0, 14.0, 7.0, 7.0, 10.0, 3.0, 5.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.30954647064209, -8.061635971069336, -7.813724994659424, -7.565814018249512, -7.317903518676758, -7.069992542266846, -6.822081565856934, -6.57417106628418, -6.326260089874268, -6.0783491134643555, -5.830438613891602, -5.5825276374816895, -5.334616661071777, -5.086706161499023, -4.838795185089111, -4.590884208679199, -4.342973709106445, -4.095062732696533, -3.8471522331237793, -3.599241256713867, -3.351330518722534, -3.103419780731201, -2.855508804321289, -2.607598066329956, -2.359687328338623, -2.11177659034729, -1.8638657331466675, -1.615954875946045, -1.368044137954712, -1.120133399963379, -0.8722225427627563, -0.6243116855621338, -0.376401424407959, -0.1284906268119812, 0.11942017078399658, 0.36733096837997437, 0.6152417659759521, 0.8631525039672852, 1.1110633611679077, 1.3589742183685303, 1.6068849563598633, 1.8547956943511963, 2.1027064323425293, 2.3506174087524414, 2.5985281467437744, 2.8464388847351074, 3.0943498611450195, 3.3422605991363525, 3.5901713371276855, 3.8380820751190186, 4.085992813110352, 4.333903789520264, 4.581814765930176, 4.82972526550293, 5.077636241912842, 5.325547218322754, 5.573457717895508, 5.82136869430542, 6.069279193878174, 6.317190170288086, 6.56510066986084, 6.813011646270752, 7.060922622680664, 7.308833122253418, 7.55674409866333]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 11.0, 9.0, 10.0, 14.0, 9.0, 18.0, 24.0, 28.0, 29.0, 18.0, 28.0, 36.0, 24.0, 44.0, 35.0, 46.0, 38.0, 54.0, 51.0, 47.0, 44.0, 53.0, 38.0, 34.0, 28.0, 38.0, 41.0, 27.0, 14.0, 24.0, 11.0, 18.0, 13.0, 10.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.78271484375, -0.7615890502929688, -0.7404632568359375, -0.7193374633789062, -0.698211669921875, -0.6770858764648438, -0.6559600830078125, -0.6348342895507812, -0.61370849609375, -0.5925827026367188, -0.5714569091796875, -0.5503311157226562, -0.529205322265625, -0.5080795288085938, -0.4869537353515625, -0.46582794189453125, -0.4447021484375, -0.42357635498046875, -0.4024505615234375, -0.38132476806640625, -0.360198974609375, -0.33907318115234375, -0.3179473876953125, -0.29682159423828125, -0.27569580078125, -0.25457000732421875, -0.2334442138671875, -0.21231842041015625, -0.191192626953125, -0.17006683349609375, -0.1489410400390625, -0.12781524658203125, -0.106689453125, -0.08556365966796875, -0.0644378662109375, -0.04331207275390625, -0.022186279296875, -0.00106048583984375, 0.0200653076171875, 0.04119110107421875, 0.06231689453125, 0.08344268798828125, 0.1045684814453125, 0.12569427490234375, 0.146820068359375, 0.16794586181640625, 0.1890716552734375, 0.21019744873046875, 0.2313232421875, 0.25244903564453125, 0.2735748291015625, 0.29470062255859375, 0.315826416015625, 0.33695220947265625, 0.3580780029296875, 0.37920379638671875, 0.40032958984375, 0.42145538330078125, 0.4425811767578125, 0.46370697021484375, 0.484832763671875, 0.5059585571289062, 0.5270843505859375, 0.5482101440429688, 0.5693359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 8.0, 19.0, 17.0, 37.0, 76.0, 112.0, 150.0, 230.0, 350.0, 544.0, 851.0, 1294.0, 2068.0, 3260.0, 5435.0, 9017.0, 14766.0, 24497.0, 40298.0, 64996.0, 101558.0, 147295.0, 179144.0, 155404.0, 111210.0, 72108.0, 44589.0, 27220.0, 16203.0, 9685.0, 6128.0, 3702.0, 2260.0, 1442.0, 896.0, 594.0, 353.0, 248.0, 169.0, 98.0, 80.0, 43.0, 33.0, 23.0, 14.0, 6.0, 11.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66552734375, -0.645721435546875, -0.62591552734375, -0.606109619140625, -0.5863037109375, -0.566497802734375, -0.54669189453125, -0.526885986328125, -0.507080078125, -0.487274169921875, -0.46746826171875, -0.447662353515625, -0.4278564453125, -0.408050537109375, -0.38824462890625, -0.368438720703125, -0.3486328125, -0.328826904296875, -0.30902099609375, -0.289215087890625, -0.2694091796875, -0.249603271484375, -0.22979736328125, -0.209991455078125, -0.190185546875, -0.170379638671875, -0.15057373046875, -0.130767822265625, -0.1109619140625, -0.091156005859375, -0.07135009765625, -0.051544189453125, -0.03173828125, -0.011932373046875, 0.00787353515625, 0.027679443359375, 0.0474853515625, 0.067291259765625, 0.08709716796875, 0.106903076171875, 0.126708984375, 0.146514892578125, 0.16632080078125, 0.186126708984375, 0.2059326171875, 0.225738525390625, 0.24554443359375, 0.265350341796875, 0.28515625, 0.304962158203125, 0.32476806640625, 0.344573974609375, 0.3643798828125, 0.384185791015625, 0.40399169921875, 0.423797607421875, 0.443603515625, 0.463409423828125, 0.48321533203125, 0.503021240234375, 0.5228271484375, 0.542633056640625, 0.56243896484375, 0.582244873046875, 0.60205078125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 5.0, 5.0, 9.0, 14.0, 9.0, 14.0, 14.0, 22.0, 22.0, 23.0, 28.0, 39.0, 36.0, 35.0, 28.0, 48.0, 48.0, 40.0, 1067.0, 62.0, 42.0, 47.0, 50.0, 30.0, 34.0, 36.0, 29.0, 20.0, 23.0, 29.0, 18.0, 16.0, 13.0, 13.0, 10.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65673828125, -0.635223388671875, -0.61370849609375, -0.592193603515625, -0.5706787109375, -0.549163818359375, -0.52764892578125, -0.506134033203125, -0.484619140625, -0.463104248046875, -0.44158935546875, -0.420074462890625, -0.3985595703125, -0.377044677734375, -0.35552978515625, -0.334014892578125, -0.3125, -0.290985107421875, -0.26947021484375, -0.247955322265625, -0.2264404296875, -0.204925537109375, -0.18341064453125, -0.161895751953125, -0.140380859375, -0.118865966796875, -0.09735107421875, -0.075836181640625, -0.0543212890625, -0.032806396484375, -0.01129150390625, 0.010223388671875, 0.03173828125, 0.053253173828125, 0.07476806640625, 0.096282958984375, 0.1177978515625, 0.139312744140625, 0.16082763671875, 0.182342529296875, 0.203857421875, 0.225372314453125, 0.24688720703125, 0.268402099609375, 0.2899169921875, 0.311431884765625, 0.33294677734375, 0.354461669921875, 0.3759765625, 0.397491455078125, 0.41900634765625, 0.440521240234375, 0.4620361328125, 0.483551025390625, 0.50506591796875, 0.526580810546875, 0.548095703125, 0.569610595703125, 0.59112548828125, 0.612640380859375, 0.6341552734375, 0.655670166015625, 0.67718505859375, 0.698699951171875, 0.72021484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 6.0, 3.0, 5.0, 4.0, 12.0, 15.0, 20.0, 40.0, 59.0, 58.0, 82.0, 133.0, 210.0, 276.0, 378.0, 570.0, 813.0, 1164.0, 1750.0, 2669.0, 3797.0, 5615.0, 8660.0, 13629.0, 22686.0, 45313.0, 175298.0, 1443544.0, 249500.0, 53007.0, 25031.0, 14726.0, 9142.0, 6082.0, 4082.0, 2719.0, 1889.0, 1303.0, 869.0, 630.0, 412.0, 269.0, 208.0, 148.0, 101.0, 65.0, 51.0, 38.0, 16.0, 12.0, 11.0, 9.0, 4.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.59033203125, -0.5710296630859375, -0.551727294921875, -0.5324249267578125, -0.51312255859375, -0.4938201904296875, -0.474517822265625, -0.4552154541015625, -0.4359130859375, -0.4166107177734375, -0.397308349609375, -0.3780059814453125, -0.35870361328125, -0.3394012451171875, -0.320098876953125, -0.3007965087890625, -0.281494140625, -0.2621917724609375, -0.242889404296875, -0.2235870361328125, -0.20428466796875, -0.1849822998046875, -0.165679931640625, -0.1463775634765625, -0.1270751953125, -0.1077728271484375, -0.088470458984375, -0.0691680908203125, -0.04986572265625, -0.0305633544921875, -0.011260986328125, 0.0080413818359375, 0.02734375, 0.0466461181640625, 0.065948486328125, 0.0852508544921875, 0.10455322265625, 0.1238555908203125, 0.143157958984375, 0.1624603271484375, 0.1817626953125, 0.2010650634765625, 0.220367431640625, 0.2396697998046875, 0.25897216796875, 0.2782745361328125, 0.297576904296875, 0.3168792724609375, 0.336181640625, 0.3554840087890625, 0.374786376953125, 0.3940887451171875, 0.41339111328125, 0.4326934814453125, 0.451995849609375, 0.4712982177734375, 0.4906005859375, 0.5099029541015625, 0.529205322265625, 0.5485076904296875, 0.56781005859375, 0.5871124267578125, 0.606414794921875, 0.6257171630859375, 0.64501953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 14.0, 12.0, 15.0, 23.0, 25.0, 35.0, 40.0, 77.0, 105.0, 90.0, 103.0, 93.0, 93.0, 62.0, 55.0, 48.0, 23.0, 21.0, 9.0, 9.0, 11.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.21038246154785156, -0.20372390747070312, -0.1970653533935547, -0.19040679931640625, -0.1837482452392578, -0.17708969116210938, -0.17043113708496094, -0.1637725830078125, -0.15711402893066406, -0.15045547485351562, -0.1437969207763672, -0.13713836669921875, -0.1304798126220703, -0.12382125854492188, -0.11716270446777344, -0.110504150390625, -0.10384559631347656, -0.09718704223632812, -0.09052848815917969, -0.08386993408203125, -0.07721138000488281, -0.07055282592773438, -0.06389427185058594, -0.0572357177734375, -0.05057716369628906, -0.043918609619140625, -0.03726005554199219, -0.03060150146484375, -0.023942947387695312, -0.017284393310546875, -0.010625839233398438, -0.00396728515625, 0.0026912689208984375, 0.009349822998046875, 0.016008377075195312, 0.02266693115234375, 0.029325485229492188, 0.035984039306640625, 0.04264259338378906, 0.0493011474609375, 0.05595970153808594, 0.06261825561523438, 0.06927680969238281, 0.07593536376953125, 0.08259391784667969, 0.08925247192382812, 0.09591102600097656, 0.102569580078125, 0.10922813415527344, 0.11588668823242188, 0.12254524230957031, 0.12920379638671875, 0.1358623504638672, 0.14252090454101562, 0.14917945861816406, 0.1558380126953125, 0.16249656677246094, 0.16915512084960938, 0.1758136749267578, 0.18247222900390625, 0.1891307830810547, 0.19578933715820312, 0.20244789123535156, 0.2091064453125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 11.0, 9.0, 25.0, 16.0, 37.0, 50.0, 52.0, 72.0, 87.0, 143.0, 285.0, 586.0, 1903.0, 13715.0, 671972.0, 347247.0, 9655.0, 1437.0, 482.0, 235.0, 161.0, 108.0, 60.0, 61.0, 42.0, 19.0, 24.0, 14.0, 5.0, 7.0, 11.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3671875, -2.2880859375, -2.208984375, -2.1298828125, -2.05078125, -1.9716796875, -1.892578125, -1.8134765625, -1.734375, -1.6552734375, -1.576171875, -1.4970703125, -1.41796875, -1.3388671875, -1.259765625, -1.1806640625, -1.1015625, -1.0224609375, -0.943359375, -0.8642578125, -0.78515625, -0.7060546875, -0.626953125, -0.5478515625, -0.46875, -0.3896484375, -0.310546875, -0.2314453125, -0.15234375, -0.0732421875, 0.005859375, 0.0849609375, 0.1640625, 0.2431640625, 0.322265625, 0.4013671875, 0.48046875, 0.5595703125, 0.638671875, 0.7177734375, 0.796875, 0.8759765625, 0.955078125, 1.0341796875, 1.11328125, 1.1923828125, 1.271484375, 1.3505859375, 1.4296875, 1.5087890625, 1.587890625, 1.6669921875, 1.74609375, 1.8251953125, 1.904296875, 1.9833984375, 2.0625, 2.1416015625, 2.220703125, 2.2998046875, 2.37890625, 2.4580078125, 2.537109375, 2.6162109375, 2.6953125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 22.0, 20.0, 18.0, 36.0, 47.0, 75.0, 129.0, 177.0, 158.0, 122.0, 66.0, 45.0, 18.0, 19.0, 8.0, 9.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7907149195671082, -0.7484149932861328, -0.7061150670051575, -0.6638151407241821, -0.6215152740478516, -0.5792152881622314, -0.5369154214859009, -0.49461549520492554, -0.4523155689239502, -0.41001564264297485, -0.3677157163619995, -0.32541581988334656, -0.2831158936023712, -0.24081596732139587, -0.19851607084274292, -0.15621614456176758, -0.11391621828079224, -0.07161629945039749, -0.029316380620002747, 0.012983530759811401, 0.05528345704078674, 0.09758338332176208, 0.13988327980041504, 0.18218320608139038, 0.22448313236236572, 0.26678305864334106, 0.3090829849243164, 0.35138288140296936, 0.3936828076839447, 0.43598273396492004, 0.478282630443573, 0.5205825567245483, 0.5628825426101685, 0.6051824688911438, 0.6474823951721191, 0.6897822618484497, 0.7320822477340698, 0.7743821144104004, 0.8166820406913757, 0.8589819669723511, 0.9012818932533264, 0.9435818195343018, 0.9858817458152771, 1.0281816720962524, 1.070481538772583, 1.1127815246582031, 1.1550813913345337, 1.1973812580108643, 1.2396812438964844, 1.281981110572815, 1.324281096458435, 1.3665809631347656, 1.4088809490203857, 1.4511808156967163, 1.4934806823730469, 1.535780668258667, 1.578080654144287, 1.6203805208206177, 1.6626805067062378, 1.7049803733825684, 1.7472803592681885, 1.789580225944519, 1.8318800926208496, 1.8741800785064697, 1.9164799451828003]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 6.0, 1.0, 1.0, 3.0, 9.0, 7.0, 11.0, 16.0, 16.0, 27.0, 20.0, 35.0, 27.0, 36.0, 38.0, 40.0, 43.0, 59.0, 47.0, 53.0, 40.0, 41.0, 53.0, 54.0, 47.0, 41.0, 42.0, 29.0, 30.0, 26.0, 19.0, 21.0, 12.0, 10.0, 10.0, 12.0, 4.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46852099895477295, -0.45353963971138, -0.43855828046798706, -0.4235769212245941, -0.40859556198120117, -0.39361417293548584, -0.3786328434944153, -0.36365145444869995, -0.348670095205307, -0.33368873596191406, -0.3187073767185211, -0.3037260174751282, -0.28874465823173523, -0.2737632989883423, -0.25878190994262695, -0.243800550699234, -0.22881920635700226, -0.21383784711360931, -0.19885648787021637, -0.18387511372566223, -0.1688937544822693, -0.15391239523887634, -0.1389310359954834, -0.12394966930150986, -0.10896831005811691, -0.09398695081472397, -0.07900558412075043, -0.06402422487735748, -0.04904286190867424, -0.034061498939991, -0.019080139696598053, -0.004098773002624512, 0.010882586240768433, 0.025863949209451675, 0.04084531217813492, 0.05582667142152786, 0.0708080381155014, 0.08578939735889435, 0.10077075660228729, 0.11575212329626083, 0.13073348999023438, 0.14571484923362732, 0.16069620847702026, 0.1756775677204132, 0.19065894186496735, 0.2056403011083603, 0.22062166035175323, 0.23560303449630737, 0.25058436393737793, 0.2655657231807709, 0.2805470824241638, 0.29552844166755676, 0.3105098009109497, 0.32549118995666504, 0.3404725193977356, 0.3554539084434509, 0.37043526768684387, 0.3854166269302368, 0.40039798617362976, 0.4153793454170227, 0.43036070466041565, 0.4453420639038086, 0.4603234529495239, 0.47530481219291687, 0.4902861714363098]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 11.0, 3.0, 10.0, 8.0, 11.0, 16.0, 13.0, 12.0, 31.0, 32.0, 18.0, 32.0, 33.0, 38.0, 42.0, 39.0, 37.0, 47.0, 49.0, 55.0, 46.0, 49.0, 56.0, 43.0, 41.0, 43.0, 31.0, 23.0, 17.0, 20.0, 12.0, 18.0, 20.0, 13.0, 12.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.77734375, -0.7553939819335938, -0.7334442138671875, -0.7114944458007812, -0.689544677734375, -0.6675949096679688, -0.6456451416015625, -0.6236953735351562, -0.60174560546875, -0.5797958374023438, -0.5578460693359375, -0.5358963012695312, -0.513946533203125, -0.49199676513671875, -0.4700469970703125, -0.44809722900390625, -0.4261474609375, -0.40419769287109375, -0.3822479248046875, -0.36029815673828125, -0.338348388671875, -0.31639862060546875, -0.2944488525390625, -0.27249908447265625, -0.25054931640625, -0.22859954833984375, -0.2066497802734375, -0.18470001220703125, -0.162750244140625, -0.14080047607421875, -0.1188507080078125, -0.09690093994140625, -0.074951171875, -0.05300140380859375, -0.0310516357421875, -0.00910186767578125, 0.012847900390625, 0.03479766845703125, 0.0567474365234375, 0.07869720458984375, 0.10064697265625, 0.12259674072265625, 0.1445465087890625, 0.16649627685546875, 0.188446044921875, 0.21039581298828125, 0.2323455810546875, 0.25429534912109375, 0.2762451171875, 0.29819488525390625, 0.3201446533203125, 0.34209442138671875, 0.364044189453125, 0.38599395751953125, 0.4079437255859375, 0.42989349365234375, 0.45184326171875, 0.47379302978515625, 0.4957427978515625, 0.5176925659179688, 0.539642333984375, 0.5615921020507812, 0.5835418701171875, 0.6054916381835938, 0.62744140625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 22.0, 23.0, 42.0, 41.0, 63.0, 109.0, 122.0, 219.0, 336.0, 496.0, 756.0, 1183.0, 2094.0, 3478.0, 5824.0, 10793.0, 20451.0, 42165.0, 94178.0, 211628.0, 315258.0, 181151.0, 80677.0, 36428.0, 18022.0, 9609.0, 5262.0, 3079.0, 1811.0, 1094.0, 727.0, 474.0, 304.0, 197.0, 136.0, 91.0, 58.0, 26.0, 32.0, 27.0, 18.0, 11.0, 11.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.861328125, -1.80560302734375, -1.7498779296875, -1.69415283203125, -1.638427734375, -1.58270263671875, -1.5269775390625, -1.47125244140625, -1.41552734375, -1.35980224609375, -1.3040771484375, -1.24835205078125, -1.192626953125, -1.13690185546875, -1.0811767578125, -1.02545166015625, -0.9697265625, -0.91400146484375, -0.8582763671875, -0.80255126953125, -0.746826171875, -0.69110107421875, -0.6353759765625, -0.57965087890625, -0.52392578125, -0.46820068359375, -0.4124755859375, -0.35675048828125, -0.301025390625, -0.24530029296875, -0.1895751953125, -0.13385009765625, -0.078125, -0.02239990234375, 0.0333251953125, 0.08905029296875, 0.144775390625, 0.20050048828125, 0.2562255859375, 0.31195068359375, 0.36767578125, 0.42340087890625, 0.4791259765625, 0.53485107421875, 0.590576171875, 0.64630126953125, 0.7020263671875, 0.75775146484375, 0.8134765625, 0.86920166015625, 0.9249267578125, 0.98065185546875, 1.036376953125, 1.09210205078125, 1.1478271484375, 1.20355224609375, 1.25927734375, 1.31500244140625, 1.3707275390625, 1.42645263671875, 1.482177734375, 1.53790283203125, 1.5936279296875, 1.64935302734375, 1.705078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 6.0, 5.0, 6.0, 21.0, 25.0, 34.0, 38.0, 39.0, 64.0, 84.0, 119.0, 222.0, 866.0, 842.0, 209.0, 126.0, 86.0, 65.0, 46.0, 39.0, 37.0, 28.0, 16.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.625, -3.5, -3.375, -3.25, -3.125, -3.0, -2.875, -2.75, -2.625, -2.5, -2.375, -2.25, -2.125, -2.0, -1.875, -1.75, -1.625, -1.5, -1.375, -1.25, -1.125, -1.0, -0.875, -0.75, -0.625, -0.5, -0.375, -0.25, -0.125, 0.0, 0.125, 0.25, 0.375, 0.5, 0.625, 0.75, 0.875, 1.0, 1.125, 1.25, 1.375, 1.5, 1.625, 1.75, 1.875, 2.0, 2.125, 2.25, 2.375, 2.5, 2.625, 2.75, 2.875, 3.0, 3.125, 3.25, 3.375, 3.5, 3.625, 3.75, 3.875, 4.0, 4.125, 4.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 4.0, 10.0, 10.0, 7.0, 28.0, 30.0, 43.0, 58.0, 94.0, 156.0, 312.0, 485.0, 925.0, 1694.0, 4049.0, 11945.0, 79239.0, 2364643.0, 636204.0, 32461.0, 7375.0, 2822.0, 1386.0, 721.0, 369.0, 225.0, 141.0, 82.0, 57.0, 37.0, 24.0, 22.0, 7.0, 11.0, 8.0, 4.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0625, -7.80078125, -7.5390625, -7.27734375, -7.015625, -6.75390625, -6.4921875, -6.23046875, -5.96875, -5.70703125, -5.4453125, -5.18359375, -4.921875, -4.66015625, -4.3984375, -4.13671875, -3.875, -3.61328125, -3.3515625, -3.08984375, -2.828125, -2.56640625, -2.3046875, -2.04296875, -1.78125, -1.51953125, -1.2578125, -0.99609375, -0.734375, -0.47265625, -0.2109375, 0.05078125, 0.3125, 0.57421875, 0.8359375, 1.09765625, 1.359375, 1.62109375, 1.8828125, 2.14453125, 2.40625, 2.66796875, 2.9296875, 3.19140625, 3.453125, 3.71484375, 3.9765625, 4.23828125, 4.5, 4.76171875, 5.0234375, 5.28515625, 5.546875, 5.80859375, 6.0703125, 6.33203125, 6.59375, 6.85546875, 7.1171875, 7.37890625, 7.640625, 7.90234375, 8.1640625, 8.42578125, 8.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 53.0, 375.0, 507.0, 71.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.940403938293457, -10.264060020446777, -8.587717056274414, -6.911373138427734, -5.235029697418213, -3.5586862564086914, -1.8823423385620117, -0.20599937438964844, 1.4703445434570312, 3.1466879844665527, 4.823031425476074, 6.499375343322754, 8.175718307495117, 9.852062225341797, 11.528406143188477, 13.20474910736084, 14.88109302520752, 16.557435989379883, 18.233779907226562, 19.910123825073242, 21.586467742919922, 23.26280975341797, 24.93915557861328, 26.615497589111328, 28.291841506958008, 29.968185424804688, 31.644529342651367, 33.32087326049805, 34.997215270996094, 36.673561096191406, 38.34990310668945, 40.0262451171875, 41.70258712768555, 43.378929138183594, 45.055274963378906, 46.73161697387695, 48.407962799072266, 50.08430480957031, 51.760650634765625, 53.43699264526367, 55.11333465576172, 56.789676666259766, 58.46602249145508, 60.142364501953125, 61.81871032714844, 63.495052337646484, 65.17139434814453, 66.84774017333984, 68.52408599853516, 70.20043182373047, 71.87677001953125, 73.55311584472656, 75.22946166992188, 76.90580749511719, 78.58214569091797, 80.25849151611328, 81.93482971191406, 83.61117553710938, 85.28751373291016, 86.96385955810547, 88.64020538330078, 90.31654357910156, 91.99288940429688, 93.66923522949219, 95.3455810546875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 12.0, 9.0, 10.0, 8.0, 11.0, 9.0, 18.0, 18.0, 20.0, 31.0, 31.0, 31.0, 41.0, 34.0, 35.0, 42.0, 54.0, 40.0, 52.0, 51.0, 43.0, 48.0, 48.0, 32.0, 43.0, 34.0, 33.0, 32.0, 20.0, 20.0, 13.0, 12.0, 20.0, 13.0, 9.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101920127868652, -8.788911819458008, -8.475902557373047, -8.162894248962402, -7.8498854637146, -7.536876678466797, -7.223868370056152, -6.91085958480835, -6.597850799560547, -6.284842014312744, -5.971833229064941, -5.658824920654297, -5.345816135406494, -5.032807350158691, -4.719799041748047, -4.406790256500244, -4.093781471252441, -3.7807726860046387, -3.467764139175415, -3.1547555923461914, -2.8417468070983887, -2.528738021850586, -2.2157294750213623, -1.9027209281921387, -1.589712142944336, -1.2767034769058228, -0.9636948108673096, -0.6506861448287964, -0.3376774787902832, -0.02466881275177002, 0.28833985328674316, 0.6013484001159668, 0.9143571853637695, 1.2273658514022827, 1.540374517440796, 1.853383183479309, 2.1663918495178223, 2.479400634765625, 2.7924091815948486, 3.1054177284240723, 3.418426513671875, 3.7314352989196777, 4.0444440841674805, 4.357452392578125, 4.670461177825928, 4.9834699630737305, 5.296478271484375, 5.609487056732178, 5.9224958419799805, 6.235504627227783, 6.548513412475586, 6.8615217208862305, 7.174530506134033, 7.487539291381836, 7.8005475997924805, 8.113555908203125, 8.426565170288086, 8.73957347869873, 9.052582740783691, 9.365591049194336, 9.678600311279297, 9.991608619689941, 10.304616928100586, 10.617626190185547, 10.930634498596191]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 10.0, 10.0, 12.0, 17.0, 18.0, 19.0, 23.0, 25.0, 30.0, 29.0, 43.0, 37.0, 34.0, 39.0, 37.0, 46.0, 50.0, 38.0, 33.0, 65.0, 32.0, 38.0, 40.0, 28.0, 32.0, 36.0, 30.0, 20.0, 17.0, 16.0, 11.0, 18.0, 6.0, 11.0, 5.0, 3.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7250900268554688, -0.7016448974609375, -0.6781997680664062, -0.654754638671875, -0.6313095092773438, -0.6078643798828125, -0.5844192504882812, -0.56097412109375, -0.5375289916992188, -0.5140838623046875, -0.49063873291015625, -0.467193603515625, -0.44374847412109375, -0.4203033447265625, -0.39685821533203125, -0.3734130859375, -0.34996795654296875, -0.3265228271484375, -0.30307769775390625, -0.279632568359375, -0.25618743896484375, -0.2327423095703125, -0.20929718017578125, -0.18585205078125, -0.16240692138671875, -0.1389617919921875, -0.11551666259765625, -0.092071533203125, -0.06862640380859375, -0.0451812744140625, -0.02173614501953125, 0.001708984375, 0.02515411376953125, 0.0485992431640625, 0.07204437255859375, 0.095489501953125, 0.11893463134765625, 0.1423797607421875, 0.16582489013671875, 0.18927001953125, 0.21271514892578125, 0.2361602783203125, 0.25960540771484375, 0.283050537109375, 0.30649566650390625, 0.3299407958984375, 0.35338592529296875, 0.3768310546875, 0.40027618408203125, 0.4237213134765625, 0.44716644287109375, 0.470611572265625, 0.49405670166015625, 0.5175018310546875, 0.5409469604492188, 0.56439208984375, 0.5878372192382812, 0.6112823486328125, 0.6347274780273438, 0.658172607421875, 0.6816177368164062, 0.7050628662109375, 0.7285079956054688, 0.751953125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 23.0, 25.0, 35.0, 57.0, 96.0, 116.0, 181.0, 284.0, 495.0, 606.0, 1054.0, 1618.0, 2402.0, 3804.0, 6113.0, 9866.0, 17006.0, 31432.0, 63784.0, 167367.0, 812541.0, 2269823.0, 550536.0, 133501.0, 54398.0, 27436.0, 14985.0, 9047.0, 5436.0, 3512.0, 2340.0, 1412.0, 921.0, 675.0, 455.0, 283.0, 196.0, 121.0, 87.0, 69.0, 49.0, 26.0, 17.0, 14.0, 7.0, 10.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.6441497802734375, -1.590057373046875, -1.5359649658203125, -1.48187255859375, -1.4277801513671875, -1.373687744140625, -1.3195953369140625, -1.2655029296875, -1.2114105224609375, -1.157318115234375, -1.1032257080078125, -1.04913330078125, -0.9950408935546875, -0.940948486328125, -0.8868560791015625, -0.832763671875, -0.7786712646484375, -0.724578857421875, -0.6704864501953125, -0.61639404296875, -0.5623016357421875, -0.508209228515625, -0.4541168212890625, -0.4000244140625, -0.3459320068359375, -0.291839599609375, -0.2377471923828125, -0.18365478515625, -0.1295623779296875, -0.075469970703125, -0.0213775634765625, 0.03271484375, 0.0868072509765625, 0.140899658203125, 0.1949920654296875, 0.24908447265625, 0.3031768798828125, 0.357269287109375, 0.4113616943359375, 0.4654541015625, 0.5195465087890625, 0.573638916015625, 0.6277313232421875, 0.68182373046875, 0.7359161376953125, 0.790008544921875, 0.8441009521484375, 0.898193359375, 0.9522857666015625, 1.006378173828125, 1.0604705810546875, 1.11456298828125, 1.1686553955078125, 1.222747802734375, 1.2768402099609375, 1.3309326171875, 1.3850250244140625, 1.439117431640625, 1.4932098388671875, 1.54730224609375, 1.6013946533203125, 1.655487060546875, 1.7095794677734375, 1.763671875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 8.0, 15.0, 28.0, 38.0, 66.0, 104.0, 215.0, 418.0, 854.0, 1052.0, 537.0, 327.0, 169.0, 93.0, 58.0, 32.0, 19.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.18212890625, -3.0322265625, -2.88232421875, -2.732421875, -2.58251953125, -2.4326171875, -2.28271484375, -2.1328125, -1.98291015625, -1.8330078125, -1.68310546875, -1.533203125, -1.38330078125, -1.2333984375, -1.08349609375, -0.93359375, -0.78369140625, -0.6337890625, -0.48388671875, -0.333984375, -0.18408203125, -0.0341796875, 0.11572265625, 0.265625, 0.41552734375, 0.5654296875, 0.71533203125, 0.865234375, 1.01513671875, 1.1650390625, 1.31494140625, 1.46484375, 1.61474609375, 1.7646484375, 1.91455078125, 2.064453125, 2.21435546875, 2.3642578125, 2.51416015625, 2.6640625, 2.81396484375, 2.9638671875, 3.11376953125, 3.263671875, 3.41357421875, 3.5634765625, 3.71337890625, 3.86328125, 4.01318359375, 4.1630859375, 4.31298828125, 4.462890625, 4.61279296875, 4.7626953125, 4.91259765625, 5.0625, 5.21240234375, 5.3623046875, 5.51220703125, 5.662109375, 5.81201171875, 5.9619140625, 6.11181640625, 6.26171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 20.0, 25.0, 24.0, 45.0, 50.0, 85.0, 136.0, 207.0, 260.0, 534.0, 1127.0, 2912.0, 9388.0, 40953.0, 294113.0, 3348972.0, 426475.0, 51464.0, 11273.0, 3387.0, 1223.0, 593.0, 344.0, 198.0, 143.0, 105.0, 66.0, 45.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.55718994140625, -5.3214111328125, -5.08563232421875, -4.849853515625, -4.61407470703125, -4.3782958984375, -4.14251708984375, -3.90673828125, -3.67095947265625, -3.4351806640625, -3.19940185546875, -2.963623046875, -2.72784423828125, -2.4920654296875, -2.25628662109375, -2.0205078125, -1.78472900390625, -1.5489501953125, -1.31317138671875, -1.077392578125, -0.84161376953125, -0.6058349609375, -0.37005615234375, -0.13427734375, 0.10150146484375, 0.3372802734375, 0.57305908203125, 0.808837890625, 1.04461669921875, 1.2803955078125, 1.51617431640625, 1.751953125, 1.98773193359375, 2.2235107421875, 2.45928955078125, 2.695068359375, 2.93084716796875, 3.1666259765625, 3.40240478515625, 3.63818359375, 3.87396240234375, 4.1097412109375, 4.34552001953125, 4.581298828125, 4.81707763671875, 5.0528564453125, 5.28863525390625, 5.5244140625, 5.76019287109375, 5.9959716796875, 6.23175048828125, 6.467529296875, 6.70330810546875, 6.9390869140625, 7.17486572265625, 7.41064453125, 7.64642333984375, 7.8822021484375, 8.11798095703125, 8.353759765625, 8.58953857421875, 8.8253173828125, 9.06109619140625, 9.296875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 9.0, 3.0, 8.0, 18.0, 24.0, 24.0, 41.0, 44.0, 59.0, 80.0, 87.0, 130.0, 106.0, 87.0, 62.0, 60.0, 53.0, 32.0, 28.0, 14.0, 13.0, 9.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.659172058105469, -15.299201011657715, -14.939230918884277, -14.579259872436523, -14.219289779663086, -13.859318733215332, -13.499347686767578, -13.13937759399414, -12.779406547546387, -12.419435501098633, -12.059465408325195, -11.699494361877441, -11.339523315429688, -10.97955322265625, -10.619582176208496, -10.259611129760742, -9.899641036987305, -9.53966999053955, -9.179699897766113, -8.81972885131836, -8.459758758544922, -8.099787712097168, -7.739816665649414, -7.379846096038818, -7.019875526428223, -6.659904956817627, -6.299934387207031, -5.939963340759277, -5.579992771148682, -5.220022201538086, -4.860051155090332, -4.500080585479736, -4.140110015869141, -3.780139446258545, -3.42016863822937, -3.0601978302001953, -2.7002272605895996, -2.340256690979004, -1.980285882949829, -1.6203150749206543, -1.2603445053100586, -0.9003738164901733, -0.5404031276702881, -0.18043243885040283, 0.17953824996948242, 0.5395089387893677, 0.8994796276092529, 1.2594504356384277, 1.6194210052490234, 1.9793916940689087, 2.339362382888794, 2.6993331909179688, 3.0593037605285645, 3.41927433013916, 3.779245138168335, 4.13921594619751, 4.4991865158081055, 4.859157085418701, 5.219127655029297, 5.579098701477051, 5.9390692710876465, 6.299039840698242, 6.659010887145996, 7.018981456756592, 7.3789520263671875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 9.0, 5.0, 9.0, 13.0, 13.0, 16.0, 18.0, 20.0, 22.0, 26.0, 38.0, 29.0, 30.0, 32.0, 33.0, 35.0, 40.0, 38.0, 42.0, 55.0, 43.0, 33.0, 47.0, 42.0, 40.0, 35.0, 31.0, 25.0, 20.0, 27.0, 17.0, 19.0, 17.0, 17.0, 10.0, 14.0, 9.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.366325378417969, -9.082765579223633, -8.79920482635498, -8.515645027160645, -8.232085227966309, -7.948524475097656, -7.66496467590332, -7.381404399871826, -7.097844123840332, -6.814283847808838, -6.530724048614502, -6.247163772583008, -5.963603496551514, -5.6800432205200195, -5.396483421325684, -5.1129231452941895, -4.8293633460998535, -4.545803070068359, -4.262243270874023, -3.9786829948425293, -3.695122718811035, -3.41156268119812, -3.128002643585205, -2.844442367553711, -2.560882329940796, -2.277322292327881, -1.9937620162963867, -1.7102019786834717, -1.426641821861267, -1.1430816650390625, -0.8595216274261475, -0.5759614706039429, -0.2924013137817383, -0.008841186761856079, 0.2747189402580261, 0.5582790374755859, 0.8418391942977905, 1.1253993511199951, 1.4089593887329102, 1.6925195455551147, 1.9760797023773193, 2.2596397399902344, 2.5432000160217285, 2.8267600536346436, 3.1103200912475586, 3.3938803672790527, 3.6774404048919678, 3.961000442504883, 4.244560718536377, 4.528120994567871, 4.811680793762207, 5.095241069793701, 5.378801345825195, 5.662361145019531, 5.945921421051025, 6.2294816970825195, 6.5130414962768555, 6.79660177230835, 7.0801615715026855, 7.36372184753418, 7.647282123565674, 7.930842399597168, 8.214402198791504, 8.49796199798584, 8.781522750854492]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 11.0, 16.0, 19.0, 22.0, 21.0, 16.0, 35.0, 38.0, 37.0, 30.0, 33.0, 34.0, 40.0, 50.0, 49.0, 52.0, 50.0, 38.0, 39.0, 46.0, 35.0, 34.0, 31.0, 18.0, 32.0, 25.0, 19.0, 24.0, 13.0, 16.0, 10.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7509765625, -0.726806640625, -0.70263671875, -0.678466796875, -0.654296875, -0.630126953125, -0.60595703125, -0.581787109375, -0.5576171875, -0.533447265625, -0.50927734375, -0.485107421875, -0.4609375, -0.436767578125, -0.41259765625, -0.388427734375, -0.3642578125, -0.340087890625, -0.31591796875, -0.291748046875, -0.267578125, -0.243408203125, -0.21923828125, -0.195068359375, -0.1708984375, -0.146728515625, -0.12255859375, -0.098388671875, -0.07421875, -0.050048828125, -0.02587890625, -0.001708984375, 0.0224609375, 0.046630859375, 0.07080078125, 0.094970703125, 0.119140625, 0.143310546875, 0.16748046875, 0.191650390625, 0.2158203125, 0.239990234375, 0.26416015625, 0.288330078125, 0.3125, 0.336669921875, 0.36083984375, 0.385009765625, 0.4091796875, 0.433349609375, 0.45751953125, 0.481689453125, 0.505859375, 0.530029296875, 0.55419921875, 0.578369140625, 0.6025390625, 0.626708984375, 0.65087890625, 0.675048828125, 0.69921875, 0.723388671875, 0.74755859375, 0.771728515625, 0.7958984375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 17.0, 25.0, 29.0, 56.0, 82.0, 136.0, 163.0, 258.0, 364.0, 537.0, 760.0, 1026.0, 1492.0, 2322.0, 3281.0, 4664.0, 6876.0, 10158.0, 14604.0, 21760.0, 32012.0, 46455.0, 66102.0, 89496.0, 112905.0, 130327.0, 125596.0, 105952.0, 81271.0, 59616.0, 41478.0, 28299.0, 19310.0, 12773.0, 8924.0, 6065.0, 4152.0, 2812.0, 2024.0, 1361.0, 872.0, 654.0, 479.0, 319.0, 228.0, 156.0, 109.0, 73.0, 39.0, 27.0, 19.0, 14.0, 9.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.56494140625, -0.5477371215820312, -0.5305328369140625, -0.5133285522460938, -0.496124267578125, -0.47891998291015625, -0.4617156982421875, -0.44451141357421875, -0.42730712890625, -0.41010284423828125, -0.3928985595703125, -0.37569427490234375, -0.358489990234375, -0.34128570556640625, -0.3240814208984375, -0.30687713623046875, -0.2896728515625, -0.27246856689453125, -0.2552642822265625, -0.23805999755859375, -0.220855712890625, -0.20365142822265625, -0.1864471435546875, -0.16924285888671875, -0.15203857421875, -0.13483428955078125, -0.1176300048828125, -0.10042572021484375, -0.083221435546875, -0.06601715087890625, -0.0488128662109375, -0.03160858154296875, -0.014404296875, 0.00279998779296875, 0.0200042724609375, 0.03720855712890625, 0.054412841796875, 0.07161712646484375, 0.0888214111328125, 0.10602569580078125, 0.12322998046875, 0.14043426513671875, 0.1576385498046875, 0.17484283447265625, 0.192047119140625, 0.20925140380859375, 0.2264556884765625, 0.24365997314453125, 0.2608642578125, 0.27806854248046875, 0.2952728271484375, 0.31247711181640625, 0.329681396484375, 0.34688568115234375, 0.3640899658203125, 0.38129425048828125, 0.39849853515625, 0.41570281982421875, 0.4329071044921875, 0.45011138916015625, 0.467315673828125, 0.48451995849609375, 0.5017242431640625, 0.5189285278320312, 0.5361328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 12.0, 5.0, 3.0, 12.0, 11.0, 11.0, 19.0, 12.0, 12.0, 25.0, 23.0, 25.0, 27.0, 31.0, 36.0, 34.0, 34.0, 39.0, 47.0, 44.0, 1067.0, 33.0, 42.0, 36.0, 34.0, 31.0, 39.0, 44.0, 40.0, 26.0, 25.0, 21.0, 35.0, 14.0, 14.0, 11.0, 10.0, 7.0, 4.0, 7.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7138671875, -0.6908111572265625, -0.667755126953125, -0.6446990966796875, -0.62164306640625, -0.5985870361328125, -0.575531005859375, -0.5524749755859375, -0.5294189453125, -0.5063629150390625, -0.483306884765625, -0.4602508544921875, -0.43719482421875, -0.4141387939453125, -0.391082763671875, -0.3680267333984375, -0.344970703125, -0.3219146728515625, -0.298858642578125, -0.2758026123046875, -0.25274658203125, -0.2296905517578125, -0.206634521484375, -0.1835784912109375, -0.1605224609375, -0.1374664306640625, -0.114410400390625, -0.0913543701171875, -0.06829833984375, -0.0452423095703125, -0.022186279296875, 0.0008697509765625, 0.02392578125, 0.0469818115234375, 0.070037841796875, 0.0930938720703125, 0.11614990234375, 0.1392059326171875, 0.162261962890625, 0.1853179931640625, 0.2083740234375, 0.2314300537109375, 0.254486083984375, 0.2775421142578125, 0.30059814453125, 0.3236541748046875, 0.346710205078125, 0.3697662353515625, 0.392822265625, 0.4158782958984375, 0.438934326171875, 0.4619903564453125, 0.48504638671875, 0.5081024169921875, 0.531158447265625, 0.5542144775390625, 0.5772705078125, 0.6003265380859375, 0.623382568359375, 0.6464385986328125, 0.66949462890625, 0.6925506591796875, 0.715606689453125, 0.7386627197265625, 0.76171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 12.0, 10.0, 23.0, 28.0, 63.0, 58.0, 96.0, 131.0, 224.0, 309.0, 515.0, 672.0, 1075.0, 1639.0, 2355.0, 3661.0, 5358.0, 8275.0, 13067.0, 22011.0, 47711.0, 259574.0, 1510294.0, 132842.0, 35779.0, 18520.0, 11449.0, 7214.0, 4671.0, 3221.0, 2039.0, 1405.0, 909.0, 634.0, 401.0, 288.0, 215.0, 127.0, 78.0, 63.0, 29.0, 29.0, 19.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6856231689453125, -0.662261962890625, -0.6389007568359375, -0.61553955078125, -0.5921783447265625, -0.568817138671875, -0.5454559326171875, -0.5220947265625, -0.4987335205078125, -0.475372314453125, -0.4520111083984375, -0.42864990234375, -0.4052886962890625, -0.381927490234375, -0.3585662841796875, -0.335205078125, -0.3118438720703125, -0.288482666015625, -0.2651214599609375, -0.24176025390625, -0.2183990478515625, -0.195037841796875, -0.1716766357421875, -0.1483154296875, -0.1249542236328125, -0.101593017578125, -0.0782318115234375, -0.05487060546875, -0.0315093994140625, -0.008148193359375, 0.0152130126953125, 0.03857421875, 0.0619354248046875, 0.085296630859375, 0.1086578369140625, 0.13201904296875, 0.1553802490234375, 0.178741455078125, 0.2021026611328125, 0.2254638671875, 0.2488250732421875, 0.272186279296875, 0.2955474853515625, 0.31890869140625, 0.3422698974609375, 0.365631103515625, 0.3889923095703125, 0.412353515625, 0.4357147216796875, 0.459075927734375, 0.4824371337890625, 0.50579833984375, 0.5291595458984375, 0.552520751953125, 0.5758819580078125, 0.5992431640625, 0.6226043701171875, 0.645965576171875, 0.6693267822265625, 0.69268798828125, 0.7160491943359375, 0.739410400390625, 0.7627716064453125, 0.7861328125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 12.0, 6.0, 17.0, 15.0, 16.0, 19.0, 39.0, 33.0, 43.0, 53.0, 73.0, 90.0, 85.0, 93.0, 73.0, 62.0, 60.0, 48.0, 39.0, 18.0, 16.0, 11.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14349937438964844, -0.13831710815429688, -0.1331348419189453, -0.12795257568359375, -0.12277030944824219, -0.11758804321289062, -0.11240577697753906, -0.1072235107421875, -0.10204124450683594, -0.09685897827148438, -0.09167671203613281, -0.08649444580078125, -0.08131217956542969, -0.07612991333007812, -0.07094764709472656, -0.065765380859375, -0.06058311462402344, -0.055400848388671875, -0.05021858215332031, -0.04503631591796875, -0.03985404968261719, -0.034671783447265625, -0.029489517211914062, -0.0243072509765625, -0.019124984741210938, -0.013942718505859375, -0.008760452270507812, -0.00357818603515625, 0.0016040802001953125, 0.006786346435546875, 0.011968612670898438, 0.01715087890625, 0.022333145141601562, 0.027515411376953125, 0.03269767761230469, 0.03787994384765625, 0.04306221008300781, 0.048244476318359375, 0.05342674255371094, 0.0586090087890625, 0.06379127502441406, 0.06897354125976562, 0.07415580749511719, 0.07933807373046875, 0.08452033996582031, 0.08970260620117188, 0.09488487243652344, 0.100067138671875, 0.10524940490722656, 0.11043167114257812, 0.11561393737792969, 0.12079620361328125, 0.1259784698486328, 0.13116073608398438, 0.13634300231933594, 0.1415252685546875, 0.14670753479003906, 0.15188980102539062, 0.1570720672607422, 0.16225433349609375, 0.1674365997314453, 0.17261886596679688, 0.17780113220214844, 0.1829833984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 8.0, 6.0, 14.0, 10.0, 18.0, 27.0, 31.0, 43.0, 58.0, 60.0, 95.0, 121.0, 171.0, 354.0, 1555.0, 12829.0, 849159.0, 176536.0, 5651.0, 878.0, 262.0, 157.0, 129.0, 82.0, 46.0, 41.0, 43.0, 26.0, 28.0, 11.0, 19.0, 15.0, 8.0, 6.0, 5.0, 10.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.53515625, -2.45794677734375, -2.3807373046875, -2.30352783203125, -2.226318359375, -2.14910888671875, -2.0718994140625, -1.99468994140625, -1.91748046875, -1.84027099609375, -1.7630615234375, -1.68585205078125, -1.608642578125, -1.53143310546875, -1.4542236328125, -1.37701416015625, -1.2998046875, -1.22259521484375, -1.1453857421875, -1.06817626953125, -0.990966796875, -0.91375732421875, -0.8365478515625, -0.75933837890625, -0.68212890625, -0.60491943359375, -0.5277099609375, -0.45050048828125, -0.373291015625, -0.29608154296875, -0.2188720703125, -0.14166259765625, -0.064453125, 0.01275634765625, 0.0899658203125, 0.16717529296875, 0.244384765625, 0.32159423828125, 0.3988037109375, 0.47601318359375, 0.55322265625, 0.63043212890625, 0.7076416015625, 0.78485107421875, 0.862060546875, 0.93927001953125, 1.0164794921875, 1.09368896484375, 1.1708984375, 1.24810791015625, 1.3253173828125, 1.40252685546875, 1.479736328125, 1.55694580078125, 1.6341552734375, 1.71136474609375, 1.78857421875, 1.86578369140625, 1.9429931640625, 2.02020263671875, 2.097412109375, 2.17462158203125, 2.2518310546875, 2.32904052734375, 2.40625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 13.0, 22.0, 69.0, 168.0, 420.0, 187.0, 70.0, 34.0, 15.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123091459274292, -3.029902696609497, -2.936713933944702, -2.8435251712799072, -2.750336170196533, -2.6571474075317383, -2.5639586448669434, -2.4707698822021484, -2.3775811195373535, -2.2843923568725586, -2.1912035942077637, -2.0980148315429688, -2.004826068878174, -1.9116371870040894, -1.8184483051300049, -1.72525954246521, -1.632070779800415, -1.5388820171356201, -1.4456932544708252, -1.3525043725967407, -1.2593156099319458, -1.1661268472671509, -1.0729379653930664, -0.9797492027282715, -0.8865604400634766, -0.7933716773986816, -0.7001828551292419, -0.6069940328598022, -0.5138052701950073, -0.42061647772789, -0.3274276852607727, -0.234238862991333, -0.1410503387451172, -0.04786154627799988, 0.04532724618911743, 0.13851603865623474, 0.23170483112335205, 0.32489362359046936, 0.41808241605758667, 0.5112712383270264, 0.6044600009918213, 0.6976487636566162, 0.7908375859260559, 0.8840264081954956, 0.9772151708602905, 1.0704039335250854, 1.16359281539917, 1.2567815780639648, 1.3499703407287598, 1.4431591033935547, 1.5363478660583496, 1.629536747932434, 1.722725510597229, 1.815914273262024, 1.9091031551361084, 2.0022919178009033, 2.0954806804656982, 2.188669443130493, 2.281858205795288, 2.375046968460083, 2.468235969543457, 2.561424732208252, 2.654613494873047, 2.747802257537842, 2.8409910202026367]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 3.0, 9.0, 14.0, 12.0, 21.0, 28.0, 27.0, 50.0, 31.0, 42.0, 47.0, 48.0, 66.0, 46.0, 59.0, 76.0, 54.0, 49.0, 42.0, 48.0, 40.0, 36.0, 28.0, 23.0, 17.0, 18.0, 20.0, 13.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.011688232421875, -0.9810954928398132, -0.9505027532577515, -0.9199100136756897, -0.8893172740936279, -0.8587245345115662, -0.8281317949295044, -0.7975390553474426, -0.7669463157653809, -0.7363535761833191, -0.7057608366012573, -0.6751680970191956, -0.6445753574371338, -0.613982617855072, -0.5833898782730103, -0.5527971386909485, -0.5222043991088867, -0.49161165952682495, -0.4610189199447632, -0.4304261803627014, -0.39983344078063965, -0.3692407011985779, -0.3386479616165161, -0.30805522203445435, -0.2774624228477478, -0.24686968326568604, -0.21627694368362427, -0.1856842041015625, -0.15509146451950073, -0.12449871003627777, -0.093905970454216, -0.06331323087215424, -0.03272050619125366, -0.0021277647465467453, 0.02846497669816017, 0.05905772000551224, 0.089650459587574, 0.12024320662021637, 0.15083594620227814, 0.1814286857843399, 0.21202142536640167, 0.24261416494846344, 0.2732069194316864, 0.30379965901374817, 0.33439239859580994, 0.3649851381778717, 0.39557787775993347, 0.42617061734199524, 0.456763356924057, 0.4873560965061188, 0.5179488658905029, 0.5485416054725647, 0.5791343450546265, 0.6097270846366882, 0.64031982421875, 0.6709125638008118, 0.7015053033828735, 0.7320980429649353, 0.7626907825469971, 0.7932835221290588, 0.8238762617111206, 0.8544690012931824, 0.8850617408752441, 0.9156544804573059, 0.9462472200393677]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 11.0, 10.0, 10.0, 8.0, 19.0, 22.0, 25.0, 20.0, 18.0, 29.0, 28.0, 29.0, 37.0, 39.0, 43.0, 45.0, 44.0, 36.0, 41.0, 56.0, 38.0, 46.0, 29.0, 32.0, 32.0, 27.0, 30.0, 31.0, 30.0, 22.0, 15.0, 22.0, 17.0, 8.0, 8.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.728515625, -0.7051010131835938, -0.6816864013671875, -0.6582717895507812, -0.634857177734375, -0.6114425659179688, -0.5880279541015625, -0.5646133422851562, -0.54119873046875, -0.5177841186523438, -0.4943695068359375, -0.47095489501953125, -0.447540283203125, -0.42412567138671875, -0.4007110595703125, -0.37729644775390625, -0.3538818359375, -0.33046722412109375, -0.3070526123046875, -0.28363800048828125, -0.260223388671875, -0.23680877685546875, -0.2133941650390625, -0.18997955322265625, -0.16656494140625, -0.14315032958984375, -0.1197357177734375, -0.09632110595703125, -0.072906494140625, -0.04949188232421875, -0.0260772705078125, -0.00266265869140625, 0.020751953125, 0.04416656494140625, 0.0675811767578125, 0.09099578857421875, 0.114410400390625, 0.13782501220703125, 0.1612396240234375, 0.18465423583984375, 0.20806884765625, 0.23148345947265625, 0.2548980712890625, 0.27831268310546875, 0.301727294921875, 0.32514190673828125, 0.3485565185546875, 0.37197113037109375, 0.3953857421875, 0.41880035400390625, 0.4422149658203125, 0.46562957763671875, 0.489044189453125, 0.5124588012695312, 0.5358734130859375, 0.5592880249023438, 0.58270263671875, 0.6061172485351562, 0.6295318603515625, 0.6529464721679688, 0.676361083984375, 0.6997756958007812, 0.7231903076171875, 0.7466049194335938, 0.77001953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 7.0, 15.0, 29.0, 43.0, 55.0, 72.0, 112.0, 129.0, 185.0, 274.0, 443.0, 622.0, 1015.0, 1688.0, 2751.0, 4800.0, 8589.0, 15805.0, 31266.0, 64796.0, 134919.0, 241006.0, 251144.0, 145474.0, 70452.0, 34012.0, 16913.0, 8908.0, 5084.0, 2884.0, 1742.0, 1119.0, 696.0, 486.0, 325.0, 202.0, 161.0, 111.0, 82.0, 32.0, 28.0, 16.0, 13.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.833038330078125, -0.80621337890625, -0.779388427734375, -0.7525634765625, -0.725738525390625, -0.69891357421875, -0.672088623046875, -0.645263671875, -0.618438720703125, -0.59161376953125, -0.564788818359375, -0.5379638671875, -0.511138916015625, -0.48431396484375, -0.457489013671875, -0.4306640625, -0.403839111328125, -0.37701416015625, -0.350189208984375, -0.3233642578125, -0.296539306640625, -0.26971435546875, -0.242889404296875, -0.216064453125, -0.189239501953125, -0.16241455078125, -0.135589599609375, -0.1087646484375, -0.081939697265625, -0.05511474609375, -0.028289794921875, -0.00146484375, 0.025360107421875, 0.05218505859375, 0.079010009765625, 0.1058349609375, 0.132659912109375, 0.15948486328125, 0.186309814453125, 0.213134765625, 0.239959716796875, 0.26678466796875, 0.293609619140625, 0.3204345703125, 0.347259521484375, 0.37408447265625, 0.400909423828125, 0.427734375, 0.454559326171875, 0.48138427734375, 0.508209228515625, 0.5350341796875, 0.561859130859375, 0.58868408203125, 0.615509033203125, 0.642333984375, 0.669158935546875, 0.69598388671875, 0.722808837890625, 0.7496337890625, 0.776458740234375, 0.80328369140625, 0.830108642578125, 0.85693359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 12.0, 9.0, 10.0, 3.0, 13.0, 19.0, 16.0, 29.0, 18.0, 35.0, 35.0, 31.0, 48.0, 47.0, 62.0, 77.0, 118.0, 237.0, 1343.0, 278.0, 124.0, 75.0, 60.0, 48.0, 39.0, 43.0, 36.0, 32.0, 24.0, 23.0, 17.0, 21.0, 12.0, 11.0, 13.0, 8.0, 2.0, 6.0, 2.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.928375244140625, -2.82940673828125, -2.730438232421875, -2.6314697265625, -2.532501220703125, -2.43353271484375, -2.334564208984375, -2.235595703125, -2.136627197265625, -2.03765869140625, -1.938690185546875, -1.8397216796875, -1.740753173828125, -1.64178466796875, -1.542816162109375, -1.44384765625, -1.344879150390625, -1.24591064453125, -1.146942138671875, -1.0479736328125, -0.949005126953125, -0.85003662109375, -0.751068115234375, -0.652099609375, -0.553131103515625, -0.45416259765625, -0.355194091796875, -0.2562255859375, -0.157257080078125, -0.05828857421875, 0.040679931640625, 0.1396484375, 0.238616943359375, 0.33758544921875, 0.436553955078125, 0.5355224609375, 0.634490966796875, 0.73345947265625, 0.832427978515625, 0.931396484375, 1.030364990234375, 1.12933349609375, 1.228302001953125, 1.3272705078125, 1.426239013671875, 1.52520751953125, 1.624176025390625, 1.72314453125, 1.822113037109375, 1.92108154296875, 2.020050048828125, 2.1190185546875, 2.217987060546875, 2.31695556640625, 2.415924072265625, 2.514892578125, 2.613861083984375, 2.71282958984375, 2.811798095703125, 2.9107666015625, 3.009735107421875, 3.10870361328125, 3.207672119140625, 3.306640625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 14.0, 20.0, 37.0, 48.0, 75.0, 97.0, 124.0, 182.0, 260.0, 421.0, 584.0, 880.0, 1239.0, 1890.0, 2877.0, 4601.0, 8254.0, 19370.0, 106836.0, 2439924.0, 494116.0, 35411.0, 11747.0, 5978.0, 3565.0, 2277.0, 1501.0, 1047.0, 741.0, 475.0, 336.0, 209.0, 151.0, 114.0, 92.0, 55.0, 42.0, 24.0, 21.0, 12.0, 10.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.33984375, -5.17669677734375, -5.0135498046875, -4.85040283203125, -4.687255859375, -4.52410888671875, -4.3609619140625, -4.19781494140625, -4.03466796875, -3.87152099609375, -3.7083740234375, -3.54522705078125, -3.382080078125, -3.21893310546875, -3.0557861328125, -2.89263916015625, -2.7294921875, -2.56634521484375, -2.4031982421875, -2.24005126953125, -2.076904296875, -1.91375732421875, -1.7506103515625, -1.58746337890625, -1.42431640625, -1.26116943359375, -1.0980224609375, -0.93487548828125, -0.771728515625, -0.60858154296875, -0.4454345703125, -0.28228759765625, -0.119140625, 0.04400634765625, 0.2071533203125, 0.37030029296875, 0.533447265625, 0.69659423828125, 0.8597412109375, 1.02288818359375, 1.18603515625, 1.34918212890625, 1.5123291015625, 1.67547607421875, 1.838623046875, 2.00177001953125, 2.1649169921875, 2.32806396484375, 2.4912109375, 2.65435791015625, 2.8175048828125, 2.98065185546875, 3.143798828125, 3.30694580078125, 3.4700927734375, 3.63323974609375, 3.79638671875, 3.95953369140625, 4.1226806640625, 4.28582763671875, 4.448974609375, 4.61212158203125, 4.7752685546875, 4.93841552734375, 5.1015625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 11.0, 25.0, 34.0, 92.0, 186.0, 277.0, 207.0, 105.0, 46.0, 17.0, 6.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.837425231933594, -10.219122886657715, -9.600820541381836, -8.98251724243164, -8.364214897155762, -7.745912551879883, -7.127609729766846, -6.509306907653809, -5.89100456237793, -5.272702217102051, -4.654399394989014, -4.036096572875977, -3.4177942276000977, -2.7994916439056396, -2.1811890602111816, -1.5628862380981445, -0.9445838928222656, -0.3262813091278076, 0.2920212745666504, 0.9103238582611084, 1.5286264419555664, 2.1469290256500244, 2.7652316093444824, 3.3835344314575195, 4.001836776733398, 4.620139122009277, 5.2384419441223145, 5.856744766235352, 6.4750471115112305, 7.093349456787109, 7.7116522789001465, 8.329955101013184, 8.94825553894043, 9.566557884216309, 10.184860229492188, 10.803163528442383, 11.421465873718262, 12.03976821899414, 12.658071517944336, 13.276373863220215, 13.894676208496094, 14.512978553771973, 15.131280899047852, 15.749584197998047, 16.36788558959961, 16.986188888549805, 17.6044921875, 18.222793579101562, 18.841096878051758, 19.459400177001953, 20.077701568603516, 20.69600486755371, 21.314308166503906, 21.93260955810547, 22.550912857055664, 23.16921615600586, 23.787517547607422, 24.405820846557617, 25.02412223815918, 25.642425537109375, 26.260726928710938, 26.879030227661133, 27.497333526611328, 28.11563491821289, 28.733938217163086]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 9.0, 8.0, 7.0, 15.0, 8.0, 14.0, 16.0, 17.0, 26.0, 33.0, 29.0, 36.0, 33.0, 46.0, 39.0, 43.0, 47.0, 49.0, 42.0, 54.0, 45.0, 39.0, 45.0, 52.0, 31.0, 32.0, 19.0, 25.0, 23.0, 27.0, 24.0, 11.0, 13.0, 11.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.091780662536621, -10.756503105163574, -10.421225547790527, -10.08594799041748, -9.750670433044434, -9.415392875671387, -9.08011531829834, -8.744837760925293, -8.409560203552246, -8.0742826461792, -7.739005088806152, -7.4037275314331055, -7.068449974060059, -6.733172416687012, -6.397894859313965, -6.062617301940918, -5.727339744567871, -5.392062187194824, -5.056784629821777, -4.7215070724487305, -4.386229515075684, -4.050951957702637, -3.71567440032959, -3.380396842956543, -3.045119285583496, -2.709841728210449, -2.3745641708374023, -2.0392866134643555, -1.7040090560913086, -1.3687314987182617, -1.0334539413452148, -0.698176383972168, -0.3628978729248047, -0.027620315551757812, 0.30765724182128906, 0.6429347991943359, 0.9782123565673828, 1.3134899139404297, 1.6487674713134766, 1.9840450286865234, 2.3193225860595703, 2.654600143432617, 2.989877700805664, 3.325155258178711, 3.660432815551758, 3.9957103729248047, 4.330987930297852, 4.666265487670898, 5.001543045043945, 5.336820602416992, 5.672098159790039, 6.007375717163086, 6.342653274536133, 6.67793083190918, 7.013208389282227, 7.348485946655273, 7.68376350402832, 8.019041061401367, 8.354318618774414, 8.689596176147461, 9.024873733520508, 9.360151290893555, 9.695428848266602, 10.030706405639648, 10.365983963012695]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 9.0, 19.0, 20.0, 18.0, 23.0, 21.0, 18.0, 28.0, 26.0, 42.0, 41.0, 37.0, 36.0, 51.0, 36.0, 53.0, 41.0, 51.0, 46.0, 46.0, 27.0, 36.0, 35.0, 35.0, 31.0, 24.0, 22.0, 18.0, 13.0, 16.0, 10.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.84814453125, -0.8229598999023438, -0.7977752685546875, -0.7725906372070312, -0.747406005859375, -0.7222213745117188, -0.6970367431640625, -0.6718521118164062, -0.64666748046875, -0.6214828491210938, -0.5962982177734375, -0.5711135864257812, -0.545928955078125, -0.5207443237304688, -0.4955596923828125, -0.47037506103515625, -0.4451904296875, -0.42000579833984375, -0.3948211669921875, -0.36963653564453125, -0.344451904296875, -0.31926727294921875, -0.2940826416015625, -0.26889801025390625, -0.24371337890625, -0.21852874755859375, -0.1933441162109375, -0.16815948486328125, -0.142974853515625, -0.11779022216796875, -0.0926055908203125, -0.06742095947265625, -0.042236328125, -0.01705169677734375, 0.0081329345703125, 0.03331756591796875, 0.058502197265625, 0.08368682861328125, 0.1088714599609375, 0.13405609130859375, 0.15924072265625, 0.18442535400390625, 0.2096099853515625, 0.23479461669921875, 0.259979248046875, 0.28516387939453125, 0.3103485107421875, 0.33553314208984375, 0.3607177734375, 0.38590240478515625, 0.4110870361328125, 0.43627166748046875, 0.461456298828125, 0.48664093017578125, 0.5118255615234375, 0.5370101928710938, 0.56219482421875, 0.5873794555664062, 0.6125640869140625, 0.6377487182617188, 0.662933349609375, 0.6881179809570312, 0.7133026123046875, 0.7384872436523438, 0.763671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 12.0, 6.0, 11.0, 14.0, 21.0, 20.0, 37.0, 38.0, 56.0, 72.0, 106.0, 158.0, 215.0, 375.0, 646.0, 1144.0, 2439.0, 5458.0, 12773.0, 33926.0, 115156.0, 977435.0, 2678846.0, 269561.0, 59791.0, 20303.0, 8006.0, 3651.0, 1724.0, 868.0, 457.0, 277.0, 182.0, 126.0, 82.0, 61.0, 57.0, 35.0, 24.0, 14.0, 16.0, 10.0, 12.0, 13.0, 12.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.890625, -2.80621337890625, -2.7218017578125, -2.63739013671875, -2.552978515625, -2.46856689453125, -2.3841552734375, -2.29974365234375, -2.21533203125, -2.13092041015625, -2.0465087890625, -1.96209716796875, -1.877685546875, -1.79327392578125, -1.7088623046875, -1.62445068359375, -1.5400390625, -1.45562744140625, -1.3712158203125, -1.28680419921875, -1.202392578125, -1.11798095703125, -1.0335693359375, -0.94915771484375, -0.86474609375, -0.78033447265625, -0.6959228515625, -0.61151123046875, -0.527099609375, -0.44268798828125, -0.3582763671875, -0.27386474609375, -0.189453125, -0.10504150390625, -0.0206298828125, 0.06378173828125, 0.148193359375, 0.23260498046875, 0.3170166015625, 0.40142822265625, 0.48583984375, 0.57025146484375, 0.6546630859375, 0.73907470703125, 0.823486328125, 0.90789794921875, 0.9923095703125, 1.07672119140625, 1.1611328125, 1.24554443359375, 1.3299560546875, 1.41436767578125, 1.498779296875, 1.58319091796875, 1.6676025390625, 1.75201416015625, 1.83642578125, 1.92083740234375, 2.0052490234375, 2.08966064453125, 2.174072265625, 2.25848388671875, 2.3428955078125, 2.42730712890625, 2.51171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 14.0, 16.0, 17.0, 35.0, 36.0, 46.0, 64.0, 84.0, 142.0, 190.0, 325.0, 493.0, 664.0, 628.0, 433.0, 258.0, 181.0, 129.0, 84.0, 61.0, 44.0, 31.0, 34.0, 17.0, 13.0, 11.0, 4.0, 0.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.234466552734375, -2.13690185546875, -2.039337158203125, -1.9417724609375, -1.844207763671875, -1.74664306640625, -1.649078369140625, -1.551513671875, -1.453948974609375, -1.35638427734375, -1.258819580078125, -1.1612548828125, -1.063690185546875, -0.96612548828125, -0.868560791015625, -0.77099609375, -0.673431396484375, -0.57586669921875, -0.478302001953125, -0.3807373046875, -0.283172607421875, -0.18560791015625, -0.088043212890625, 0.009521484375, 0.107086181640625, 0.20465087890625, 0.302215576171875, 0.3997802734375, 0.497344970703125, 0.59490966796875, 0.692474365234375, 0.7900390625, 0.887603759765625, 0.98516845703125, 1.082733154296875, 1.1802978515625, 1.277862548828125, 1.37542724609375, 1.472991943359375, 1.570556640625, 1.668121337890625, 1.76568603515625, 1.863250732421875, 1.9608154296875, 2.058380126953125, 2.15594482421875, 2.253509521484375, 2.35107421875, 2.448638916015625, 2.54620361328125, 2.643768310546875, 2.7413330078125, 2.838897705078125, 2.93646240234375, 3.034027099609375, 3.131591796875, 3.229156494140625, 3.32672119140625, 3.424285888671875, 3.5218505859375, 3.619415283203125, 3.71697998046875, 3.814544677734375, 3.912109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 11.0, 17.0, 8.0, 15.0, 8.0, 17.0, 37.0, 50.0, 66.0, 130.0, 189.0, 305.0, 630.0, 1157.0, 2445.0, 5030.0, 11419.0, 28302.0, 79707.0, 298029.0, 2020611.0, 1412923.0, 225708.0, 64939.0, 23794.0, 9840.0, 4430.0, 2061.0, 1052.0, 535.0, 281.0, 177.0, 114.0, 51.0, 46.0, 36.0, 43.0, 23.0, 13.0, 5.0, 9.0, 3.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.02734375, -3.901123046875, -3.77490234375, -3.648681640625, -3.5224609375, -3.396240234375, -3.27001953125, -3.143798828125, -3.017578125, -2.891357421875, -2.76513671875, -2.638916015625, -2.5126953125, -2.386474609375, -2.26025390625, -2.134033203125, -2.0078125, -1.881591796875, -1.75537109375, -1.629150390625, -1.5029296875, -1.376708984375, -1.25048828125, -1.124267578125, -0.998046875, -0.871826171875, -0.74560546875, -0.619384765625, -0.4931640625, -0.366943359375, -0.24072265625, -0.114501953125, 0.01171875, 0.137939453125, 0.26416015625, 0.390380859375, 0.5166015625, 0.642822265625, 0.76904296875, 0.895263671875, 1.021484375, 1.147705078125, 1.27392578125, 1.400146484375, 1.5263671875, 1.652587890625, 1.77880859375, 1.905029296875, 2.03125, 2.157470703125, 2.28369140625, 2.409912109375, 2.5361328125, 2.662353515625, 2.78857421875, 2.914794921875, 3.041015625, 3.167236328125, 3.29345703125, 3.419677734375, 3.5458984375, 3.672119140625, 3.79833984375, 3.924560546875, 4.05078125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 9.0, 20.0, 44.0, 69.0, 99.0, 122.0, 145.0, 161.0, 114.0, 93.0, 56.0, 36.0, 13.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96290111541748, -15.368990898132324, -14.775080680847168, -14.181170463562012, -13.587259292602539, -12.993349075317383, -12.399438858032227, -11.80552864074707, -11.211618423461914, -10.617708206176758, -10.023797988891602, -9.429887771606445, -8.835977554321289, -8.242067337036133, -7.64815616607666, -7.054245948791504, -6.460335731506348, -5.866425514221191, -5.272515296936035, -4.678604602813721, -4.0846943855285645, -3.490784168243408, -2.896873712539673, -2.3029632568359375, -1.7090530395507812, -1.1151427030563354, -0.5212323665618896, 0.07267796993255615, 0.666588306427002, 1.2604985237121582, 1.8544089794158936, 2.448319435119629, 3.0422306060791016, 3.636140823364258, 4.230051040649414, 4.8239617347717285, 5.417871952056885, 6.011782169342041, 6.6056928634643555, 7.199603080749512, 7.793513298034668, 8.387423515319824, 8.98133373260498, 9.575243949890137, 10.16915512084961, 10.763065338134766, 11.356975555419922, 11.950885772705078, 12.544795989990234, 13.13870620727539, 13.732616424560547, 14.326526641845703, 14.92043685913086, 15.514347076416016, 16.108257293701172, 16.702167510986328, 17.296077728271484, 17.88998794555664, 18.483898162841797, 19.077808380126953, 19.67171859741211, 20.265628814697266, 20.859539031982422, 21.453449249267578, 22.047361373901367]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 7.0, 11.0, 5.0, 12.0, 16.0, 16.0, 13.0, 23.0, 24.0, 31.0, 34.0, 41.0, 35.0, 31.0, 38.0, 42.0, 46.0, 35.0, 37.0, 33.0, 42.0, 30.0, 49.0, 39.0, 26.0, 31.0, 32.0, 25.0, 31.0, 19.0, 23.0, 16.0, 24.0, 19.0, 9.0, 7.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.851471900939941, -6.5974884033203125, -6.343504428863525, -6.0895209312438965, -5.835537433624268, -5.5815534591674805, -5.327569961547852, -5.073586463928223, -4.819602966308594, -4.565619468688965, -4.311635494232178, -4.057651996612549, -3.80366849899292, -3.549684762954712, -3.295701026916504, -3.041717529296875, -2.787733554840088, -2.53374981880188, -2.279766321182251, -2.025782585144043, -1.7717989683151245, -1.517815351486206, -1.263831615447998, -1.0098479986190796, -0.7558643817901611, -0.5018807649612427, -0.24789708852767944, 0.006086587905883789, 0.26007020473480225, 0.5140538215637207, 0.7680375576019287, 1.0220211744308472, 1.2760047912597656, 1.529988408088684, 1.7839720249176025, 2.0379557609558105, 2.2919392585754395, 2.5459229946136475, 2.7999067306518555, 3.0538902282714844, 3.3078739643096924, 3.5618577003479004, 3.8158411979675293, 4.069825172424316, 4.323808670043945, 4.577792167663574, 4.831775665283203, 5.08575963973999, 5.339743137359619, 5.593726634979248, 5.847710609436035, 6.101694107055664, 6.355677604675293, 6.609661102294922, 6.863645076751709, 7.117628574371338, 7.371612548828125, 7.625596046447754, 7.879580020904541, 8.133563995361328, 8.387547492980957, 8.641530990600586, 8.895514488220215, 9.149497985839844, 9.403481483459473]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 3.0, 7.0, 12.0, 15.0, 9.0, 9.0, 16.0, 24.0, 21.0, 14.0, 30.0, 24.0, 25.0, 31.0, 38.0, 42.0, 44.0, 41.0, 43.0, 46.0, 41.0, 46.0, 39.0, 44.0, 44.0, 40.0, 33.0, 30.0, 34.0, 24.0, 18.0, 19.0, 14.0, 8.0, 19.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7783203125, -0.75238037109375, -0.7264404296875, -0.70050048828125, -0.674560546875, -0.64862060546875, -0.6226806640625, -0.59674072265625, -0.57080078125, -0.54486083984375, -0.5189208984375, -0.49298095703125, -0.467041015625, -0.44110107421875, -0.4151611328125, -0.38922119140625, -0.36328125, -0.33734130859375, -0.3114013671875, -0.28546142578125, -0.259521484375, -0.23358154296875, -0.2076416015625, -0.18170166015625, -0.15576171875, -0.12982177734375, -0.1038818359375, -0.07794189453125, -0.052001953125, -0.02606201171875, -0.0001220703125, 0.02581787109375, 0.0517578125, 0.07769775390625, 0.1036376953125, 0.12957763671875, 0.155517578125, 0.18145751953125, 0.2073974609375, 0.23333740234375, 0.25927734375, 0.28521728515625, 0.3111572265625, 0.33709716796875, 0.363037109375, 0.38897705078125, 0.4149169921875, 0.44085693359375, 0.466796875, 0.49273681640625, 0.5186767578125, 0.54461669921875, 0.570556640625, 0.59649658203125, 0.6224365234375, 0.64837646484375, 0.67431640625, 0.70025634765625, 0.7261962890625, 0.75213623046875, 0.778076171875, 0.80401611328125, 0.8299560546875, 0.85589599609375, 0.8818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 18.0, 21.0, 31.0, 58.0, 82.0, 113.0, 184.0, 259.0, 444.0, 631.0, 954.0, 1429.0, 2164.0, 3414.0, 5425.0, 8236.0, 12632.0, 19416.0, 29741.0, 45241.0, 66463.0, 92575.0, 119479.0, 136570.0, 132476.0, 111489.0, 84564.0, 59404.0, 39763.0, 26397.0, 17096.0, 11185.0, 7032.0, 4720.0, 2951.0, 2027.0, 1289.0, 912.0, 556.0, 349.0, 247.0, 183.0, 108.0, 64.0, 44.0, 24.0, 27.0, 18.0, 14.0, 12.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.58642578125, -0.5667800903320312, -0.5471343994140625, -0.5274887084960938, -0.507843017578125, -0.48819732666015625, -0.4685516357421875, -0.44890594482421875, -0.42926025390625, -0.40961456298828125, -0.3899688720703125, -0.37032318115234375, -0.350677490234375, -0.33103179931640625, -0.3113861083984375, -0.29174041748046875, -0.2720947265625, -0.25244903564453125, -0.2328033447265625, -0.21315765380859375, -0.193511962890625, -0.17386627197265625, -0.1542205810546875, -0.13457489013671875, -0.11492919921875, -0.09528350830078125, -0.0756378173828125, -0.05599212646484375, -0.036346435546875, -0.01670074462890625, 0.0029449462890625, 0.02259063720703125, 0.042236328125, 0.06188201904296875, 0.0815277099609375, 0.10117340087890625, 0.120819091796875, 0.14046478271484375, 0.1601104736328125, 0.17975616455078125, 0.19940185546875, 0.21904754638671875, 0.2386932373046875, 0.25833892822265625, 0.277984619140625, 0.29763031005859375, 0.3172760009765625, 0.33692169189453125, 0.3565673828125, 0.37621307373046875, 0.3958587646484375, 0.41550445556640625, 0.435150146484375, 0.45479583740234375, 0.4744415283203125, 0.49408721923828125, 0.51373291015625, 0.5333786010742188, 0.5530242919921875, 0.5726699829101562, 0.592315673828125, 0.6119613647460938, 0.6316070556640625, 0.6512527465820312, 0.6708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 7.0, 13.0, 14.0, 9.0, 11.0, 13.0, 29.0, 18.0, 19.0, 24.0, 34.0, 27.0, 32.0, 39.0, 32.0, 32.0, 31.0, 36.0, 42.0, 1058.0, 40.0, 27.0, 51.0, 29.0, 48.0, 36.0, 30.0, 26.0, 19.0, 26.0, 24.0, 31.0, 19.0, 13.0, 17.0, 8.0, 10.0, 6.0, 7.0, 5.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74951171875, -0.7255325317382812, -0.7015533447265625, -0.6775741577148438, -0.653594970703125, -0.6296157836914062, -0.6056365966796875, -0.5816574096679688, -0.55767822265625, -0.5336990356445312, -0.5097198486328125, -0.48574066162109375, -0.461761474609375, -0.43778228759765625, -0.4138031005859375, -0.38982391357421875, -0.3658447265625, -0.34186553955078125, -0.3178863525390625, -0.29390716552734375, -0.269927978515625, -0.24594879150390625, -0.2219696044921875, -0.19799041748046875, -0.17401123046875, -0.15003204345703125, -0.1260528564453125, -0.10207366943359375, -0.078094482421875, -0.05411529541015625, -0.0301361083984375, -0.00615692138671875, 0.017822265625, 0.04180145263671875, 0.0657806396484375, 0.08975982666015625, 0.113739013671875, 0.13771820068359375, 0.1616973876953125, 0.18567657470703125, 0.20965576171875, 0.23363494873046875, 0.2576141357421875, 0.28159332275390625, 0.305572509765625, 0.32955169677734375, 0.3535308837890625, 0.37751007080078125, 0.4014892578125, 0.42546844482421875, 0.4494476318359375, 0.47342681884765625, 0.497406005859375, 0.5213851928710938, 0.5453643798828125, 0.5693435668945312, 0.59332275390625, 0.6173019409179688, 0.6412811279296875, 0.6652603149414062, 0.689239501953125, 0.7132186889648438, 0.7371978759765625, 0.7611770629882812, 0.78515625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 9.0, 9.0, 14.0, 32.0, 37.0, 52.0, 101.0, 121.0, 223.0, 324.0, 469.0, 721.0, 1018.0, 1628.0, 2409.0, 3501.0, 5202.0, 8208.0, 12561.0, 20015.0, 40649.0, 185192.0, 1544069.0, 174861.0, 40004.0, 20008.0, 12235.0, 7756.0, 5101.0, 3461.0, 2401.0, 1550.0, 1056.0, 697.0, 489.0, 318.0, 211.0, 126.0, 91.0, 71.0, 42.0, 33.0, 13.0, 15.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.86669921875, -0.8415679931640625, -0.816436767578125, -0.7913055419921875, -0.76617431640625, -0.7410430908203125, -0.715911865234375, -0.6907806396484375, -0.6656494140625, -0.6405181884765625, -0.615386962890625, -0.5902557373046875, -0.56512451171875, -0.5399932861328125, -0.514862060546875, -0.4897308349609375, -0.464599609375, -0.4394683837890625, -0.414337158203125, -0.3892059326171875, -0.36407470703125, -0.3389434814453125, -0.313812255859375, -0.2886810302734375, -0.2635498046875, -0.2384185791015625, -0.213287353515625, -0.1881561279296875, -0.16302490234375, -0.1378936767578125, -0.112762451171875, -0.0876312255859375, -0.0625, -0.0373687744140625, -0.012237548828125, 0.0128936767578125, 0.03802490234375, 0.0631561279296875, 0.088287353515625, 0.1134185791015625, 0.1385498046875, 0.1636810302734375, 0.188812255859375, 0.2139434814453125, 0.23907470703125, 0.2642059326171875, 0.289337158203125, 0.3144683837890625, 0.339599609375, 0.3647308349609375, 0.389862060546875, 0.4149932861328125, 0.44012451171875, 0.4652557373046875, 0.490386962890625, 0.5155181884765625, 0.5406494140625, 0.5657806396484375, 0.590911865234375, 0.6160430908203125, 0.64117431640625, 0.6663055419921875, 0.691436767578125, 0.7165679931640625, 0.74169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 11.0, 7.0, 5.0, 14.0, 7.0, 17.0, 27.0, 32.0, 31.0, 45.0, 41.0, 43.0, 58.0, 84.0, 86.0, 69.0, 72.0, 72.0, 43.0, 45.0, 33.0, 24.0, 20.0, 19.0, 11.0, 12.0, 11.0, 10.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.125244140625, -0.12112998962402344, -0.11701583862304688, -0.11290168762207031, -0.10878753662109375, -0.10467338562011719, -0.10055923461914062, -0.09644508361816406, -0.0923309326171875, -0.08821678161621094, -0.08410263061523438, -0.07998847961425781, -0.07587432861328125, -0.07176017761230469, -0.06764602661132812, -0.06353187561035156, -0.059417724609375, -0.05530357360839844, -0.051189422607421875, -0.04707527160644531, -0.04296112060546875, -0.03884696960449219, -0.034732818603515625, -0.030618667602539062, -0.0265045166015625, -0.022390365600585938, -0.018276214599609375, -0.014162063598632812, -0.01004791259765625, -0.0059337615966796875, -0.001819610595703125, 0.0022945404052734375, 0.00640869140625, 0.010522842407226562, 0.014636993408203125, 0.018751144409179688, 0.02286529541015625, 0.026979446411132812, 0.031093597412109375, 0.03520774841308594, 0.0393218994140625, 0.04343605041503906, 0.047550201416015625, 0.05166435241699219, 0.05577850341796875, 0.05989265441894531, 0.06400680541992188, 0.06812095642089844, 0.072235107421875, 0.07634925842285156, 0.08046340942382812, 0.08457756042480469, 0.08869171142578125, 0.09280586242675781, 0.09692001342773438, 0.10103416442871094, 0.1051483154296875, 0.10926246643066406, 0.11337661743164062, 0.11749076843261719, 0.12160491943359375, 0.1257190704345703, 0.12983322143554688, 0.13394737243652344, 0.1380615234375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 14.0, 10.0, 11.0, 18.0, 27.0, 24.0, 35.0, 36.0, 60.0, 82.0, 132.0, 188.0, 312.0, 895.0, 5953.0, 161862.0, 855148.0, 20580.0, 1879.0, 445.0, 221.0, 141.0, 113.0, 67.0, 61.0, 38.0, 27.0, 18.0, 23.0, 14.0, 19.0, 11.0, 10.0, 12.0, 7.0, 7.0, 4.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.1171875, -2.055328369140625, -1.99346923828125, -1.931610107421875, -1.8697509765625, -1.807891845703125, -1.74603271484375, -1.684173583984375, -1.622314453125, -1.560455322265625, -1.49859619140625, -1.436737060546875, -1.3748779296875, -1.313018798828125, -1.25115966796875, -1.189300537109375, -1.12744140625, -1.065582275390625, -1.00372314453125, -0.941864013671875, -0.8800048828125, -0.818145751953125, -0.75628662109375, -0.694427490234375, -0.632568359375, -0.570709228515625, -0.50885009765625, -0.446990966796875, -0.3851318359375, -0.323272705078125, -0.26141357421875, -0.199554443359375, -0.1376953125, -0.075836181640625, -0.01397705078125, 0.047882080078125, 0.1097412109375, 0.171600341796875, 0.23345947265625, 0.295318603515625, 0.357177734375, 0.419036865234375, 0.48089599609375, 0.542755126953125, 0.6046142578125, 0.666473388671875, 0.72833251953125, 0.790191650390625, 0.85205078125, 0.913909912109375, 0.97576904296875, 1.037628173828125, 1.0994873046875, 1.161346435546875, 1.22320556640625, 1.285064697265625, 1.346923828125, 1.408782958984375, 1.47064208984375, 1.532501220703125, 1.5943603515625, 1.656219482421875, 1.71807861328125, 1.779937744140625, 1.841796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 22.0, 61.0, 133.0, 251.0, 304.0, 146.0, 47.0, 26.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1922073364257812, -2.1312191486358643, -2.0702309608459473, -2.0092427730560303, -1.9482544660568237, -1.8872662782669067, -1.8262780904769897, -1.7652899026870728, -1.7043017148971558, -1.6433135271072388, -1.5823253393173218, -1.5213370323181152, -1.4603488445281982, -1.3993606567382812, -1.3383724689483643, -1.2773842811584473, -1.2163960933685303, -1.1554079055786133, -1.0944197177886963, -1.0334315299987793, -0.9724432826042175, -0.9114550352096558, -0.8504668474197388, -0.7894786596298218, -0.7284903526306152, -0.6675021648406982, -0.6065139174461365, -0.5455257296562195, -0.4845375418663025, -0.4235493242740631, -0.36256110668182373, -0.30157291889190674, -0.24058473110198975, -0.17959652841091156, -0.11860831826925278, -0.057620108127593994, 0.003368094563484192, 0.06435629725456238, 0.12534451484680176, 0.18633270263671875, 0.24732092022895813, 0.3083091378211975, 0.3692973256111145, 0.4302855432033539, 0.49127376079559326, 0.5522619485855103, 0.6132501363754272, 0.6742383241653442, 0.735226571559906, 0.796214759349823, 0.8572030067443848, 0.9181911945343018, 0.9791793823242188, 1.0401675701141357, 1.1011557579040527, 1.1621439456939697, 1.2231322526931763, 1.2841204404830933, 1.3451086282730103, 1.4060969352722168, 1.4670851230621338, 1.5280733108520508, 1.5890614986419678, 1.6500496864318848, 1.7110378742218018]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 6.0, 12.0, 9.0, 10.0, 11.0, 9.0, 17.0, 11.0, 21.0, 28.0, 25.0, 33.0, 20.0, 32.0, 35.0, 27.0, 31.0, 37.0, 51.0, 45.0, 30.0, 48.0, 46.0, 32.0, 37.0, 27.0, 27.0, 33.0, 19.0, 26.0, 25.0, 25.0, 15.0, 20.0, 26.0, 13.0, 12.0, 6.0, 8.0, 9.0, 9.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.42906856536865234, -0.41569530963897705, -0.40232208371162415, -0.38894882798194885, -0.37557557225227356, -0.36220234632492065, -0.34882909059524536, -0.33545583486557007, -0.3220825791358948, -0.3087093234062195, -0.2953360974788666, -0.2819628417491913, -0.268589586019516, -0.2552163600921631, -0.2418431043624878, -0.2284698486328125, -0.2150966078042984, -0.2017233669757843, -0.188350111246109, -0.1749768704175949, -0.16160361468791962, -0.14823037385940552, -0.13485711812973022, -0.12148387730121613, -0.10811062902212143, -0.09473738074302673, -0.08136413246393204, -0.06799088418483734, -0.054617639631032944, -0.041244395077228546, -0.02787114679813385, -0.014497898519039154, -0.001124650239944458, 0.012248597107827663, 0.025621844455599785, 0.03899509087204933, 0.05236833915114403, 0.06574158370494843, 0.07911483198404312, 0.09248808026313782, 0.10586132854223251, 0.11923457682132721, 0.1326078176498413, 0.1459810733795166, 0.1593543142080307, 0.1727275550365448, 0.1861008107662201, 0.19947406649589539, 0.21284730732440948, 0.22622054815292358, 0.23959380388259888, 0.25296705961227417, 0.2663402855396271, 0.27971354126930237, 0.29308679699897766, 0.30646002292633057, 0.31983327865600586, 0.33320653438568115, 0.34657976031303406, 0.35995301604270935, 0.37332627177238464, 0.38669949769973755, 0.40007275342941284, 0.41344600915908813, 0.4268192648887634]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 7.0, 11.0, 9.0, 11.0, 19.0, 16.0, 12.0, 31.0, 27.0, 28.0, 21.0, 36.0, 30.0, 35.0, 35.0, 49.0, 38.0, 55.0, 55.0, 41.0, 54.0, 45.0, 47.0, 36.0, 33.0, 46.0, 32.0, 17.0, 14.0, 18.0, 13.0, 8.0, 19.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7777786254882812, -0.7508697509765625, -0.7239608764648438, -0.697052001953125, -0.6701431274414062, -0.6432342529296875, -0.6163253784179688, -0.58941650390625, -0.5625076293945312, -0.5355987548828125, -0.5086898803710938, -0.481781005859375, -0.45487213134765625, -0.4279632568359375, -0.40105438232421875, -0.3741455078125, -0.34723663330078125, -0.3203277587890625, -0.29341888427734375, -0.266510009765625, -0.23960113525390625, -0.2126922607421875, -0.18578338623046875, -0.15887451171875, -0.13196563720703125, -0.1050567626953125, -0.07814788818359375, -0.051239013671875, -0.02433013916015625, 0.0025787353515625, 0.02948760986328125, 0.056396484375, 0.08330535888671875, 0.1102142333984375, 0.13712310791015625, 0.164031982421875, 0.19094085693359375, 0.2178497314453125, 0.24475860595703125, 0.27166748046875, 0.29857635498046875, 0.3254852294921875, 0.35239410400390625, 0.379302978515625, 0.40621185302734375, 0.4331207275390625, 0.46002960205078125, 0.4869384765625, 0.5138473510742188, 0.5407562255859375, 0.5676651000976562, 0.594573974609375, 0.6214828491210938, 0.6483917236328125, 0.6753005981445312, 0.70220947265625, 0.7291183471679688, 0.7560272216796875, 0.7829360961914062, 0.809844970703125, 0.8367538452148438, 0.8636627197265625, 0.8905715942382812, 0.91748046875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 8.0, 29.0, 28.0, 31.0, 68.0, 88.0, 134.0, 221.0, 361.0, 613.0, 905.0, 1573.0, 2632.0, 4708.0, 8804.0, 17789.0, 47584.0, 220570.0, 556553.0, 122001.0, 32949.0, 14145.0, 6978.0, 3970.0, 2200.0, 1363.0, 838.0, 499.0, 307.0, 216.0, 135.0, 89.0, 47.0, 27.0, 24.0, 13.0, 15.0, 4.0, 7.0, 5.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.052734375, -1.992950439453125, -1.93316650390625, -1.873382568359375, -1.8135986328125, -1.753814697265625, -1.69403076171875, -1.634246826171875, -1.574462890625, -1.514678955078125, -1.45489501953125, -1.395111083984375, -1.3353271484375, -1.275543212890625, -1.21575927734375, -1.155975341796875, -1.09619140625, -1.036407470703125, -0.97662353515625, -0.916839599609375, -0.8570556640625, -0.797271728515625, -0.73748779296875, -0.677703857421875, -0.617919921875, -0.558135986328125, -0.49835205078125, -0.438568115234375, -0.3787841796875, -0.319000244140625, -0.25921630859375, -0.199432373046875, -0.1396484375, -0.079864501953125, -0.02008056640625, 0.039703369140625, 0.0994873046875, 0.159271240234375, 0.21905517578125, 0.278839111328125, 0.338623046875, 0.398406982421875, 0.45819091796875, 0.517974853515625, 0.5777587890625, 0.637542724609375, 0.69732666015625, 0.757110595703125, 0.81689453125, 0.876678466796875, 0.93646240234375, 0.996246337890625, 1.0560302734375, 1.115814208984375, 1.17559814453125, 1.235382080078125, 1.295166015625, 1.354949951171875, 1.41473388671875, 1.474517822265625, 1.5343017578125, 1.594085693359375, 1.65386962890625, 1.713653564453125, 1.7734375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 5.0, 8.0, 13.0, 13.0, 11.0, 16.0, 22.0, 24.0, 19.0, 25.0, 35.0, 28.0, 32.0, 38.0, 37.0, 57.0, 61.0, 103.0, 142.0, 1422.0, 276.0, 127.0, 80.0, 66.0, 48.0, 59.0, 26.0, 40.0, 24.0, 23.0, 24.0, 17.0, 16.0, 24.0, 15.0, 14.0, 5.0, 11.0, 13.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.162109375, -3.071197509765625, -2.98028564453125, -2.889373779296875, -2.7984619140625, -2.707550048828125, -2.61663818359375, -2.525726318359375, -2.434814453125, -2.343902587890625, -2.25299072265625, -2.162078857421875, -2.0711669921875, -1.980255126953125, -1.88934326171875, -1.798431396484375, -1.70751953125, -1.616607666015625, -1.52569580078125, -1.434783935546875, -1.3438720703125, -1.252960205078125, -1.16204833984375, -1.071136474609375, -0.980224609375, -0.889312744140625, -0.79840087890625, -0.707489013671875, -0.6165771484375, -0.525665283203125, -0.43475341796875, -0.343841552734375, -0.2529296875, -0.162017822265625, -0.07110595703125, 0.019805908203125, 0.1107177734375, 0.201629638671875, 0.29254150390625, 0.383453369140625, 0.474365234375, 0.565277099609375, 0.65618896484375, 0.747100830078125, 0.8380126953125, 0.928924560546875, 1.01983642578125, 1.110748291015625, 1.20166015625, 1.292572021484375, 1.38348388671875, 1.474395751953125, 1.5653076171875, 1.656219482421875, 1.74713134765625, 1.838043212890625, 1.928955078125, 2.019866943359375, 2.11077880859375, 2.201690673828125, 2.2926025390625, 2.383514404296875, 2.47442626953125, 2.565338134765625, 2.65625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 5.0, 8.0, 10.0, 15.0, 18.0, 17.0, 23.0, 33.0, 36.0, 35.0, 79.0, 109.0, 155.0, 317.0, 591.0, 1229.0, 2450.0, 5828.0, 16060.0, 56597.0, 407071.0, 2397243.0, 200157.0, 37258.0, 11767.0, 4407.0, 1977.0, 921.0, 461.0, 265.0, 166.0, 96.0, 64.0, 47.0, 38.0, 30.0, 28.0, 25.0, 13.0, 12.0, 11.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.28515625, -3.173248291015625, -3.06134033203125, -2.949432373046875, -2.8375244140625, -2.725616455078125, -2.61370849609375, -2.501800537109375, -2.389892578125, -2.277984619140625, -2.16607666015625, -2.054168701171875, -1.9422607421875, -1.830352783203125, -1.71844482421875, -1.606536865234375, -1.49462890625, -1.382720947265625, -1.27081298828125, -1.158905029296875, -1.0469970703125, -0.935089111328125, -0.82318115234375, -0.711273193359375, -0.599365234375, -0.487457275390625, -0.37554931640625, -0.263641357421875, -0.1517333984375, -0.039825439453125, 0.07208251953125, 0.183990478515625, 0.2958984375, 0.407806396484375, 0.51971435546875, 0.631622314453125, 0.7435302734375, 0.855438232421875, 0.96734619140625, 1.079254150390625, 1.191162109375, 1.303070068359375, 1.41497802734375, 1.526885986328125, 1.6387939453125, 1.750701904296875, 1.86260986328125, 1.974517822265625, 2.08642578125, 2.198333740234375, 2.31024169921875, 2.422149658203125, 2.5340576171875, 2.645965576171875, 2.75787353515625, 2.869781494140625, 2.981689453125, 3.093597412109375, 3.20550537109375, 3.317413330078125, 3.4293212890625, 3.541229248046875, 3.65313720703125, 3.765045166015625, 3.876953125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 58.0, 290.0, 442.0, 176.0, 39.0, 3.0], "bins": [-55.20594787597656, -54.29047775268555, -53.3750114440918, -52.45954132080078, -51.54407501220703, -50.628604888916016, -49.713134765625, -48.79766845703125, -47.882198333740234, -46.96672821044922, -46.05126190185547, -45.13579177856445, -44.2203254699707, -43.30485534667969, -42.38938903808594, -41.47391891479492, -40.55845260620117, -39.642982482910156, -38.727516174316406, -37.81204605102539, -36.89657974243164, -35.981109619140625, -35.065643310546875, -34.15017318725586, -33.234703063964844, -32.31923294067383, -31.403766632080078, -30.488296508789062, -29.57282829284668, -28.657360076904297, -27.741891860961914, -26.82642364501953, -25.91095542907715, -24.995487213134766, -24.080018997192383, -23.16455078125, -22.249080657958984, -21.3336124420166, -20.41814422607422, -19.502676010131836, -18.587207794189453, -17.67173957824707, -16.756271362304688, -15.840802192687988, -14.925333976745605, -14.009864807128906, -13.094396591186523, -12.17892837524414, -11.263458251953125, -10.347990036010742, -9.432520866394043, -8.51705265045166, -7.601584434509277, -6.686115741729736, -5.770647048950195, -4.8551788330078125, -3.9397106170654297, -3.0242421627044678, -2.108773708343506, -1.1933050155639648, -0.27783656120300293, 0.637631893157959, 1.5531005859375, 2.468568801879883, 3.384037494659424]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 3.0, 11.0, 9.0, 14.0, 30.0, 37.0, 22.0, 39.0, 32.0, 28.0, 42.0, 50.0, 39.0, 32.0, 49.0, 59.0, 49.0, 53.0, 50.0, 34.0, 32.0, 45.0, 39.0, 32.0, 15.0, 27.0, 27.0, 11.0, 19.0, 13.0, 8.0, 9.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.994815826416016, -8.629061698913574, -8.26330852508545, -7.897554397583008, -7.531800746917725, -7.166047096252441, -6.80029296875, -6.434539318084717, -6.068785667419434, -5.70303201675415, -5.337277889251709, -4.971524238586426, -4.605770587921143, -4.240016937255859, -3.874262809753418, -3.5085091590881348, -3.1427550315856934, -2.777001142501831, -2.411247491836548, -2.0454936027526855, -1.6797398328781128, -1.31398606300354, -0.9482321739196777, -0.5824785232543945, -0.21672463417053223, 0.14902916550636292, 0.5147829651832581, 0.8805367946624756, 1.2462905645370483, 1.612044334411621, 1.9777982234954834, 2.3435518741607666, 2.709305763244629, 3.075059652328491, 3.4408133029937744, 3.8065671920776367, 4.17232084274292, 4.538074493408203, 4.9038286209106445, 5.269582271575928, 5.635335922241211, 6.001089572906494, 6.3668437004089355, 6.732597351074219, 7.098351001739502, 7.464104652404785, 7.829858779907227, 8.195611953735352, 8.56136703491211, 8.92712116241455, 9.292874336242676, 9.658628463745117, 10.024382591247559, 10.390135765075684, 10.755889892578125, 11.12164306640625, 11.487397193908691, 11.853151321411133, 12.218904495239258, 12.5846586227417, 12.95041275024414, 13.316165924072266, 13.681920051574707, 14.047674179077148, 14.413427352905273]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 10.0, 16.0, 16.0, 20.0, 28.0, 29.0, 24.0, 30.0, 33.0, 40.0, 45.0, 43.0, 40.0, 50.0, 41.0, 54.0, 36.0, 53.0, 47.0, 45.0, 40.0, 33.0, 32.0, 30.0, 25.0, 21.0, 14.0, 15.0, 8.0, 13.0, 12.0, 4.0, 3.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84423828125, -0.8149337768554688, -0.7856292724609375, -0.7563247680664062, -0.727020263671875, -0.6977157592773438, -0.6684112548828125, -0.6391067504882812, -0.60980224609375, -0.5804977416992188, -0.5511932373046875, -0.5218887329101562, -0.492584228515625, -0.46327972412109375, -0.4339752197265625, -0.40467071533203125, -0.3753662109375, -0.34606170654296875, -0.3167572021484375, -0.28745269775390625, -0.258148193359375, -0.22884368896484375, -0.1995391845703125, -0.17023468017578125, -0.14093017578125, -0.11162567138671875, -0.0823211669921875, -0.05301666259765625, -0.023712158203125, 0.00559234619140625, 0.0348968505859375, 0.06420135498046875, 0.093505859375, 0.12281036376953125, 0.1521148681640625, 0.18141937255859375, 0.210723876953125, 0.24002838134765625, 0.2693328857421875, 0.29863739013671875, 0.32794189453125, 0.35724639892578125, 0.3865509033203125, 0.41585540771484375, 0.445159912109375, 0.47446441650390625, 0.5037689208984375, 0.5330734252929688, 0.5623779296875, 0.5916824340820312, 0.6209869384765625, 0.6502914428710938, 0.679595947265625, 0.7089004516601562, 0.7382049560546875, 0.7675094604492188, 0.79681396484375, 0.8261184692382812, 0.8554229736328125, 0.8847274780273438, 0.914031982421875, 0.9433364868164062, 0.9726409912109375, 1.0019454956054688, 1.03125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 2.0, 12.0, 14.0, 21.0, 23.0, 42.0, 53.0, 105.0, 174.0, 330.0, 644.0, 1500.0, 3719.0, 9061.0, 26064.0, 108975.0, 2121047.0, 1785596.0, 97908.0, 24040.0, 8580.0, 3326.0, 1466.0, 705.0, 363.0, 177.0, 104.0, 64.0, 47.0, 27.0, 19.0, 21.0, 13.0, 5.0, 7.0, 9.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.496612548828125, -3.37994384765625, -3.263275146484375, -3.1466064453125, -3.029937744140625, -2.91326904296875, -2.796600341796875, -2.679931640625, -2.563262939453125, -2.44659423828125, -2.329925537109375, -2.2132568359375, -2.096588134765625, -1.97991943359375, -1.863250732421875, -1.74658203125, -1.629913330078125, -1.51324462890625, -1.396575927734375, -1.2799072265625, -1.163238525390625, -1.04656982421875, -0.929901123046875, -0.813232421875, -0.696563720703125, -0.57989501953125, -0.463226318359375, -0.3465576171875, -0.229888916015625, -0.11322021484375, 0.003448486328125, 0.1201171875, 0.236785888671875, 0.35345458984375, 0.470123291015625, 0.5867919921875, 0.703460693359375, 0.82012939453125, 0.936798095703125, 1.053466796875, 1.170135498046875, 1.28680419921875, 1.403472900390625, 1.5201416015625, 1.636810302734375, 1.75347900390625, 1.870147705078125, 1.98681640625, 2.103485107421875, 2.22015380859375, 2.336822509765625, 2.4534912109375, 2.570159912109375, 2.68682861328125, 2.803497314453125, 2.920166015625, 3.036834716796875, 3.15350341796875, 3.270172119140625, 3.3868408203125, 3.503509521484375, 3.62017822265625, 3.736846923828125, 3.853515625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 11.0, 10.0, 21.0, 37.0, 54.0, 98.0, 171.0, 339.0, 710.0, 1096.0, 748.0, 351.0, 177.0, 111.0, 65.0, 26.0, 21.0, 13.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.375, -7.213134765625, -7.05126953125, -6.889404296875, -6.7275390625, -6.565673828125, -6.40380859375, -6.241943359375, -6.080078125, -5.918212890625, -5.75634765625, -5.594482421875, -5.4326171875, -5.270751953125, -5.10888671875, -4.947021484375, -4.78515625, -4.623291015625, -4.46142578125, -4.299560546875, -4.1376953125, -3.975830078125, -3.81396484375, -3.652099609375, -3.490234375, -3.328369140625, -3.16650390625, -3.004638671875, -2.8427734375, -2.680908203125, -2.51904296875, -2.357177734375, -2.1953125, -2.033447265625, -1.87158203125, -1.709716796875, -1.5478515625, -1.385986328125, -1.22412109375, -1.062255859375, -0.900390625, -0.738525390625, -0.57666015625, -0.414794921875, -0.2529296875, -0.091064453125, 0.07080078125, 0.232666015625, 0.39453125, 0.556396484375, 0.71826171875, 0.880126953125, 1.0419921875, 1.203857421875, 1.36572265625, 1.527587890625, 1.689453125, 1.851318359375, 2.01318359375, 2.175048828125, 2.3369140625, 2.498779296875, 2.66064453125, 2.822509765625, 2.984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 10.0, 23.0, 22.0, 24.0, 27.0, 43.0, 70.0, 119.0, 219.0, 663.0, 2083.0, 8485.0, 54974.0, 1118586.0, 2898624.0, 93448.0, 12587.0, 2711.0, 835.0, 320.0, 155.0, 71.0, 45.0, 27.0, 30.0, 15.0, 22.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.39447021484375, -6.1053466796875, -5.81622314453125, -5.527099609375, -5.23797607421875, -4.9488525390625, -4.65972900390625, -4.37060546875, -4.08148193359375, -3.7923583984375, -3.50323486328125, -3.214111328125, -2.92498779296875, -2.6358642578125, -2.34674072265625, -2.0576171875, -1.76849365234375, -1.4793701171875, -1.19024658203125, -0.901123046875, -0.61199951171875, -0.3228759765625, -0.03375244140625, 0.25537109375, 0.54449462890625, 0.8336181640625, 1.12274169921875, 1.411865234375, 1.70098876953125, 1.9901123046875, 2.27923583984375, 2.568359375, 2.85748291015625, 3.1466064453125, 3.43572998046875, 3.724853515625, 4.01397705078125, 4.3031005859375, 4.59222412109375, 4.88134765625, 5.17047119140625, 5.4595947265625, 5.74871826171875, 6.037841796875, 6.32696533203125, 6.6160888671875, 6.90521240234375, 7.1943359375, 7.48345947265625, 7.7725830078125, 8.06170654296875, 8.350830078125, 8.63995361328125, 8.9290771484375, 9.21820068359375, 9.50732421875, 9.79644775390625, 10.0855712890625, 10.37469482421875, 10.663818359375, 10.95294189453125, 11.2420654296875, 11.53118896484375, 11.8203125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 19.0, 44.0, 61.0, 129.0, 201.0, 194.0, 166.0, 105.0, 46.0, 20.0, 9.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.7143669128418, -35.8249397277832, -34.93551254272461, -34.046085357666016, -33.15665817260742, -32.26723098754883, -31.377803802490234, -30.488378524780273, -29.59895133972168, -28.709524154663086, -27.820096969604492, -26.9306697845459, -26.041242599487305, -25.151817321777344, -24.26239013671875, -23.372962951660156, -22.483535766601562, -21.59410858154297, -20.704681396484375, -19.81525421142578, -18.925827026367188, -18.036399841308594, -17.14697265625, -16.25754737854004, -15.368118286132812, -14.478691101074219, -13.589263916015625, -12.699836730957031, -11.810410499572754, -10.92098331451416, -10.031556129455566, -9.142129898071289, -8.252702713012695, -7.363275527954102, -6.473848819732666, -5.584421634674072, -4.694994926452637, -3.805567741394043, -2.916140556335449, -2.0267138481140137, -1.13728666305542, -0.2478596568107605, 0.6415673494338989, 1.5309944152832031, 2.4204213619232178, 3.3098483085632324, 4.199275493621826, 5.088702201843262, 5.9781293869018555, 6.867556571960449, 7.756983280181885, 8.64640998840332, 9.535837173461914, 10.425264358520508, 11.314691543579102, 12.204118728637695, 13.093545913696289, 13.982973098754883, 14.872400283813477, 15.76182746887207, 16.651254653930664, 17.540679931640625, 18.43010711669922, 19.319534301757812, 20.208961486816406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 13.0, 10.0, 15.0, 20.0, 18.0, 21.0, 21.0, 28.0, 24.0, 34.0, 33.0, 53.0, 35.0, 36.0, 35.0, 41.0, 58.0, 38.0, 31.0, 31.0, 33.0, 40.0, 28.0, 33.0, 32.0, 28.0, 28.0, 28.0, 16.0, 15.0, 13.0, 12.0, 9.0, 12.0, 5.0, 5.0, 12.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.801793098449707, -8.55057144165039, -8.29935073852539, -8.048129081726074, -7.796907424926758, -7.5456862449646, -7.294465065002441, -7.043243408203125, -6.792022228240967, -6.540801048278809, -6.289579391479492, -6.038358211517334, -5.787137031555176, -5.535915374755859, -5.284694194793701, -5.033473014831543, -4.782251358032227, -4.531030178070068, -4.279808521270752, -4.028587341308594, -3.7773659229278564, -3.526144504547119, -3.274923324584961, -3.0237019062042236, -2.7724804878234863, -2.521259069442749, -2.2700376510620117, -2.0188164710998535, -1.7675950527191162, -1.516373634338379, -1.2651523351669312, -1.0139310359954834, -0.7627086639404297, -0.5114873051643372, -0.26026594638824463, -0.0090445876121521, 0.24217677116394043, 0.49339818954467773, 0.7446194887161255, 0.9958407878875732, 1.2470622062683105, 1.4982836246490479, 1.7495049238204956, 2.0007262229919434, 2.2519476413726807, 2.503169059753418, 2.754390239715576, 3.0056116580963135, 3.256833076477051, 3.508054494857788, 3.7592759132385254, 4.010497093200684, 4.26171875, 4.512939929962158, 4.764161109924316, 5.015382766723633, 5.266603946685791, 5.517825126647949, 5.769046783447266, 6.020267963409424, 6.271489143371582, 6.522710800170898, 6.773931980133057, 7.025153160095215, 7.276374816894531]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 12.0, 10.0, 16.0, 16.0, 20.0, 24.0, 19.0, 27.0, 22.0, 18.0, 29.0, 31.0, 28.0, 34.0, 38.0, 40.0, 48.0, 42.0, 53.0, 43.0, 50.0, 42.0, 33.0, 39.0, 36.0, 31.0, 23.0, 18.0, 23.0, 15.0, 17.0, 16.0, 13.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87744140625, -0.8497467041015625, -0.822052001953125, -0.7943572998046875, -0.76666259765625, -0.7389678955078125, -0.711273193359375, -0.6835784912109375, -0.6558837890625, -0.6281890869140625, -0.600494384765625, -0.5727996826171875, -0.54510498046875, -0.5174102783203125, -0.489715576171875, -0.4620208740234375, -0.434326171875, -0.4066314697265625, -0.378936767578125, -0.3512420654296875, -0.32354736328125, -0.2958526611328125, -0.268157958984375, -0.2404632568359375, -0.2127685546875, -0.1850738525390625, -0.157379150390625, -0.1296844482421875, -0.10198974609375, -0.0742950439453125, -0.046600341796875, -0.0189056396484375, 0.0087890625, 0.0364837646484375, 0.064178466796875, 0.0918731689453125, 0.11956787109375, 0.1472625732421875, 0.174957275390625, 0.2026519775390625, 0.2303466796875, 0.2580413818359375, 0.285736083984375, 0.3134307861328125, 0.34112548828125, 0.3688201904296875, 0.396514892578125, 0.4242095947265625, 0.451904296875, 0.4795989990234375, 0.507293701171875, 0.5349884033203125, 0.56268310546875, 0.5903778076171875, 0.618072509765625, 0.6457672119140625, 0.6734619140625, 0.7011566162109375, 0.728851318359375, 0.7565460205078125, 0.78424072265625, 0.8119354248046875, 0.839630126953125, 0.8673248291015625, 0.89501953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 12.0, 17.0, 36.0, 46.0, 49.0, 109.0, 145.0, 265.0, 332.0, 508.0, 825.0, 1226.0, 1761.0, 2665.0, 4020.0, 5901.0, 8889.0, 13255.0, 19568.0, 29233.0, 42656.0, 60681.0, 84802.0, 111115.0, 133089.0, 134891.0, 112511.0, 85538.0, 61731.0, 42538.0, 29630.0, 19618.0, 13538.0, 8966.0, 6126.0, 4103.0, 2752.0, 1815.0, 1193.0, 850.0, 516.0, 342.0, 230.0, 170.0, 95.0, 75.0, 38.0, 37.0, 20.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.68701171875, -0.6668167114257812, -0.6466217041015625, -0.6264266967773438, -0.606231689453125, -0.5860366821289062, -0.5658416748046875, -0.5456466674804688, -0.52545166015625, -0.5052566528320312, -0.4850616455078125, -0.46486663818359375, -0.444671630859375, -0.42447662353515625, -0.4042816162109375, -0.38408660888671875, -0.3638916015625, -0.34369659423828125, -0.3235015869140625, -0.30330657958984375, -0.283111572265625, -0.26291656494140625, -0.2427215576171875, -0.22252655029296875, -0.20233154296875, -0.18213653564453125, -0.1619415283203125, -0.14174652099609375, -0.121551513671875, -0.10135650634765625, -0.0811614990234375, -0.06096649169921875, -0.040771484375, -0.02057647705078125, -0.0003814697265625, 0.01981353759765625, 0.040008544921875, 0.06020355224609375, 0.0803985595703125, 0.10059356689453125, 0.12078857421875, 0.14098358154296875, 0.1611785888671875, 0.18137359619140625, 0.201568603515625, 0.22176361083984375, 0.2419586181640625, 0.26215362548828125, 0.2823486328125, 0.30254364013671875, 0.3227386474609375, 0.34293365478515625, 0.363128662109375, 0.38332366943359375, 0.4035186767578125, 0.42371368408203125, 0.44390869140625, 0.46410369873046875, 0.4842987060546875, 0.5044937133789062, 0.524688720703125, 0.5448837280273438, 0.5650787353515625, 0.5852737426757812, 0.60546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 14.0, 21.0, 21.0, 21.0, 21.0, 25.0, 36.0, 47.0, 26.0, 49.0, 38.0, 43.0, 38.0, 47.0, 1068.0, 42.0, 43.0, 46.0, 46.0, 36.0, 42.0, 47.0, 28.0, 24.0, 27.0, 26.0, 17.0, 9.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.255859375, -1.2216720581054688, -1.1874847412109375, -1.1532974243164062, -1.119110107421875, -1.0849227905273438, -1.0507354736328125, -1.0165481567382812, -0.98236083984375, -0.9481735229492188, -0.9139862060546875, -0.8797988891601562, -0.845611572265625, -0.8114242553710938, -0.7772369384765625, -0.7430496215820312, -0.7088623046875, -0.6746749877929688, -0.6404876708984375, -0.6063003540039062, -0.572113037109375, -0.5379257202148438, -0.5037384033203125, -0.46955108642578125, -0.43536376953125, -0.40117645263671875, -0.3669891357421875, -0.33280181884765625, -0.298614501953125, -0.26442718505859375, -0.2302398681640625, -0.19605255126953125, -0.161865234375, -0.12767791748046875, -0.0934906005859375, -0.05930328369140625, -0.025115966796875, 0.00907135009765625, 0.0432586669921875, 0.07744598388671875, 0.11163330078125, 0.14582061767578125, 0.1800079345703125, 0.21419525146484375, 0.248382568359375, 0.28256988525390625, 0.3167572021484375, 0.35094451904296875, 0.3851318359375, 0.41931915283203125, 0.4535064697265625, 0.48769378662109375, 0.521881103515625, 0.5560684204101562, 0.5902557373046875, 0.6244430541992188, 0.65863037109375, 0.6928176879882812, 0.7270050048828125, 0.7611923217773438, 0.795379638671875, 0.8295669555664062, 0.8637542724609375, 0.8979415893554688, 0.93212890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 7.0, 5.0, 9.0, 20.0, 28.0, 46.0, 85.0, 120.0, 169.0, 279.0, 435.0, 683.0, 1038.0, 1751.0, 2729.0, 4218.0, 7153.0, 11815.0, 21167.0, 46316.0, 256580.0, 1551521.0, 114898.0, 33507.0, 16922.0, 9815.0, 5820.0, 3649.0, 2376.0, 1460.0, 925.0, 591.0, 368.0, 211.0, 133.0, 110.0, 70.0, 44.0, 24.0, 14.0, 9.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99072265625, -0.9557418823242188, -0.9207611083984375, -0.8857803344726562, -0.850799560546875, -0.8158187866210938, -0.7808380126953125, -0.7458572387695312, -0.71087646484375, -0.6758956909179688, -0.6409149169921875, -0.6059341430664062, -0.570953369140625, -0.5359725952148438, -0.5009918212890625, -0.46601104736328125, -0.4310302734375, -0.39604949951171875, -0.3610687255859375, -0.32608795166015625, -0.291107177734375, -0.25612640380859375, -0.2211456298828125, -0.18616485595703125, -0.15118408203125, -0.11620330810546875, -0.0812225341796875, -0.04624176025390625, -0.011260986328125, 0.02371978759765625, 0.0587005615234375, 0.09368133544921875, 0.128662109375, 0.16364288330078125, 0.1986236572265625, 0.23360443115234375, 0.268585205078125, 0.30356597900390625, 0.3385467529296875, 0.37352752685546875, 0.40850830078125, 0.44348907470703125, 0.4784698486328125, 0.5134506225585938, 0.548431396484375, 0.5834121704101562, 0.6183929443359375, 0.6533737182617188, 0.6883544921875, 0.7233352661132812, 0.7583160400390625, 0.7932968139648438, 0.828277587890625, 0.8632583618164062, 0.8982391357421875, 0.9332199096679688, 0.96820068359375, 1.0031814575195312, 1.0381622314453125, 1.0731430053710938, 1.108123779296875, 1.1431045532226562, 1.1780853271484375, 1.2130661010742188, 1.248046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 6.0, 7.0, 7.0, 4.0, 12.0, 18.0, 9.0, 17.0, 35.0, 33.0, 41.0, 45.0, 52.0, 68.0, 86.0, 72.0, 88.0, 52.0, 50.0, 45.0, 46.0, 35.0, 36.0, 22.0, 19.0, 18.0, 15.0, 13.0, 6.0, 8.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207763671875, -0.2004852294921875, -0.193206787109375, -0.1859283447265625, -0.17864990234375, -0.1713714599609375, -0.164093017578125, -0.1568145751953125, -0.1495361328125, -0.1422576904296875, -0.134979248046875, -0.1277008056640625, -0.12042236328125, -0.1131439208984375, -0.105865478515625, -0.0985870361328125, -0.09130859375, -0.0840301513671875, -0.076751708984375, -0.0694732666015625, -0.06219482421875, -0.0549163818359375, -0.047637939453125, -0.0403594970703125, -0.0330810546875, -0.0258026123046875, -0.018524169921875, -0.0112457275390625, -0.00396728515625, 0.0033111572265625, 0.010589599609375, 0.0178680419921875, 0.025146484375, 0.0324249267578125, 0.039703369140625, 0.0469818115234375, 0.05426025390625, 0.0615386962890625, 0.068817138671875, 0.0760955810546875, 0.0833740234375, 0.0906524658203125, 0.097930908203125, 0.1052093505859375, 0.11248779296875, 0.1197662353515625, 0.127044677734375, 0.1343231201171875, 0.1416015625, 0.1488800048828125, 0.156158447265625, 0.1634368896484375, 0.17071533203125, 0.1779937744140625, 0.185272216796875, 0.1925506591796875, 0.1998291015625, 0.2071075439453125, 0.214385986328125, 0.2216644287109375, 0.22894287109375, 0.2362213134765625, 0.243499755859375, 0.2507781982421875, 0.258056640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 7.0, 12.0, 9.0, 18.0, 21.0, 37.0, 49.0, 46.0, 73.0, 126.0, 163.0, 282.0, 798.0, 3332.0, 26636.0, 744937.0, 255586.0, 12958.0, 2079.0, 559.0, 263.0, 197.0, 87.0, 79.0, 51.0, 35.0, 28.0, 16.0, 12.0, 8.0, 9.0, 10.0, 6.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4921875, -3.394775390625, -3.29736328125, -3.199951171875, -3.1025390625, -3.005126953125, -2.90771484375, -2.810302734375, -2.712890625, -2.615478515625, -2.51806640625, -2.420654296875, -2.3232421875, -2.225830078125, -2.12841796875, -2.031005859375, -1.93359375, -1.836181640625, -1.73876953125, -1.641357421875, -1.5439453125, -1.446533203125, -1.34912109375, -1.251708984375, -1.154296875, -1.056884765625, -0.95947265625, -0.862060546875, -0.7646484375, -0.667236328125, -0.56982421875, -0.472412109375, -0.375, -0.277587890625, -0.18017578125, -0.082763671875, 0.0146484375, 0.112060546875, 0.20947265625, 0.306884765625, 0.404296875, 0.501708984375, 0.59912109375, 0.696533203125, 0.7939453125, 0.891357421875, 0.98876953125, 1.086181640625, 1.18359375, 1.281005859375, 1.37841796875, 1.475830078125, 1.5732421875, 1.670654296875, 1.76806640625, 1.865478515625, 1.962890625, 2.060302734375, 2.15771484375, 2.255126953125, 2.3525390625, 2.449951171875, 2.54736328125, 2.644775390625, 2.7421875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 16.0, 20.0, 44.0, 129.0, 431.0, 243.0, 81.0, 28.0, 10.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.804503440856934, -6.6024394035339355, -6.400374889373779, -6.198310852050781, -5.996246814727783, -5.794182777404785, -5.592118263244629, -5.390054225921631, -5.187990188598633, -4.985926151275635, -4.7838616371154785, -4.5817975997924805, -4.379733562469482, -4.177669525146484, -3.975605010986328, -3.77354097366333, -3.571476459503174, -3.3694121837615967, -3.1673481464385986, -2.9652838706970215, -2.7632198333740234, -2.5611555576324463, -2.359091281890869, -2.157027244567871, -1.954962968826294, -1.7528988122940063, -1.5508346557617188, -1.3487703800201416, -1.146706223487854, -0.9446420669555664, -0.7425777912139893, -0.5405136346817017, -0.33844995498657227, -0.13638576865196228, 0.0656784176826477, 0.2677426338195801, 0.4698067903518677, 0.6718709468841553, 0.8739352226257324, 1.07599937915802, 1.2780635356903076, 1.4801276922225952, 1.6821918487548828, 1.88425612449646, 2.086320400238037, 2.288384437561035, 2.4904487133026123, 2.6925129890441895, 2.8945770263671875, 3.0966413021087646, 3.2987053394317627, 3.50076961517334, 3.702833652496338, 3.904897928237915, 4.106962203979492, 4.30902624130249, 4.511090278625488, 4.713154315948486, 4.915218830108643, 5.117282867431641, 5.319346904754639, 5.521410942077637, 5.723475456237793, 5.925539493560791, 6.127604007720947]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 4.0, 5.0, 11.0, 18.0, 13.0, 22.0, 25.0, 33.0, 28.0, 44.0, 30.0, 62.0, 51.0, 33.0, 54.0, 38.0, 66.0, 58.0, 48.0, 46.0, 48.0, 35.0, 48.0, 40.0, 18.0, 21.0, 18.0, 9.0, 12.0, 13.0, 15.0, 7.0, 5.0, 9.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5857336521148682, -1.539997935295105, -1.4942622184753418, -1.448526382446289, -1.4027906656265259, -1.3570549488067627, -1.3113192319869995, -1.2655835151672363, -1.2198477983474731, -1.17411208152771, -1.1283763647079468, -1.0826406478881836, -1.0369048118591309, -0.9911690950393677, -0.9454333782196045, -0.8996976613998413, -0.8539618849754333, -0.8082261681556702, -0.7624903917312622, -0.716754674911499, -0.6710189580917358, -0.6252832412719727, -0.5795474648475647, -0.5338117480278015, -0.48807600140571594, -0.44234025478363037, -0.3966045379638672, -0.3508687913417816, -0.30513304471969604, -0.25939732789993286, -0.2136615812778473, -0.1679258644580841, -0.12219011783599854, -0.07645438611507416, -0.030718646943569183, 0.015017092227935791, 0.06075282394886017, 0.10648855566978455, 0.15222430229187012, 0.1979600191116333, 0.24369576573371887, 0.28943151235580444, 0.3351672291755676, 0.3809029757976532, 0.42663872241973877, 0.47237443923950195, 0.5181101560592651, 0.5638458728790283, 0.6095816493034363, 0.6553173661231995, 0.7010531425476074, 0.7467888593673706, 0.7925245761871338, 0.838260293006897, 0.8839960694313049, 0.9297317862510681, 0.9754675626754761, 1.0212032794952393, 1.0669389963150024, 1.1126747131347656, 1.1584105491638184, 1.2041462659835815, 1.2498819828033447, 1.295617699623108, 1.341353416442871]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 0.0, 4.0, 10.0, 4.0, 9.0, 12.0, 19.0, 16.0, 15.0, 21.0, 24.0, 23.0, 31.0, 37.0, 27.0, 31.0, 31.0, 38.0, 32.0, 52.0, 42.0, 57.0, 49.0, 48.0, 51.0, 44.0, 35.0, 39.0, 15.0, 24.0, 26.0, 22.0, 13.0, 19.0, 19.0, 12.0, 11.0, 10.0, 9.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89697265625, -0.8680572509765625, -0.839141845703125, -0.8102264404296875, -0.78131103515625, -0.7523956298828125, -0.723480224609375, -0.6945648193359375, -0.6656494140625, -0.6367340087890625, -0.607818603515625, -0.5789031982421875, -0.54998779296875, -0.5210723876953125, -0.492156982421875, -0.4632415771484375, -0.434326171875, -0.4054107666015625, -0.376495361328125, -0.3475799560546875, -0.31866455078125, -0.2897491455078125, -0.260833740234375, -0.2319183349609375, -0.2030029296875, -0.1740875244140625, -0.145172119140625, -0.1162567138671875, -0.08734130859375, -0.0584259033203125, -0.029510498046875, -0.0005950927734375, 0.0283203125, 0.0572357177734375, 0.086151123046875, 0.1150665283203125, 0.14398193359375, 0.1728973388671875, 0.201812744140625, 0.2307281494140625, 0.2596435546875, 0.2885589599609375, 0.317474365234375, 0.3463897705078125, 0.37530517578125, 0.4042205810546875, 0.433135986328125, 0.4620513916015625, 0.490966796875, 0.5198822021484375, 0.548797607421875, 0.5777130126953125, 0.60662841796875, 0.6355438232421875, 0.664459228515625, 0.6933746337890625, 0.7222900390625, 0.7512054443359375, 0.780120849609375, 0.8090362548828125, 0.83795166015625, 0.8668670654296875, 0.895782470703125, 0.9246978759765625, 0.95361328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 12.0, 14.0, 28.0, 41.0, 51.0, 75.0, 113.0, 181.0, 233.0, 361.0, 608.0, 917.0, 1413.0, 2222.0, 3779.0, 6946.0, 13770.0, 31347.0, 89323.0, 327926.0, 389574.0, 108639.0, 36866.0, 15361.0, 7689.0, 4245.0, 2541.0, 1480.0, 970.0, 606.0, 417.0, 243.0, 181.0, 125.0, 73.0, 45.0, 46.0, 30.0, 16.0, 15.0, 7.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.449920654296875, -1.40472412109375, -1.359527587890625, -1.3143310546875, -1.269134521484375, -1.22393798828125, -1.178741455078125, -1.133544921875, -1.088348388671875, -1.04315185546875, -0.997955322265625, -0.9527587890625, -0.907562255859375, -0.86236572265625, -0.817169189453125, -0.77197265625, -0.726776123046875, -0.68157958984375, -0.636383056640625, -0.5911865234375, -0.545989990234375, -0.50079345703125, -0.455596923828125, -0.410400390625, -0.365203857421875, -0.32000732421875, -0.274810791015625, -0.2296142578125, -0.184417724609375, -0.13922119140625, -0.094024658203125, -0.048828125, -0.003631591796875, 0.04156494140625, 0.086761474609375, 0.1319580078125, 0.177154541015625, 0.22235107421875, 0.267547607421875, 0.312744140625, 0.357940673828125, 0.40313720703125, 0.448333740234375, 0.4935302734375, 0.538726806640625, 0.58392333984375, 0.629119873046875, 0.67431640625, 0.719512939453125, 0.76470947265625, 0.809906005859375, 0.8551025390625, 0.900299072265625, 0.94549560546875, 0.990692138671875, 1.035888671875, 1.081085205078125, 1.12628173828125, 1.171478271484375, 1.2166748046875, 1.261871337890625, 1.30706787109375, 1.352264404296875, 1.3974609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 2.0, 10.0, 14.0, 10.0, 16.0, 17.0, 23.0, 17.0, 29.0, 29.0, 24.0, 37.0, 33.0, 39.0, 56.0, 52.0, 80.0, 103.0, 230.0, 1429.0, 194.0, 104.0, 64.0, 67.0, 44.0, 35.0, 48.0, 32.0, 34.0, 33.0, 22.0, 21.0, 17.0, 15.0, 10.0, 7.0, 13.0, 6.0, 6.0, 11.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.443359375, -3.3404541015625, -3.237548828125, -3.1346435546875, -3.03173828125, -2.9288330078125, -2.825927734375, -2.7230224609375, -2.6201171875, -2.5172119140625, -2.414306640625, -2.3114013671875, -2.20849609375, -2.1055908203125, -2.002685546875, -1.8997802734375, -1.796875, -1.6939697265625, -1.591064453125, -1.4881591796875, -1.38525390625, -1.2823486328125, -1.179443359375, -1.0765380859375, -0.9736328125, -0.8707275390625, -0.767822265625, -0.6649169921875, -0.56201171875, -0.4591064453125, -0.356201171875, -0.2532958984375, -0.150390625, -0.0474853515625, 0.055419921875, 0.1583251953125, 0.26123046875, 0.3641357421875, 0.467041015625, 0.5699462890625, 0.6728515625, 0.7757568359375, 0.878662109375, 0.9815673828125, 1.08447265625, 1.1873779296875, 1.290283203125, 1.3931884765625, 1.49609375, 1.5989990234375, 1.701904296875, 1.8048095703125, 1.90771484375, 2.0106201171875, 2.113525390625, 2.2164306640625, 2.3193359375, 2.4222412109375, 2.525146484375, 2.6280517578125, 2.73095703125, 2.8338623046875, 2.936767578125, 3.0396728515625, 3.142578125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 10.0, 12.0, 11.0, 16.0, 29.0, 32.0, 50.0, 87.0, 175.0, 218.0, 478.0, 933.0, 2067.0, 5096.0, 13941.0, 57559.0, 1167102.0, 1800036.0, 71611.0, 16121.0, 5619.0, 2255.0, 1040.0, 485.0, 244.0, 170.0, 105.0, 73.0, 42.0, 28.0, 19.0, 22.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.955078125, -3.797210693359375, -3.63934326171875, -3.481475830078125, -3.3236083984375, -3.165740966796875, -3.00787353515625, -2.850006103515625, -2.692138671875, -2.534271240234375, -2.37640380859375, -2.218536376953125, -2.0606689453125, -1.902801513671875, -1.74493408203125, -1.587066650390625, -1.42919921875, -1.271331787109375, -1.11346435546875, -0.955596923828125, -0.7977294921875, -0.639862060546875, -0.48199462890625, -0.324127197265625, -0.166259765625, -0.008392333984375, 0.14947509765625, 0.307342529296875, 0.4652099609375, 0.623077392578125, 0.78094482421875, 0.938812255859375, 1.0966796875, 1.254547119140625, 1.41241455078125, 1.570281982421875, 1.7281494140625, 1.886016845703125, 2.04388427734375, 2.201751708984375, 2.359619140625, 2.517486572265625, 2.67535400390625, 2.833221435546875, 2.9910888671875, 3.148956298828125, 3.30682373046875, 3.464691162109375, 3.62255859375, 3.780426025390625, 3.93829345703125, 4.096160888671875, 4.2540283203125, 4.411895751953125, 4.56976318359375, 4.727630615234375, 4.885498046875, 5.043365478515625, 5.20123291015625, 5.359100341796875, 5.5169677734375, 5.674835205078125, 5.83270263671875, 5.990570068359375, 6.1484375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 237.0, 698.0, 69.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.47452735900879, -15.380653381347656, -13.286779403686523, -11.192906379699707, -9.099032402038574, -7.005158424377441, -4.911285400390625, -2.817411422729492, -0.7235374450683594, 1.3703362941741943, 3.464210033416748, 5.558083534240723, 7.6519575119018555, 9.745831489562988, 11.839704513549805, 13.933578491210938, 16.02745246887207, 18.121326446533203, 20.215200424194336, 22.30907440185547, 24.40294647216797, 26.496822357177734, 28.590694427490234, 30.684568405151367, 32.7784423828125, 34.872314453125, 36.966190338134766, 39.060062408447266, 41.15393829345703, 43.24781036376953, 45.34168243408203, 47.4355583190918, 49.52942657470703, 51.62329864501953, 53.7171745300293, 55.8110466003418, 57.90492248535156, 59.99879455566406, 62.09266662597656, 64.18653869628906, 66.2804183959961, 68.3742904663086, 70.4681625366211, 72.56204223632812, 74.65591430664062, 76.74978637695312, 78.84365844726562, 80.93753051757812, 83.03140258789062, 85.12527465820312, 87.21914672851562, 89.31302642822266, 91.40689849853516, 93.50077056884766, 95.59464263916016, 97.68852233886719, 99.78239440917969, 101.87626647949219, 103.97013854980469, 106.06401824951172, 108.15789031982422, 110.25176239013672, 112.34563446044922, 114.43951416015625, 116.53338623046875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 4.0, 1.0, 7.0, 3.0, 2.0, 11.0, 6.0, 15.0, 14.0, 14.0, 14.0, 21.0, 18.0, 31.0, 28.0, 28.0, 22.0, 26.0, 38.0, 37.0, 33.0, 33.0, 50.0, 44.0, 37.0, 31.0, 30.0, 27.0, 27.0, 39.0, 29.0, 34.0, 25.0, 28.0, 29.0, 23.0, 17.0, 19.0, 12.0, 10.0, 11.0, 7.0, 18.0, 8.0, 6.0, 8.0, 3.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.972294807434082, -9.66366958618164, -9.355045318603516, -9.046420097351074, -8.737794876098633, -8.429170608520508, -8.120545387268066, -7.811920642852783, -7.5032958984375, -7.194671154022217, -6.886046409606934, -6.577421188354492, -6.268796443939209, -5.960171699523926, -5.651546478271484, -5.342921733856201, -5.034296989440918, -4.725672245025635, -4.417047500610352, -4.10842227935791, -3.799797534942627, -3.4911727905273438, -3.1825478076934814, -2.873922824859619, -2.565298080444336, -2.2566733360290527, -1.9480483531951904, -1.6394234895706177, -1.330798625946045, -1.0221737623214722, -0.7135488986968994, -0.4049239158630371, -0.09630012512207031, 0.21232473850250244, 0.5209496021270752, 0.829574465751648, 1.1381993293762207, 1.4468241930007935, 1.7554490566253662, 2.0640740394592285, 2.3726987838745117, 2.681323528289795, 2.9899485111236572, 3.2985734939575195, 3.6071982383728027, 3.915822982788086, 4.224448204040527, 4.5330729484558105, 4.841697692871094, 5.150322437286377, 5.45894718170166, 5.767572402954102, 6.076197147369385, 6.384821891784668, 6.693447113037109, 7.002071857452393, 7.310696601867676, 7.619321346282959, 7.927946090698242, 8.236571311950684, 8.545196533203125, 8.85382080078125, 9.162446022033691, 9.471071243286133, 9.779695510864258]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 16.0, 17.0, 20.0, 16.0, 15.0, 29.0, 31.0, 26.0, 31.0, 35.0, 44.0, 34.0, 32.0, 48.0, 45.0, 37.0, 46.0, 40.0, 54.0, 42.0, 34.0, 33.0, 29.0, 29.0, 25.0, 20.0, 14.0, 23.0, 22.0, 7.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.89208984375, -0.8633270263671875, -0.834564208984375, -0.8058013916015625, -0.77703857421875, -0.7482757568359375, -0.719512939453125, -0.6907501220703125, -0.6619873046875, -0.6332244873046875, -0.604461669921875, -0.5756988525390625, -0.54693603515625, -0.5181732177734375, -0.489410400390625, -0.4606475830078125, -0.431884765625, -0.4031219482421875, -0.374359130859375, -0.3455963134765625, -0.31683349609375, -0.2880706787109375, -0.259307861328125, -0.2305450439453125, -0.2017822265625, -0.1730194091796875, -0.144256591796875, -0.1154937744140625, -0.08673095703125, -0.0579681396484375, -0.029205322265625, -0.0004425048828125, 0.0283203125, 0.0570831298828125, 0.085845947265625, 0.1146087646484375, 0.14337158203125, 0.1721343994140625, 0.200897216796875, 0.2296600341796875, 0.2584228515625, 0.2871856689453125, 0.315948486328125, 0.3447113037109375, 0.37347412109375, 0.4022369384765625, 0.430999755859375, 0.4597625732421875, 0.488525390625, 0.5172882080078125, 0.546051025390625, 0.5748138427734375, 0.60357666015625, 0.6323394775390625, 0.661102294921875, 0.6898651123046875, 0.7186279296875, 0.7473907470703125, 0.776153564453125, 0.8049163818359375, 0.83367919921875, 0.8624420166015625, 0.891204833984375, 0.9199676513671875, 0.94873046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 3.0, 10.0, 10.0, 19.0, 27.0, 39.0, 52.0, 72.0, 149.0, 170.0, 297.0, 440.0, 748.0, 1189.0, 1945.0, 3506.0, 6274.0, 11672.0, 23980.0, 56294.0, 208923.0, 1593136.0, 1908752.0, 258490.0, 64149.0, 25703.0, 12244.0, 6603.0, 3783.0, 2063.0, 1304.0, 769.0, 525.0, 315.0, 186.0, 147.0, 98.0, 58.0, 40.0, 29.0, 18.0, 17.0, 11.0, 10.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.09844970703125, -2.0308837890625, -1.96331787109375, -1.895751953125, -1.82818603515625, -1.7606201171875, -1.69305419921875, -1.62548828125, -1.55792236328125, -1.4903564453125, -1.42279052734375, -1.355224609375, -1.28765869140625, -1.2200927734375, -1.15252685546875, -1.0849609375, -1.01739501953125, -0.9498291015625, -0.88226318359375, -0.814697265625, -0.74713134765625, -0.6795654296875, -0.61199951171875, -0.54443359375, -0.47686767578125, -0.4093017578125, -0.34173583984375, -0.274169921875, -0.20660400390625, -0.1390380859375, -0.07147216796875, -0.00390625, 0.06365966796875, 0.1312255859375, 0.19879150390625, 0.266357421875, 0.33392333984375, 0.4014892578125, 0.46905517578125, 0.53662109375, 0.60418701171875, 0.6717529296875, 0.73931884765625, 0.806884765625, 0.87445068359375, 0.9420166015625, 1.00958251953125, 1.0771484375, 1.14471435546875, 1.2122802734375, 1.27984619140625, 1.347412109375, 1.41497802734375, 1.4825439453125, 1.55010986328125, 1.61767578125, 1.68524169921875, 1.7528076171875, 1.82037353515625, 1.887939453125, 1.95550537109375, 2.0230712890625, 2.09063720703125, 2.158203125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 8.0, 14.0, 17.0, 24.0, 34.0, 36.0, 39.0, 53.0, 60.0, 94.0, 125.0, 157.0, 227.0, 297.0, 422.0, 462.0, 481.0, 386.0, 241.0, 194.0, 148.0, 117.0, 83.0, 67.0, 61.0, 51.0, 26.0, 24.0, 27.0, 16.0, 7.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9228515625, -1.8535919189453125, -1.784332275390625, -1.7150726318359375, -1.64581298828125, -1.5765533447265625, -1.507293701171875, -1.4380340576171875, -1.3687744140625, -1.2995147705078125, -1.230255126953125, -1.1609954833984375, -1.09173583984375, -1.0224761962890625, -0.953216552734375, -0.8839569091796875, -0.814697265625, -0.7454376220703125, -0.676177978515625, -0.6069183349609375, -0.53765869140625, -0.4683990478515625, -0.399139404296875, -0.3298797607421875, -0.2606201171875, -0.1913604736328125, -0.122100830078125, -0.0528411865234375, 0.01641845703125, 0.0856781005859375, 0.154937744140625, 0.2241973876953125, 0.29345703125, 0.3627166748046875, 0.431976318359375, 0.5012359619140625, 0.57049560546875, 0.6397552490234375, 0.709014892578125, 0.7782745361328125, 0.8475341796875, 0.9167938232421875, 0.986053466796875, 1.0553131103515625, 1.12457275390625, 1.1938323974609375, 1.263092041015625, 1.3323516845703125, 1.401611328125, 1.4708709716796875, 1.540130615234375, 1.6093902587890625, 1.67864990234375, 1.7479095458984375, 1.817169189453125, 1.8864288330078125, 1.9556884765625, 2.0249481201171875, 2.094207763671875, 2.1634674072265625, 2.23272705078125, 2.3019866943359375, 2.371246337890625, 2.4405059814453125, 2.509765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 12.0, 28.0, 37.0, 45.0, 57.0, 115.0, 142.0, 238.0, 344.0, 588.0, 885.0, 1455.0, 2413.0, 4178.0, 7796.0, 14583.0, 30127.0, 67535.0, 179436.0, 688019.0, 2230790.0, 661475.0, 176247.0, 66039.0, 29367.0, 14375.0, 7553.0, 4124.0, 2400.0, 1408.0, 903.0, 560.0, 351.0, 199.0, 146.0, 109.0, 71.0, 42.0, 31.0, 16.0, 17.0, 9.0, 6.0, 4.0, 2.0, 2.0], "bins": [-3.423828125, -3.334869384765625, -3.24591064453125, -3.156951904296875, -3.0679931640625, -2.979034423828125, -2.89007568359375, -2.801116943359375, -2.712158203125, -2.623199462890625, -2.53424072265625, -2.445281982421875, -2.3563232421875, -2.267364501953125, -2.17840576171875, -2.089447021484375, -2.00048828125, -1.911529541015625, -1.82257080078125, -1.733612060546875, -1.6446533203125, -1.555694580078125, -1.46673583984375, -1.377777099609375, -1.288818359375, -1.199859619140625, -1.11090087890625, -1.021942138671875, -0.9329833984375, -0.844024658203125, -0.75506591796875, -0.666107177734375, -0.5771484375, -0.488189697265625, -0.39923095703125, -0.310272216796875, -0.2213134765625, -0.132354736328125, -0.04339599609375, 0.045562744140625, 0.134521484375, 0.223480224609375, 0.31243896484375, 0.401397705078125, 0.4903564453125, 0.579315185546875, 0.66827392578125, 0.757232666015625, 0.84619140625, 0.935150146484375, 1.02410888671875, 1.113067626953125, 1.2020263671875, 1.290985107421875, 1.37994384765625, 1.468902587890625, 1.557861328125, 1.646820068359375, 1.73577880859375, 1.824737548828125, 1.9136962890625, 2.002655029296875, 2.09161376953125, 2.180572509765625, 2.26953125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 23.0, 20.0, 41.0, 68.0, 82.0, 125.0, 119.0, 123.0, 120.0, 73.0, 49.0, 58.0, 36.0, 18.0, 15.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.158880233764648, -9.64907455444336, -9.13926887512207, -8.629462242126465, -8.119656562805176, -7.609850883483887, -7.1000447273254395, -6.590238571166992, -6.080432891845703, -5.570627212524414, -5.060821056365967, -4.5510149002075195, -4.0412092208862305, -3.5314033031463623, -3.021597385406494, -2.511791467666626, -2.001985549926758, -1.4921796321868896, -0.9823737144470215, -0.4725677967071533, 0.037238121032714844, 0.547044038772583, 1.0568499565124512, 1.5666558742523193, 2.0764617919921875, 2.5862677097320557, 3.096073627471924, 3.605879545211792, 4.11568546295166, 4.625491142272949, 5.1352972984313965, 5.645103454589844, 6.154909133911133, 6.664714813232422, 7.174520969390869, 7.684327125549316, 8.194132804870605, 8.703938484191895, 9.2137451171875, 9.723550796508789, 10.233356475830078, 10.743162155151367, 11.252967834472656, 11.762774467468262, 12.27258014678955, 12.78238582611084, 13.292192459106445, 13.801998138427734, 14.311803817749023, 14.821609497070312, 15.331415176391602, 15.841221809387207, 16.351028442382812, 16.8608341217041, 17.37063980102539, 17.88044548034668, 18.39025115966797, 18.900056838989258, 19.409862518310547, 19.919668197631836, 20.429473876953125, 20.939281463623047, 21.449087142944336, 21.958892822265625, 22.468698501586914]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 7.0, 5.0, 7.0, 4.0, 18.0, 15.0, 11.0, 13.0, 21.0, 21.0, 27.0, 20.0, 31.0, 35.0, 34.0, 26.0, 34.0, 30.0, 43.0, 35.0, 46.0, 48.0, 40.0, 36.0, 37.0, 37.0, 34.0, 31.0, 29.0, 24.0, 36.0, 25.0, 24.0, 19.0, 17.0, 12.0, 13.0, 11.0, 10.0, 13.0, 12.0, 3.0, 2.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.297189712524414, -8.033828735351562, -7.7704668045043945, -7.507105350494385, -7.243743896484375, -6.980382442474365, -6.7170209884643555, -6.453659534454346, -6.190298080444336, -5.926936626434326, -5.663575172424316, -5.400213718414307, -5.136852264404297, -4.873490810394287, -4.610129356384277, -4.346767902374268, -4.083406448364258, -3.820044994354248, -3.5566835403442383, -3.2933220863342285, -3.0299606323242188, -2.766599178314209, -2.503237724304199, -2.2398762702941895, -1.9765148162841797, -1.71315336227417, -1.4497919082641602, -1.1864304542541504, -0.9230690002441406, -0.6597075462341309, -0.3963460922241211, -0.13298463821411133, 0.13037681579589844, 0.3937382698059082, 0.657099723815918, 0.9204611778259277, 1.1838226318359375, 1.4471840858459473, 1.710545539855957, 1.9739069938659668, 2.2372684478759766, 2.5006299018859863, 2.763991355895996, 3.027352809906006, 3.2907142639160156, 3.5540757179260254, 3.817437171936035, 4.080798625946045, 4.344160079956055, 4.6075215339660645, 4.870882987976074, 5.134244441986084, 5.397605895996094, 5.6609673500061035, 5.924328804016113, 6.187690258026123, 6.451051712036133, 6.714413166046143, 6.977774620056152, 7.241136074066162, 7.504497528076172, 7.767858982086182, 8.031220436096191, 8.29458236694336, 8.557943344116211]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 18.0, 18.0, 22.0, 23.0, 32.0, 19.0, 44.0, 32.0, 47.0, 38.0, 52.0, 43.0, 51.0, 28.0, 50.0, 45.0, 46.0, 39.0, 35.0, 44.0, 34.0, 27.0, 33.0, 16.0, 15.0, 20.0, 17.0, 11.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.92041015625, -0.8886947631835938, -0.8569793701171875, -0.8252639770507812, -0.793548583984375, -0.7618331909179688, -0.7301177978515625, -0.6984024047851562, -0.66668701171875, -0.6349716186523438, -0.6032562255859375, -0.5715408325195312, -0.539825439453125, -0.5081100463867188, -0.4763946533203125, -0.44467926025390625, -0.4129638671875, -0.38124847412109375, -0.3495330810546875, -0.31781768798828125, -0.286102294921875, -0.25438690185546875, -0.2226715087890625, -0.19095611572265625, -0.15924072265625, -0.12752532958984375, -0.0958099365234375, -0.06409454345703125, -0.032379150390625, -0.00066375732421875, 0.0310516357421875, 0.06276702880859375, 0.094482421875, 0.12619781494140625, 0.1579132080078125, 0.18962860107421875, 0.221343994140625, 0.25305938720703125, 0.2847747802734375, 0.31649017333984375, 0.34820556640625, 0.37992095947265625, 0.4116363525390625, 0.44335174560546875, 0.475067138671875, 0.5067825317382812, 0.5384979248046875, 0.5702133178710938, 0.6019287109375, 0.6336441040039062, 0.6653594970703125, 0.6970748901367188, 0.728790283203125, 0.7605056762695312, 0.7922210693359375, 0.8239364624023438, 0.85565185546875, 0.8873672485351562, 0.9190826416015625, 0.9507980346679688, 0.982513427734375, 1.0142288208007812, 1.0459442138671875, 1.0776596069335938, 1.109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 7.0, 7.0, 10.0, 23.0, 37.0, 56.0, 85.0, 135.0, 198.0, 258.0, 420.0, 667.0, 959.0, 1429.0, 2127.0, 3114.0, 4687.0, 6912.0, 10416.0, 15600.0, 23313.0, 34231.0, 48904.0, 69049.0, 91918.0, 114413.0, 127329.0, 122600.0, 103637.0, 80122.0, 58694.0, 40957.0, 28154.0, 19317.0, 12832.0, 8631.0, 5709.0, 3852.0, 2520.0, 1745.0, 1216.0, 798.0, 546.0, 329.0, 222.0, 131.0, 85.0, 55.0, 33.0, 29.0, 16.0, 14.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62158203125, -0.6013717651367188, -0.5811614990234375, -0.5609512329101562, -0.540740966796875, -0.5205307006835938, -0.5003204345703125, -0.48011016845703125, -0.45989990234375, -0.43968963623046875, -0.4194793701171875, -0.39926910400390625, -0.379058837890625, -0.35884857177734375, -0.3386383056640625, -0.31842803955078125, -0.2982177734375, -0.27800750732421875, -0.2577972412109375, -0.23758697509765625, -0.217376708984375, -0.19716644287109375, -0.1769561767578125, -0.15674591064453125, -0.13653564453125, -0.11632537841796875, -0.0961151123046875, -0.07590484619140625, -0.055694580078125, -0.03548431396484375, -0.0152740478515625, 0.00493621826171875, 0.025146484375, 0.04535675048828125, 0.0655670166015625, 0.08577728271484375, 0.105987548828125, 0.12619781494140625, 0.1464080810546875, 0.16661834716796875, 0.18682861328125, 0.20703887939453125, 0.2272491455078125, 0.24745941162109375, 0.267669677734375, 0.28787994384765625, 0.3080902099609375, 0.32830047607421875, 0.3485107421875, 0.36872100830078125, 0.3889312744140625, 0.40914154052734375, 0.429351806640625, 0.44956207275390625, 0.4697723388671875, 0.48998260498046875, 0.51019287109375, 0.5304031372070312, 0.5506134033203125, 0.5708236694335938, 0.591033935546875, 0.6112442016601562, 0.6314544677734375, 0.6516647338867188, 0.671875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 3.0, 4.0, 13.0, 10.0, 14.0, 16.0, 13.0, 24.0, 23.0, 29.0, 25.0, 30.0, 32.0, 33.0, 41.0, 40.0, 43.0, 41.0, 44.0, 1075.0, 38.0, 43.0, 43.0, 35.0, 46.0, 25.0, 38.0, 21.0, 23.0, 32.0, 27.0, 16.0, 10.0, 14.0, 15.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0751953125, -1.0427398681640625, -1.010284423828125, -0.9778289794921875, -0.94537353515625, -0.9129180908203125, -0.880462646484375, -0.8480072021484375, -0.8155517578125, -0.7830963134765625, -0.750640869140625, -0.7181854248046875, -0.68572998046875, -0.6532745361328125, -0.620819091796875, -0.5883636474609375, -0.555908203125, -0.5234527587890625, -0.490997314453125, -0.4585418701171875, -0.42608642578125, -0.3936309814453125, -0.361175537109375, -0.3287200927734375, -0.2962646484375, -0.2638092041015625, -0.231353759765625, -0.1988983154296875, -0.16644287109375, -0.1339874267578125, -0.101531982421875, -0.0690765380859375, -0.03662109375, -0.0041656494140625, 0.028289794921875, 0.0607452392578125, 0.09320068359375, 0.1256561279296875, 0.158111572265625, 0.1905670166015625, 0.2230224609375, 0.2554779052734375, 0.287933349609375, 0.3203887939453125, 0.35284423828125, 0.3852996826171875, 0.417755126953125, 0.4502105712890625, 0.482666015625, 0.5151214599609375, 0.547576904296875, 0.5800323486328125, 0.61248779296875, 0.6449432373046875, 0.677398681640625, 0.7098541259765625, 0.7423095703125, 0.7747650146484375, 0.807220458984375, 0.8396759033203125, 0.87213134765625, 0.9045867919921875, 0.937042236328125, 0.9694976806640625, 1.001953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 18.0, 8.0, 19.0, 17.0, 27.0, 38.0, 58.0, 75.0, 133.0, 176.0, 269.0, 395.0, 554.0, 787.0, 1112.0, 1637.0, 2394.0, 3290.0, 4898.0, 7296.0, 10887.0, 16828.0, 30406.0, 97177.0, 1360538.0, 428095.0, 61016.0, 24392.0, 14692.0, 9414.0, 6463.0, 4323.0, 2975.0, 1984.0, 1421.0, 1054.0, 680.0, 472.0, 319.0, 246.0, 162.0, 114.0, 89.0, 56.0, 42.0, 31.0, 18.0, 11.0, 9.0, 6.0, 8.0, 0.0, 0.0, 6.0, 1.0, 2.0], "bins": [-0.9150390625, -0.887176513671875, -0.85931396484375, -0.831451416015625, -0.8035888671875, -0.775726318359375, -0.74786376953125, -0.720001220703125, -0.692138671875, -0.664276123046875, -0.63641357421875, -0.608551025390625, -0.5806884765625, -0.552825927734375, -0.52496337890625, -0.497100830078125, -0.46923828125, -0.441375732421875, -0.41351318359375, -0.385650634765625, -0.3577880859375, -0.329925537109375, -0.30206298828125, -0.274200439453125, -0.246337890625, -0.218475341796875, -0.19061279296875, -0.162750244140625, -0.1348876953125, -0.107025146484375, -0.07916259765625, -0.051300048828125, -0.0234375, 0.004425048828125, 0.03228759765625, 0.060150146484375, 0.0880126953125, 0.115875244140625, 0.14373779296875, 0.171600341796875, 0.199462890625, 0.227325439453125, 0.25518798828125, 0.283050537109375, 0.3109130859375, 0.338775634765625, 0.36663818359375, 0.394500732421875, 0.42236328125, 0.450225830078125, 0.47808837890625, 0.505950927734375, 0.5338134765625, 0.561676025390625, 0.58953857421875, 0.617401123046875, 0.645263671875, 0.673126220703125, 0.70098876953125, 0.728851318359375, 0.7567138671875, 0.784576416015625, 0.81243896484375, 0.840301513671875, 0.8681640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 3.0, 2.0, 10.0, 8.0, 9.0, 15.0, 16.0, 19.0, 24.0, 24.0, 17.0, 29.0, 30.0, 40.0, 39.0, 52.0, 44.0, 51.0, 62.0, 50.0, 49.0, 57.0, 38.0, 51.0, 35.0, 28.0, 32.0, 27.0, 23.0, 17.0, 19.0, 14.0, 8.0, 3.0, 11.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.096923828125, -0.09407997131347656, -0.09123611450195312, -0.08839225769042969, -0.08554840087890625, -0.08270454406738281, -0.07986068725585938, -0.07701683044433594, -0.0741729736328125, -0.07132911682128906, -0.06848526000976562, -0.06564140319824219, -0.06279754638671875, -0.05995368957519531, -0.057109832763671875, -0.05426597595214844, -0.051422119140625, -0.04857826232910156, -0.045734405517578125, -0.04289054870605469, -0.04004669189453125, -0.03720283508300781, -0.034358978271484375, -0.03151512145996094, -0.0286712646484375, -0.025827407836914062, -0.022983551025390625, -0.020139694213867188, -0.01729583740234375, -0.014451980590820312, -0.011608123779296875, -0.008764266967773438, -0.00592041015625, -0.0030765533447265625, -0.000232696533203125, 0.0026111602783203125, 0.00545501708984375, 0.008298873901367188, 0.011142730712890625, 0.013986587524414062, 0.0168304443359375, 0.019674301147460938, 0.022518157958984375, 0.025362014770507812, 0.02820587158203125, 0.031049728393554688, 0.033893585205078125, 0.03673744201660156, 0.039581298828125, 0.04242515563964844, 0.045269012451171875, 0.04811286926269531, 0.05095672607421875, 0.05380058288574219, 0.056644439697265625, 0.05948829650878906, 0.0623321533203125, 0.06517601013183594, 0.06801986694335938, 0.07086372375488281, 0.07370758056640625, 0.07655143737792969, 0.07939529418945312, 0.08223915100097656, 0.0850830078125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 4.0, 4.0, 10.0, 11.0, 18.0, 20.0, 36.0, 50.0, 69.0, 86.0, 139.0, 225.0, 307.0, 874.0, 7375.0, 373159.0, 652254.0, 11751.0, 1052.0, 403.0, 211.0, 151.0, 92.0, 64.0, 51.0, 23.0, 31.0, 22.0, 15.0, 7.0, 12.0, 8.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5576171875, -1.50213623046875, -1.4466552734375, -1.39117431640625, -1.335693359375, -1.28021240234375, -1.2247314453125, -1.16925048828125, -1.11376953125, -1.05828857421875, -1.0028076171875, -0.94732666015625, -0.891845703125, -0.83636474609375, -0.7808837890625, -0.72540283203125, -0.669921875, -0.61444091796875, -0.5589599609375, -0.50347900390625, -0.447998046875, -0.39251708984375, -0.3370361328125, -0.28155517578125, -0.22607421875, -0.17059326171875, -0.1151123046875, -0.05963134765625, -0.004150390625, 0.05133056640625, 0.1068115234375, 0.16229248046875, 0.2177734375, 0.27325439453125, 0.3287353515625, 0.38421630859375, 0.439697265625, 0.49517822265625, 0.5506591796875, 0.60614013671875, 0.66162109375, 0.71710205078125, 0.7725830078125, 0.82806396484375, 0.883544921875, 0.93902587890625, 0.9945068359375, 1.04998779296875, 1.10546875, 1.16094970703125, 1.2164306640625, 1.27191162109375, 1.327392578125, 1.38287353515625, 1.4383544921875, 1.49383544921875, 1.54931640625, 1.60479736328125, 1.6602783203125, 1.71575927734375, 1.771240234375, 1.82672119140625, 1.8822021484375, 1.93768310546875, 1.9931640625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 28.0, 78.0, 281.0, 417.0, 146.0, 45.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.656111478805542, -3.5602521896362305, -3.464393138885498, -3.3685338497161865, -3.272674560546875, -3.1768155097961426, -3.080956220626831, -2.9850969314575195, -2.889237880706787, -2.7933785915374756, -2.697519540786743, -2.6016602516174316, -2.50580096244812, -2.4099416732788086, -2.314082622528076, -2.2182233333587646, -2.122364044189453, -2.0265047550201416, -1.9306455850601196, -1.8347864151000977, -1.7389271259307861, -1.6430679559707642, -1.5472087860107422, -1.4513494968414307, -1.3554903268814087, -1.2596311569213867, -1.1637718677520752, -1.0679126977920532, -0.9720534682273865, -0.8761942386627197, -0.7803350687026978, -0.684475839138031, -0.5886166095733643, -0.4927573800086975, -0.39689818024635315, -0.3010389804840088, -0.20517975091934204, -0.10932052135467529, -0.01346135139465332, 0.08239787817001343, 0.17825710773468018, 0.2741163372993469, 0.3699755370616913, 0.46583473682403564, 0.5616939663887024, 0.6575531959533691, 0.7534123659133911, 0.8492715954780579, 0.9451308250427246, 1.0409899950027466, 1.136849284172058, 1.23270845413208, 1.3285677433013916, 1.4244269132614136, 1.5202860832214355, 1.616145372390747, 1.712004542350769, 1.807863712310791, 1.9037230014801025, 1.9995821714401245, 2.0954413414001465, 2.191300630569458, 2.2871599197387695, 2.383018970489502, 2.4788782596588135]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 4.0, 12.0, 6.0, 9.0, 18.0, 14.0, 13.0, 16.0, 23.0, 24.0, 32.0, 28.0, 34.0, 30.0, 40.0, 42.0, 45.0, 55.0, 43.0, 40.0, 43.0, 35.0, 31.0, 35.0, 33.0, 32.0, 37.0, 23.0, 31.0, 33.0, 18.0, 20.0, 15.0, 15.0, 8.0, 11.0, 9.0, 6.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.5994930267333984, -0.582394540309906, -0.5652959942817688, -0.5481975078582764, -0.5310989618301392, -0.5140004754066467, -0.4969019591808319, -0.4798034429550171, -0.46270492672920227, -0.44560641050338745, -0.42850789427757263, -0.4114093780517578, -0.3943108916282654, -0.3772123456001282, -0.36011385917663574, -0.3430153429508209, -0.3259168267250061, -0.3088183104991913, -0.29171979427337646, -0.27462127804756165, -0.2575227618217468, -0.2404242604970932, -0.22332575917243958, -0.20622724294662476, -0.18912872672080994, -0.17203021049499512, -0.1549316942691803, -0.13783319294452667, -0.12073467671871185, -0.10363616049289703, -0.08653765171766281, -0.06943914294242859, -0.05234062671661377, -0.03524211421608925, -0.018143601715564728, -0.001045089215040207, 0.016053423285484314, 0.03315193951129913, 0.050250448286533356, 0.06734895706176758, 0.0844474732875824, 0.10154598951339722, 0.11864449828863144, 0.13574300706386566, 0.15284152328968048, 0.1699400395154953, 0.18703854084014893, 0.20413705706596375, 0.22123557329177856, 0.23833408951759338, 0.2554326057434082, 0.272531121969223, 0.28962963819503784, 0.3067281246185303, 0.3238266408443451, 0.3409251570701599, 0.35802367329597473, 0.37512218952178955, 0.39222070574760437, 0.4093192219734192, 0.4264177083969116, 0.44351625442504883, 0.46061474084854126, 0.4777132570743561, 0.4948117733001709]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 7.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 13.0, 20.0, 30.0, 19.0, 31.0, 21.0, 37.0, 34.0, 37.0, 41.0, 32.0, 49.0, 43.0, 41.0, 47.0, 49.0, 40.0, 40.0, 45.0, 49.0, 40.0, 33.0, 44.0, 21.0, 16.0, 22.0, 15.0, 10.0, 8.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96875, -0.9354248046875, -0.902099609375, -0.8687744140625, -0.83544921875, -0.8021240234375, -0.768798828125, -0.7354736328125, -0.7021484375, -0.6688232421875, -0.635498046875, -0.6021728515625, -0.56884765625, -0.5355224609375, -0.502197265625, -0.4688720703125, -0.435546875, -0.4022216796875, -0.368896484375, -0.3355712890625, -0.30224609375, -0.2689208984375, -0.235595703125, -0.2022705078125, -0.1689453125, -0.1356201171875, -0.102294921875, -0.0689697265625, -0.03564453125, -0.0023193359375, 0.031005859375, 0.0643310546875, 0.09765625, 0.1309814453125, 0.164306640625, 0.1976318359375, 0.23095703125, 0.2642822265625, 0.297607421875, 0.3309326171875, 0.3642578125, 0.3975830078125, 0.430908203125, 0.4642333984375, 0.49755859375, 0.5308837890625, 0.564208984375, 0.5975341796875, 0.630859375, 0.6641845703125, 0.697509765625, 0.7308349609375, 0.76416015625, 0.7974853515625, 0.830810546875, 0.8641357421875, 0.8974609375, 0.9307861328125, 0.964111328125, 0.9974365234375, 1.03076171875, 1.0640869140625, 1.097412109375, 1.1307373046875, 1.1640625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 13.0, 19.0, 25.0, 50.0, 55.0, 103.0, 157.0, 221.0, 357.0, 596.0, 992.0, 1591.0, 2735.0, 5050.0, 9717.0, 23035.0, 67715.0, 257324.0, 463169.0, 142015.0, 41156.0, 15790.0, 7183.0, 3918.0, 2208.0, 1223.0, 798.0, 483.0, 289.0, 193.0, 112.0, 87.0, 55.0, 35.0, 24.0, 14.0, 15.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5534210205078125, -1.496490478515625, -1.4395599365234375, -1.38262939453125, -1.3256988525390625, -1.268768310546875, -1.2118377685546875, -1.1549072265625, -1.0979766845703125, -1.041046142578125, -0.9841156005859375, -0.92718505859375, -0.8702545166015625, -0.813323974609375, -0.7563934326171875, -0.699462890625, -0.6425323486328125, -0.585601806640625, -0.5286712646484375, -0.47174072265625, -0.4148101806640625, -0.357879638671875, -0.3009490966796875, -0.2440185546875, -0.1870880126953125, -0.130157470703125, -0.0732269287109375, -0.01629638671875, 0.0406341552734375, 0.097564697265625, 0.1544952392578125, 0.21142578125, 0.2683563232421875, 0.325286865234375, 0.3822174072265625, 0.43914794921875, 0.4960784912109375, 0.553009033203125, 0.6099395751953125, 0.6668701171875, 0.7238006591796875, 0.780731201171875, 0.8376617431640625, 0.89459228515625, 0.9515228271484375, 1.008453369140625, 1.0653839111328125, 1.122314453125, 1.1792449951171875, 1.236175537109375, 1.2931060791015625, 1.35003662109375, 1.4069671630859375, 1.463897705078125, 1.5208282470703125, 1.5777587890625, 1.6346893310546875, 1.691619873046875, 1.7485504150390625, 1.80548095703125, 1.8624114990234375, 1.919342041015625, 1.9762725830078125, 2.033203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 10.0, 13.0, 11.0, 13.0, 25.0, 28.0, 12.0, 32.0, 20.0, 36.0, 30.0, 31.0, 50.0, 64.0, 78.0, 143.0, 239.0, 1362.0, 196.0, 147.0, 73.0, 59.0, 44.0, 50.0, 45.0, 26.0, 30.0, 23.0, 16.0, 16.0, 15.0, 16.0, 12.0, 13.0, 7.0, 9.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.625, -3.516693115234375, -3.40838623046875, -3.300079345703125, -3.1917724609375, -3.083465576171875, -2.97515869140625, -2.866851806640625, -2.758544921875, -2.650238037109375, -2.54193115234375, -2.433624267578125, -2.3253173828125, -2.217010498046875, -2.10870361328125, -2.000396728515625, -1.89208984375, -1.783782958984375, -1.67547607421875, -1.567169189453125, -1.4588623046875, -1.350555419921875, -1.24224853515625, -1.133941650390625, -1.025634765625, -0.917327880859375, -0.80902099609375, -0.700714111328125, -0.5924072265625, -0.484100341796875, -0.37579345703125, -0.267486572265625, -0.1591796875, -0.050872802734375, 0.05743408203125, 0.165740966796875, 0.2740478515625, 0.382354736328125, 0.49066162109375, 0.598968505859375, 0.707275390625, 0.815582275390625, 0.92388916015625, 1.032196044921875, 1.1405029296875, 1.248809814453125, 1.35711669921875, 1.465423583984375, 1.57373046875, 1.682037353515625, 1.79034423828125, 1.898651123046875, 2.0069580078125, 2.115264892578125, 2.22357177734375, 2.331878662109375, 2.440185546875, 2.548492431640625, 2.65679931640625, 2.765106201171875, 2.8734130859375, 2.981719970703125, 3.09002685546875, 3.198333740234375, 3.306640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 7.0, 14.0, 10.0, 20.0, 22.0, 21.0, 32.0, 41.0, 60.0, 92.0, 154.0, 268.0, 424.0, 850.0, 1761.0, 3741.0, 9865.0, 32905.0, 204838.0, 2303098.0, 507858.0, 55198.0, 14339.0, 5381.0, 2254.0, 1052.0, 541.0, 297.0, 158.0, 99.0, 73.0, 48.0, 42.0, 26.0, 20.0, 19.0, 12.0, 17.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.892578125, -3.765655517578125, -3.63873291015625, -3.511810302734375, -3.3848876953125, -3.257965087890625, -3.13104248046875, -3.004119873046875, -2.877197265625, -2.750274658203125, -2.62335205078125, -2.496429443359375, -2.3695068359375, -2.242584228515625, -2.11566162109375, -1.988739013671875, -1.86181640625, -1.734893798828125, -1.60797119140625, -1.481048583984375, -1.3541259765625, -1.227203369140625, -1.10028076171875, -0.973358154296875, -0.846435546875, -0.719512939453125, -0.59259033203125, -0.465667724609375, -0.3387451171875, -0.211822509765625, -0.08489990234375, 0.042022705078125, 0.1689453125, 0.295867919921875, 0.42279052734375, 0.549713134765625, 0.6766357421875, 0.803558349609375, 0.93048095703125, 1.057403564453125, 1.184326171875, 1.311248779296875, 1.43817138671875, 1.565093994140625, 1.6920166015625, 1.818939208984375, 1.94586181640625, 2.072784423828125, 2.19970703125, 2.326629638671875, 2.45355224609375, 2.580474853515625, 2.7073974609375, 2.834320068359375, 2.96124267578125, 3.088165283203125, 3.215087890625, 3.342010498046875, 3.46893310546875, 3.595855712890625, 3.7227783203125, 3.849700927734375, 3.97662353515625, 4.103546142578125, 4.23046875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 82.0, 669.0, 249.0, 10.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.73983001708984, -111.76908874511719, -109.79834747314453, -107.82760620117188, -105.85686492919922, -103.88612365722656, -101.9153823852539, -99.94464111328125, -97.9738998413086, -96.00315856933594, -94.03241729736328, -92.06167602539062, -90.09093475341797, -88.12019348144531, -86.14945220947266, -84.1787109375, -82.20796966552734, -80.23722839355469, -78.26648712158203, -76.29574584960938, -74.32500457763672, -72.35426330566406, -70.3835220336914, -68.41278076171875, -66.4420394897461, -64.47129821777344, -62.50055694580078, -60.529815673828125, -58.55907440185547, -56.58833312988281, -54.617591857910156, -52.6468505859375, -50.67610549926758, -48.70536422729492, -46.734622955322266, -44.76388168334961, -42.79314041137695, -40.8223991394043, -38.85165786743164, -36.880916595458984, -34.91017532348633, -32.93943405151367, -30.968692779541016, -28.99795150756836, -27.027210235595703, -25.056468963623047, -23.08572769165039, -21.114986419677734, -19.144245147705078, -17.173503875732422, -15.202762603759766, -13.23202133178711, -11.261280059814453, -9.290538787841797, -7.319797515869141, -5.349056243896484, -3.3783159255981445, -1.4075746536254883, 0.563166618347168, 2.533907890319824, 4.5046491622924805, 6.475390434265137, 8.446131706237793, 10.41687297821045, 12.387614250183105]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 9.0, 6.0, 9.0, 4.0, 12.0, 21.0, 9.0, 20.0, 20.0, 26.0, 32.0, 24.0, 39.0, 33.0, 39.0, 43.0, 35.0, 36.0, 44.0, 33.0, 44.0, 44.0, 38.0, 37.0, 32.0, 32.0, 42.0, 30.0, 36.0, 24.0, 28.0, 21.0, 24.0, 8.0, 12.0, 11.0, 9.0, 6.0, 5.0, 10.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.440852165222168, -12.071533203125, -11.702214241027832, -11.332895278930664, -10.963577270507812, -10.594258308410645, -10.224939346313477, -9.855620384216309, -9.48630142211914, -9.116982460021973, -8.747663497924805, -8.378344535827637, -8.009025573730469, -7.639707088470459, -7.270388603210449, -6.901069641113281, -6.531750679016113, -6.162431716918945, -5.793112754821777, -5.423794269561768, -5.0544753074646, -4.685156345367432, -4.315837860107422, -3.946518898010254, -3.577199935913086, -3.207880973815918, -2.838562250137329, -2.4692435264587402, -2.0999245643615723, -1.7306057214736938, -1.3612868785858154, -0.9919681549072266, -0.6226482391357422, -0.25332939624786377, 0.11598944664001465, 0.48530828952789307, 0.8546271324157715, 1.22394597530365, 1.5932648181915283, 1.9625835418701172, 2.331902503967285, 2.701221466064453, 3.070540189743042, 3.439858913421631, 3.809177875518799, 4.178496837615967, 4.547815322875977, 4.9171342849731445, 5.2864532470703125, 5.6557722091674805, 6.025091171264648, 6.394409656524658, 6.763728618621826, 7.133047580718994, 7.502366065979004, 7.871685028076172, 8.24100399017334, 8.610322952270508, 8.979641914367676, 9.348960876464844, 9.718278884887695, 10.087597846984863, 10.456916809082031, 10.8262357711792, 11.195554733276367]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 11.0, 15.0, 19.0, 25.0, 27.0, 21.0, 38.0, 29.0, 30.0, 33.0, 40.0, 38.0, 45.0, 43.0, 44.0, 47.0, 46.0, 41.0, 44.0, 51.0, 41.0, 32.0, 33.0, 30.0, 15.0, 17.0, 12.0, 14.0, 21.0, 9.0, 9.0, 9.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0078125, -0.97503662109375, -0.9422607421875, -0.90948486328125, -0.876708984375, -0.84393310546875, -0.8111572265625, -0.77838134765625, -0.74560546875, -0.71282958984375, -0.6800537109375, -0.64727783203125, -0.614501953125, -0.58172607421875, -0.5489501953125, -0.51617431640625, -0.4833984375, -0.45062255859375, -0.4178466796875, -0.38507080078125, -0.352294921875, -0.31951904296875, -0.2867431640625, -0.25396728515625, -0.22119140625, -0.18841552734375, -0.1556396484375, -0.12286376953125, -0.090087890625, -0.05731201171875, -0.0245361328125, 0.00823974609375, 0.041015625, 0.07379150390625, 0.1065673828125, 0.13934326171875, 0.172119140625, 0.20489501953125, 0.2376708984375, 0.27044677734375, 0.30322265625, 0.33599853515625, 0.3687744140625, 0.40155029296875, 0.434326171875, 0.46710205078125, 0.4998779296875, 0.53265380859375, 0.5654296875, 0.59820556640625, 0.6309814453125, 0.66375732421875, 0.696533203125, 0.72930908203125, 0.7620849609375, 0.79486083984375, 0.82763671875, 0.86041259765625, 0.8931884765625, 0.92596435546875, 0.958740234375, 0.99151611328125, 1.0242919921875, 1.05706787109375, 1.08984375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 13.0, 16.0, 29.0, 48.0, 52.0, 91.0, 107.0, 147.0, 193.0, 313.0, 457.0, 688.0, 1040.0, 1656.0, 2636.0, 4007.0, 7034.0, 12270.0, 23191.0, 50251.0, 150293.0, 769396.0, 2213201.0, 726171.0, 134561.0, 46485.0, 21691.0, 11340.0, 6365.0, 3867.0, 2316.0, 1469.0, 975.0, 625.0, 406.0, 279.0, 195.0, 131.0, 83.0, 62.0, 45.0, 31.0, 19.0, 13.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7407379150390625, -1.681671142578125, -1.6226043701171875, -1.56353759765625, -1.5044708251953125, -1.445404052734375, -1.3863372802734375, -1.3272705078125, -1.2682037353515625, -1.209136962890625, -1.1500701904296875, -1.09100341796875, -1.0319366455078125, -0.972869873046875, -0.9138031005859375, -0.854736328125, -0.7956695556640625, -0.736602783203125, -0.6775360107421875, -0.61846923828125, -0.5594024658203125, -0.500335693359375, -0.4412689208984375, -0.3822021484375, -0.3231353759765625, -0.264068603515625, -0.2050018310546875, -0.14593505859375, -0.0868682861328125, -0.027801513671875, 0.0312652587890625, 0.09033203125, 0.1493988037109375, 0.208465576171875, 0.2675323486328125, 0.32659912109375, 0.3856658935546875, 0.444732666015625, 0.5037994384765625, 0.5628662109375, 0.6219329833984375, 0.680999755859375, 0.7400665283203125, 0.79913330078125, 0.8582000732421875, 0.917266845703125, 0.9763336181640625, 1.035400390625, 1.0944671630859375, 1.153533935546875, 1.2126007080078125, 1.27166748046875, 1.3307342529296875, 1.389801025390625, 1.4488677978515625, 1.5079345703125, 1.5670013427734375, 1.626068115234375, 1.6851348876953125, 1.74420166015625, 1.8032684326171875, 1.862335205078125, 1.9214019775390625, 1.98046875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 19.0, 12.0, 22.0, 30.0, 41.0, 58.0, 94.0, 136.0, 224.0, 360.0, 523.0, 732.0, 598.0, 412.0, 263.0, 171.0, 111.0, 68.0, 64.0, 35.0, 26.0, 18.0, 12.0, 4.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.2109375, -4.104766845703125, -3.99859619140625, -3.892425537109375, -3.7862548828125, -3.680084228515625, -3.57391357421875, -3.467742919921875, -3.361572265625, -3.255401611328125, -3.14923095703125, -3.043060302734375, -2.9368896484375, -2.830718994140625, -2.72454833984375, -2.618377685546875, -2.51220703125, -2.406036376953125, -2.29986572265625, -2.193695068359375, -2.0875244140625, -1.981353759765625, -1.87518310546875, -1.769012451171875, -1.662841796875, -1.556671142578125, -1.45050048828125, -1.344329833984375, -1.2381591796875, -1.131988525390625, -1.02581787109375, -0.919647216796875, -0.8134765625, -0.707305908203125, -0.60113525390625, -0.494964599609375, -0.3887939453125, -0.282623291015625, -0.17645263671875, -0.070281982421875, 0.035888671875, 0.142059326171875, 0.24822998046875, 0.354400634765625, 0.4605712890625, 0.566741943359375, 0.67291259765625, 0.779083251953125, 0.88525390625, 0.991424560546875, 1.09759521484375, 1.203765869140625, 1.3099365234375, 1.416107177734375, 1.52227783203125, 1.628448486328125, 1.734619140625, 1.840789794921875, 1.94696044921875, 2.053131103515625, 2.1593017578125, 2.265472412109375, 2.37164306640625, 2.477813720703125, 2.583984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 7.0, 16.0, 22.0, 18.0, 35.0, 50.0, 61.0, 100.0, 191.0, 334.0, 591.0, 1238.0, 2586.0, 6091.0, 15722.0, 48124.0, 209905.0, 2057751.0, 1609329.0, 175012.0, 42706.0, 14157.0, 5472.0, 2316.0, 1071.0, 573.0, 275.0, 152.0, 128.0, 81.0, 50.0, 32.0, 22.0, 13.0, 10.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.76129150390625, -3.6163330078125, -3.47137451171875, -3.326416015625, -3.18145751953125, -3.0364990234375, -2.89154052734375, -2.74658203125, -2.60162353515625, -2.4566650390625, -2.31170654296875, -2.166748046875, -2.02178955078125, -1.8768310546875, -1.73187255859375, -1.5869140625, -1.44195556640625, -1.2969970703125, -1.15203857421875, -1.007080078125, -0.86212158203125, -0.7171630859375, -0.57220458984375, -0.42724609375, -0.28228759765625, -0.1373291015625, 0.00762939453125, 0.152587890625, 0.29754638671875, 0.4425048828125, 0.58746337890625, 0.732421875, 0.87738037109375, 1.0223388671875, 1.16729736328125, 1.312255859375, 1.45721435546875, 1.6021728515625, 1.74713134765625, 1.89208984375, 2.03704833984375, 2.1820068359375, 2.32696533203125, 2.471923828125, 2.61688232421875, 2.7618408203125, 2.90679931640625, 3.0517578125, 3.19671630859375, 3.3416748046875, 3.48663330078125, 3.631591796875, 3.77655029296875, 3.9215087890625, 4.06646728515625, 4.21142578125, 4.35638427734375, 4.5013427734375, 4.64630126953125, 4.791259765625, 4.93621826171875, 5.0811767578125, 5.22613525390625, 5.37109375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 20.0, 54.0, 119.0, 223.0, 229.0, 194.0, 94.0, 45.0, 12.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.313840866088867, -15.250967979431152, -14.188094139099121, -13.125221252441406, -12.062347412109375, -10.99947452545166, -9.936601638793945, -8.873727798461914, -7.810854911804199, -6.747981548309326, -5.685108184814453, -4.622235298156738, -3.5593619346618652, -2.496488571166992, -1.4336156845092773, -0.3707423210144043, 0.6921310424804688, 1.7550042867660522, 2.8178775310516357, 3.8807506561279297, 4.943624019622803, 6.006497383117676, 7.069370269775391, 8.132244110107422, 9.195116996765137, 10.257989883422852, 11.320863723754883, 12.383736610412598, 13.446609497070312, 14.509483337402344, 15.572356224060059, 16.635229110717773, 17.698101043701172, 18.760974884033203, 19.8238468170166, 20.886720657348633, 21.949594497680664, 23.012466430664062, 24.075340270996094, 25.138214111328125, 26.201087951660156, 27.263961791992188, 28.326833724975586, 29.389707565307617, 30.45258140563965, 31.515453338623047, 32.57832717895508, 33.64120101928711, 34.704071044921875, 35.766944885253906, 36.82981872558594, 37.89269256591797, 38.955562591552734, 40.018436431884766, 41.0813102722168, 42.14418411254883, 43.20705795288086, 44.26993179321289, 45.33280563354492, 46.39567565917969, 47.45854949951172, 48.52142333984375, 49.58429718017578, 50.64717102050781, 51.710044860839844]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 4.0, 4.0, 13.0, 15.0, 9.0, 13.0, 12.0, 13.0, 16.0, 17.0, 21.0, 28.0, 37.0, 48.0, 34.0, 39.0, 31.0, 22.0, 42.0, 53.0, 32.0, 32.0, 36.0, 30.0, 37.0, 41.0, 29.0, 25.0, 32.0, 27.0, 24.0, 18.0, 24.0, 18.0, 24.0, 18.0, 13.0, 8.0, 10.0, 10.0, 9.0, 2.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.24605941772461, -7.991235733032227, -7.7364115715026855, -7.4815874099731445, -7.226763725280762, -6.971940040588379, -6.717115879058838, -6.462291717529297, -6.207468032836914, -5.952644348144531, -5.69782018661499, -5.442996025085449, -5.188172340393066, -4.933348655700684, -4.678524494171143, -4.423700332641602, -4.168876647949219, -3.914052724838257, -3.659228801727295, -3.404404878616333, -3.149580955505371, -2.894757032394409, -2.6399331092834473, -2.3851091861724854, -2.1302852630615234, -1.8754613399505615, -1.6206374168395996, -1.3658134937286377, -1.1109895706176758, -0.8561656475067139, -0.601341724395752, -0.34651780128479004, -0.09169387817382812, 0.1631300449371338, 0.4179539680480957, 0.6727778911590576, 0.9276018142700195, 1.1824257373809814, 1.4372496604919434, 1.6920735836029053, 1.9468975067138672, 2.201721429824829, 2.456545352935791, 2.711369276046753, 2.966193199157715, 3.2210171222686768, 3.4758410453796387, 3.7306649684906006, 3.9854888916015625, 4.240312576293945, 4.495136737823486, 4.749960899353027, 5.00478458404541, 5.259608268737793, 5.514432430267334, 5.769256591796875, 6.024080276489258, 6.278903961181641, 6.533728122711182, 6.788552284240723, 7.0433759689331055, 7.298199653625488, 7.553023815155029, 7.80784797668457, 8.062671661376953]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 14.0, 9.0, 14.0, 21.0, 27.0, 17.0, 25.0, 30.0, 34.0, 22.0, 44.0, 39.0, 52.0, 36.0, 43.0, 48.0, 46.0, 49.0, 50.0, 40.0, 43.0, 39.0, 35.0, 36.0, 28.0, 17.0, 22.0, 25.0, 11.0, 12.0, 14.0, 8.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0673828125, -1.0327911376953125, -0.998199462890625, -0.9636077880859375, -0.92901611328125, -0.8944244384765625, -0.859832763671875, -0.8252410888671875, -0.7906494140625, -0.7560577392578125, -0.721466064453125, -0.6868743896484375, -0.65228271484375, -0.6176910400390625, -0.583099365234375, -0.5485076904296875, -0.513916015625, -0.4793243408203125, -0.444732666015625, -0.4101409912109375, -0.37554931640625, -0.3409576416015625, -0.306365966796875, -0.2717742919921875, -0.2371826171875, -0.2025909423828125, -0.167999267578125, -0.1334075927734375, -0.09881591796875, -0.0642242431640625, -0.029632568359375, 0.0049591064453125, 0.03955078125, 0.0741424560546875, 0.108734130859375, 0.1433258056640625, 0.17791748046875, 0.2125091552734375, 0.247100830078125, 0.2816925048828125, 0.3162841796875, 0.3508758544921875, 0.385467529296875, 0.4200592041015625, 0.45465087890625, 0.4892425537109375, 0.523834228515625, 0.5584259033203125, 0.593017578125, 0.6276092529296875, 0.662200927734375, 0.6967926025390625, 0.73138427734375, 0.7659759521484375, 0.800567626953125, 0.8351593017578125, 0.8697509765625, 0.9043426513671875, 0.938934326171875, 0.9735260009765625, 1.00811767578125, 1.0427093505859375, 1.077301025390625, 1.1118927001953125, 1.146484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 10.0, 10.0, 19.0, 30.0, 52.0, 67.0, 84.0, 153.0, 217.0, 342.0, 521.0, 806.0, 1256.0, 2036.0, 2970.0, 4833.0, 7401.0, 11749.0, 18184.0, 27838.0, 42350.0, 62038.0, 87171.0, 113428.0, 131661.0, 133223.0, 116542.0, 90171.0, 65845.0, 44564.0, 29276.0, 19355.0, 12174.0, 7930.0, 5130.0, 3251.0, 2056.0, 1373.0, 869.0, 530.0, 364.0, 231.0, 130.0, 87.0, 77.0, 51.0, 30.0, 25.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-0.72705078125, -0.704376220703125, -0.68170166015625, -0.659027099609375, -0.6363525390625, -0.613677978515625, -0.59100341796875, -0.568328857421875, -0.545654296875, -0.522979736328125, -0.50030517578125, -0.477630615234375, -0.4549560546875, -0.432281494140625, -0.40960693359375, -0.386932373046875, -0.3642578125, -0.341583251953125, -0.31890869140625, -0.296234130859375, -0.2735595703125, -0.250885009765625, -0.22821044921875, -0.205535888671875, -0.182861328125, -0.160186767578125, -0.13751220703125, -0.114837646484375, -0.0921630859375, -0.069488525390625, -0.04681396484375, -0.024139404296875, -0.00146484375, 0.021209716796875, 0.04388427734375, 0.066558837890625, 0.0892333984375, 0.111907958984375, 0.13458251953125, 0.157257080078125, 0.179931640625, 0.202606201171875, 0.22528076171875, 0.247955322265625, 0.2706298828125, 0.293304443359375, 0.31597900390625, 0.338653564453125, 0.361328125, 0.384002685546875, 0.40667724609375, 0.429351806640625, 0.4520263671875, 0.474700927734375, 0.49737548828125, 0.520050048828125, 0.542724609375, 0.565399169921875, 0.58807373046875, 0.610748291015625, 0.6334228515625, 0.656097412109375, 0.67877197265625, 0.701446533203125, 0.72412109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 16.0, 10.0, 20.0, 13.0, 16.0, 22.0, 19.0, 45.0, 29.0, 33.0, 34.0, 38.0, 43.0, 37.0, 43.0, 47.0, 1077.0, 50.0, 36.0, 36.0, 53.0, 43.0, 33.0, 34.0, 20.0, 26.0, 25.0, 11.0, 17.0, 14.0, 19.0, 4.0, 12.0, 13.0, 5.0, 3.0, 1.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8901596069335938, -0.8569793701171875, -0.8237991333007812, -0.790618896484375, -0.7574386596679688, -0.7242584228515625, -0.6910781860351562, -0.65789794921875, -0.6247177124023438, -0.5915374755859375, -0.5583572387695312, -0.525177001953125, -0.49199676513671875, -0.4588165283203125, -0.42563629150390625, -0.3924560546875, -0.35927581787109375, -0.3260955810546875, -0.29291534423828125, -0.259735107421875, -0.22655487060546875, -0.1933746337890625, -0.16019439697265625, -0.12701416015625, -0.09383392333984375, -0.0606536865234375, -0.02747344970703125, 0.005706787109375, 0.03888702392578125, 0.0720672607421875, 0.10524749755859375, 0.138427734375, 0.17160797119140625, 0.2047882080078125, 0.23796844482421875, 0.271148681640625, 0.30432891845703125, 0.3375091552734375, 0.37068939208984375, 0.40386962890625, 0.43704986572265625, 0.4702301025390625, 0.5034103393554688, 0.536590576171875, 0.5697708129882812, 0.6029510498046875, 0.6361312866210938, 0.6693115234375, 0.7024917602539062, 0.7356719970703125, 0.7688522338867188, 0.802032470703125, 0.8352127075195312, 0.8683929443359375, 0.9015731811523438, 0.93475341796875, 0.9679336547851562, 1.0011138916015625, 1.0342941284179688, 1.067474365234375, 1.1006546020507812, 1.1338348388671875, 1.1670150756835938, 1.2001953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 16.0, 16.0, 25.0, 34.0, 59.0, 73.0, 103.0, 152.0, 222.0, 305.0, 426.0, 583.0, 841.0, 1228.0, 1766.0, 2641.0, 3779.0, 5594.0, 7973.0, 12322.0, 19533.0, 39667.0, 183794.0, 1562573.0, 160041.0, 37547.0, 18832.0, 11784.0, 7902.0, 5336.0, 3701.0, 2609.0, 1692.0, 1172.0, 840.0, 565.0, 381.0, 289.0, 194.0, 133.0, 103.0, 86.0, 52.0, 28.0, 33.0, 17.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.9970703125, -0.9672775268554688, -0.9374847412109375, -0.9076919555664062, -0.877899169921875, -0.8481063842773438, -0.8183135986328125, -0.7885208129882812, -0.75872802734375, -0.7289352416992188, -0.6991424560546875, -0.6693496704101562, -0.639556884765625, -0.6097640991210938, -0.5799713134765625, -0.5501785278320312, -0.5203857421875, -0.49059295654296875, -0.4608001708984375, -0.43100738525390625, -0.401214599609375, -0.37142181396484375, -0.3416290283203125, -0.31183624267578125, -0.28204345703125, -0.25225067138671875, -0.2224578857421875, -0.19266510009765625, -0.162872314453125, -0.13307952880859375, -0.1032867431640625, -0.07349395751953125, -0.043701171875, -0.01390838623046875, 0.0158843994140625, 0.04567718505859375, 0.075469970703125, 0.10526275634765625, 0.1350555419921875, 0.16484832763671875, 0.19464111328125, 0.22443389892578125, 0.2542266845703125, 0.28401947021484375, 0.313812255859375, 0.34360504150390625, 0.3733978271484375, 0.40319061279296875, 0.4329833984375, 0.46277618408203125, 0.4925689697265625, 0.5223617553710938, 0.552154541015625, 0.5819473266601562, 0.6117401123046875, 0.6415328979492188, 0.67132568359375, 0.7011184692382812, 0.7309112548828125, 0.7607040405273438, 0.790496826171875, 0.8202896118164062, 0.8500823974609375, 0.8798751831054688, 0.90966796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 3.0, 5.0, 7.0, 7.0, 4.0, 7.0, 15.0, 16.0, 18.0, 26.0, 24.0, 25.0, 35.0, 33.0, 35.0, 51.0, 42.0, 64.0, 55.0, 48.0, 44.0, 58.0, 43.0, 42.0, 40.0, 39.0, 37.0, 32.0, 31.0, 22.0, 17.0, 16.0, 8.0, 6.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.056060791015625, -0.0539708137512207, -0.051880836486816406, -0.04979085922241211, -0.04770088195800781, -0.045610904693603516, -0.04352092742919922, -0.04143095016479492, -0.039340972900390625, -0.03725099563598633, -0.03516101837158203, -0.033071041107177734, -0.030981063842773438, -0.02889108657836914, -0.026801109313964844, -0.024711132049560547, -0.02262115478515625, -0.020531177520751953, -0.018441200256347656, -0.01635122299194336, -0.014261245727539062, -0.012171268463134766, -0.010081291198730469, -0.007991313934326172, -0.005901336669921875, -0.003811359405517578, -0.0017213821411132812, 0.0003685951232910156, 0.0024585723876953125, 0.004548549652099609, 0.006638526916503906, 0.008728504180908203, 0.0108184814453125, 0.012908458709716797, 0.014998435974121094, 0.01708841323852539, 0.019178390502929688, 0.021268367767333984, 0.02335834503173828, 0.025448322296142578, 0.027538299560546875, 0.029628276824951172, 0.03171825408935547, 0.033808231353759766, 0.03589820861816406, 0.03798818588256836, 0.040078163146972656, 0.04216814041137695, 0.04425811767578125, 0.04634809494018555, 0.048438072204589844, 0.05052804946899414, 0.05261802673339844, 0.054708003997802734, 0.05679798126220703, 0.05888795852661133, 0.060977935791015625, 0.06306791305541992, 0.06515789031982422, 0.06724786758422852, 0.06933784484863281, 0.07142782211303711, 0.0735177993774414, 0.0756077766418457, 0.07769775390625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 5.0, 5.0, 10.0, 18.0, 27.0, 31.0, 32.0, 58.0, 90.0, 101.0, 137.0, 232.0, 456.0, 1691.0, 21549.0, 682703.0, 328091.0, 11005.0, 1172.0, 410.0, 228.0, 144.0, 102.0, 81.0, 39.0, 27.0, 23.0, 12.0, 18.0, 11.0, 7.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3215713500976562, -1.2847442626953125, -1.2479171752929688, -1.211090087890625, -1.1742630004882812, -1.1374359130859375, -1.1006088256835938, -1.06378173828125, -1.0269546508789062, -0.9901275634765625, -0.9533004760742188, -0.916473388671875, -0.8796463012695312, -0.8428192138671875, -0.8059921264648438, -0.7691650390625, -0.7323379516601562, -0.6955108642578125, -0.6586837768554688, -0.621856689453125, -0.5850296020507812, -0.5482025146484375, -0.5113754272460938, -0.47454833984375, -0.43772125244140625, -0.4008941650390625, -0.36406707763671875, -0.327239990234375, -0.29041290283203125, -0.2535858154296875, -0.21675872802734375, -0.179931640625, -0.14310455322265625, -0.1062774658203125, -0.06945037841796875, -0.032623291015625, 0.00420379638671875, 0.0410308837890625, 0.07785797119140625, 0.11468505859375, 0.15151214599609375, 0.1883392333984375, 0.22516632080078125, 0.261993408203125, 0.29882049560546875, 0.3356475830078125, 0.37247467041015625, 0.4093017578125, 0.44612884521484375, 0.4829559326171875, 0.5197830200195312, 0.556610107421875, 0.5934371948242188, 0.6302642822265625, 0.6670913696289062, 0.70391845703125, 0.7407455444335938, 0.7775726318359375, 0.8143997192382812, 0.851226806640625, 0.8880538940429688, 0.9248809814453125, 0.9617080688476562, 0.99853515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 23.0, 76.0, 229.0, 395.0, 187.0, 63.0, 23.0, 10.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3318135738372803, -2.2814669609069824, -2.2311201095581055, -2.1807734966278076, -2.1304268836975098, -2.080080032348633, -2.029733419418335, -1.979386806488037, -1.9290400743484497, -1.8786933422088623, -1.8283467292785645, -1.777999997138977, -1.7276533842086792, -1.6773066520690918, -1.626960039138794, -1.5766133069992065, -1.5262665748596191, -1.4759198427200317, -1.4255732297897339, -1.3752264976501465, -1.3248798847198486, -1.2745331525802612, -1.2241864204406738, -1.173839807510376, -1.1234931945800781, -1.0731464624404907, -1.0227998495101929, -0.9724531173706055, -0.9221064448356628, -0.8717597723007202, -0.8214130997657776, -0.771066427230835, -0.7207196354866028, -0.6703729629516602, -0.6200262904167175, -0.5696796178817749, -0.5193328857421875, -0.4689862132072449, -0.41863954067230225, -0.36829283833503723, -0.3179461658000946, -0.267599493265152, -0.21725279092788696, -0.16690611839294434, -0.11655943095684052, -0.0662127435207367, -0.015866070985794067, 0.03448063135147095, 0.08482730388641357, 0.1351739913225174, 0.18552067875862122, 0.23586735129356384, 0.28621405363082886, 0.3365607261657715, 0.3869073987007141, 0.4372541010379791, 0.48760077357292175, 0.5379474759101868, 0.5882941484451294, 0.638640820980072, 0.6889874935150146, 0.739334225654602, 0.7896808385848999, 0.8400275707244873, 0.8903742432594299]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 19.0, 11.0, 23.0, 27.0, 30.0, 28.0, 31.0, 35.0, 34.0, 43.0, 56.0, 52.0, 44.0, 50.0, 52.0, 55.0, 38.0, 48.0, 46.0, 37.0, 42.0, 35.0, 20.0, 18.0, 21.0, 15.0, 18.0, 9.0, 15.0, 4.0, 6.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.33830541372299194, -0.32950419187545776, -0.3207029700279236, -0.3119017481803894, -0.3031005263328552, -0.29429927468299866, -0.2854980528354645, -0.2766968309879303, -0.2678956091403961, -0.25909438729286194, -0.25029316544532776, -0.24149192869663239, -0.2326907068490982, -0.22388948500156403, -0.21508824825286865, -0.20628702640533447, -0.1974858045578003, -0.1886845827102661, -0.17988336086273193, -0.17108212411403656, -0.16228090226650238, -0.1534796804189682, -0.14467844367027283, -0.13587722182273865, -0.12707599997520447, -0.11827477812767029, -0.10947354882955551, -0.10067231953144073, -0.09187109768390656, -0.08306987583637238, -0.0742686465382576, -0.06546741724014282, -0.05666619539260864, -0.047864969819784164, -0.039063744246959686, -0.030262518674135208, -0.02146129310131073, -0.012660067528486252, -0.0038588419556617737, 0.0049423836171627045, 0.013743609189987183, 0.02254483476281166, 0.03134606033563614, 0.04014728590846062, 0.048948511481285095, 0.05774973705410957, 0.06655096262693405, 0.07535219192504883, 0.08415341377258301, 0.09295463562011719, 0.10175586491823196, 0.11055709421634674, 0.11935831606388092, 0.1281595379114151, 0.13696077466011047, 0.14576199650764465, 0.15456321835517883, 0.163364440202713, 0.1721656620502472, 0.18096689879894257, 0.18976812064647675, 0.19856934249401093, 0.2073705792427063, 0.21617180109024048, 0.22497302293777466]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 12.0, 13.0, 15.0, 20.0, 21.0, 24.0, 19.0, 33.0, 31.0, 29.0, 35.0, 38.0, 51.0, 56.0, 44.0, 60.0, 59.0, 55.0, 42.0, 44.0, 53.0, 33.0, 40.0, 34.0, 26.0, 21.0, 17.0, 13.0, 13.0, 8.0, 6.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1611328125, -1.123046875, -1.0849609375, -1.046875, -1.0087890625, -0.970703125, -0.9326171875, -0.89453125, -0.8564453125, -0.818359375, -0.7802734375, -0.7421875, -0.7041015625, -0.666015625, -0.6279296875, -0.58984375, -0.5517578125, -0.513671875, -0.4755859375, -0.4375, -0.3994140625, -0.361328125, -0.3232421875, -0.28515625, -0.2470703125, -0.208984375, -0.1708984375, -0.1328125, -0.0947265625, -0.056640625, -0.0185546875, 0.01953125, 0.0576171875, 0.095703125, 0.1337890625, 0.171875, 0.2099609375, 0.248046875, 0.2861328125, 0.32421875, 0.3623046875, 0.400390625, 0.4384765625, 0.4765625, 0.5146484375, 0.552734375, 0.5908203125, 0.62890625, 0.6669921875, 0.705078125, 0.7431640625, 0.78125, 0.8193359375, 0.857421875, 0.8955078125, 0.93359375, 0.9716796875, 1.009765625, 1.0478515625, 1.0859375, 1.1240234375, 1.162109375, 1.2001953125, 1.23828125, 1.2763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 7.0, 15.0, 11.0, 23.0, 36.0, 75.0, 81.0, 149.0, 257.0, 336.0, 533.0, 789.0, 1270.0, 2063.0, 3438.0, 6665.0, 13764.0, 38434.0, 145924.0, 544052.0, 206631.0, 49187.0, 17127.0, 7436.0, 4011.0, 2255.0, 1431.0, 910.0, 557.0, 371.0, 240.0, 199.0, 98.0, 72.0, 37.0, 35.0, 13.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9381103515625, -1.870361328125, -1.8026123046875, -1.73486328125, -1.6671142578125, -1.599365234375, -1.5316162109375, -1.4638671875, -1.3961181640625, -1.328369140625, -1.2606201171875, -1.19287109375, -1.1251220703125, -1.057373046875, -0.9896240234375, -0.921875, -0.8541259765625, -0.786376953125, -0.7186279296875, -0.65087890625, -0.5831298828125, -0.515380859375, -0.4476318359375, -0.3798828125, -0.3121337890625, -0.244384765625, -0.1766357421875, -0.10888671875, -0.0411376953125, 0.026611328125, 0.0943603515625, 0.162109375, 0.2298583984375, 0.297607421875, 0.3653564453125, 0.43310546875, 0.5008544921875, 0.568603515625, 0.6363525390625, 0.7041015625, 0.7718505859375, 0.839599609375, 0.9073486328125, 0.97509765625, 1.0428466796875, 1.110595703125, 1.1783447265625, 1.24609375, 1.3138427734375, 1.381591796875, 1.4493408203125, 1.51708984375, 1.5848388671875, 1.652587890625, 1.7203369140625, 1.7880859375, 1.8558349609375, 1.923583984375, 1.9913330078125, 2.05908203125, 2.1268310546875, 2.194580078125, 2.2623291015625, 2.330078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 14.0, 11.0, 20.0, 17.0, 18.0, 27.0, 31.0, 35.0, 31.0, 34.0, 46.0, 61.0, 85.0, 110.0, 228.0, 1395.0, 254.0, 138.0, 82.0, 63.0, 45.0, 61.0, 36.0, 29.0, 21.0, 28.0, 20.0, 11.0, 5.0, 8.0, 11.0, 8.0, 7.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.968414306640625, -3.84307861328125, -3.717742919921875, -3.5924072265625, -3.467071533203125, -3.34173583984375, -3.216400146484375, -3.091064453125, -2.965728759765625, -2.84039306640625, -2.715057373046875, -2.5897216796875, -2.464385986328125, -2.33905029296875, -2.213714599609375, -2.08837890625, -1.963043212890625, -1.83770751953125, -1.712371826171875, -1.5870361328125, -1.461700439453125, -1.33636474609375, -1.211029052734375, -1.085693359375, -0.960357666015625, -0.83502197265625, -0.709686279296875, -0.5843505859375, -0.459014892578125, -0.33367919921875, -0.208343505859375, -0.0830078125, 0.042327880859375, 0.16766357421875, 0.292999267578125, 0.4183349609375, 0.543670654296875, 0.66900634765625, 0.794342041015625, 0.919677734375, 1.045013427734375, 1.17034912109375, 1.295684814453125, 1.4210205078125, 1.546356201171875, 1.67169189453125, 1.797027587890625, 1.92236328125, 2.047698974609375, 2.17303466796875, 2.298370361328125, 2.4237060546875, 2.549041748046875, 2.67437744140625, 2.799713134765625, 2.925048828125, 3.050384521484375, 3.17572021484375, 3.301055908203125, 3.4263916015625, 3.551727294921875, 3.67706298828125, 3.802398681640625, 3.927734375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 3.0, 6.0, 18.0, 17.0, 29.0, 33.0, 41.0, 62.0, 116.0, 182.0, 315.0, 726.0, 2074.0, 8892.0, 76820.0, 2675627.0, 354657.0, 20077.0, 3756.0, 1084.0, 443.0, 262.0, 145.0, 81.0, 56.0, 40.0, 40.0, 24.0, 15.0, 12.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.02734375, -6.8057861328125, -6.584228515625, -6.3626708984375, -6.14111328125, -5.9195556640625, -5.697998046875, -5.4764404296875, -5.2548828125, -5.0333251953125, -4.811767578125, -4.5902099609375, -4.36865234375, -4.1470947265625, -3.925537109375, -3.7039794921875, -3.482421875, -3.2608642578125, -3.039306640625, -2.8177490234375, -2.59619140625, -2.3746337890625, -2.153076171875, -1.9315185546875, -1.7099609375, -1.4884033203125, -1.266845703125, -1.0452880859375, -0.82373046875, -0.6021728515625, -0.380615234375, -0.1590576171875, 0.0625, 0.2840576171875, 0.505615234375, 0.7271728515625, 0.94873046875, 1.1702880859375, 1.391845703125, 1.6134033203125, 1.8349609375, 2.0565185546875, 2.278076171875, 2.4996337890625, 2.72119140625, 2.9427490234375, 3.164306640625, 3.3858642578125, 3.607421875, 3.8289794921875, 4.050537109375, 4.2720947265625, 4.49365234375, 4.7152099609375, 4.936767578125, 5.1583251953125, 5.3798828125, 5.6014404296875, 5.822998046875, 6.0445556640625, 6.26611328125, 6.4876708984375, 6.709228515625, 6.9307861328125, 7.15234375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 57.0, 938.0, 23.0, 1.0], "bins": [-221.81622314453125, -218.2049560546875, -214.5937042236328, -210.98243713378906, -207.37118530273438, -203.75991821289062, -200.14865112304688, -196.5373992919922, -192.92613220214844, -189.3148651123047, -185.70361328125, -182.09234619140625, -178.48109436035156, -174.8698272705078, -171.25857543945312, -167.64730834960938, -164.03604125976562, -160.42477416992188, -156.8135223388672, -153.20225524902344, -149.59100341796875, -145.979736328125, -142.36846923828125, -138.75721740722656, -135.14596557617188, -131.53469848632812, -127.92344665527344, -124.31217956542969, -120.70092010498047, -117.08966064453125, -113.47840118408203, -109.86714172363281, -106.25587463378906, -102.64461517333984, -99.03335571289062, -95.42208862304688, -91.81082916259766, -88.19956970214844, -84.58831024169922, -80.97705078125, -77.36578369140625, -73.75452423095703, -70.14326477050781, -66.53199768066406, -62.920738220214844, -59.309478759765625, -55.698219299316406, -52.08695983886719, -48.47570037841797, -44.86444091796875, -41.253177642822266, -37.64191818237305, -34.03065490722656, -30.419395446777344, -26.808135986328125, -23.196874618530273, -19.585613250732422, -15.97435188293457, -12.363091468811035, -8.7518310546875, -5.140569686889648, -1.5293083190917969, 2.081951141357422, 5.693212509155273, 9.304474830627441]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 16.0, 17.0, 15.0, 13.0, 15.0, 28.0, 35.0, 31.0, 35.0, 38.0, 34.0, 47.0, 51.0, 44.0, 42.0, 28.0, 56.0, 47.0, 40.0, 34.0, 43.0, 40.0, 39.0, 24.0, 20.0, 29.0, 12.0, 18.0, 19.0, 15.0, 16.0, 13.0, 5.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.436010360717773, -13.035432815551758, -12.634855270385742, -12.234277725219727, -11.833700180053711, -11.433122634887695, -11.032544136047363, -10.631966590881348, -10.231389045715332, -9.830811500549316, -9.4302339553833, -9.029656410217285, -8.629077911376953, -8.228500366210938, -7.827922821044922, -7.427345275878906, -7.026767730712891, -6.626190185546875, -6.225612640380859, -5.8250346183776855, -5.42445707321167, -5.023879528045654, -4.6233015060424805, -4.222723960876465, -3.822146415710449, -3.4215688705444336, -3.020991086959839, -2.620413303375244, -2.2198357582092285, -1.819258213043213, -1.4186804294586182, -1.0181026458740234, -0.6175241470336914, -0.21694648265838623, 0.18363118171691895, 0.5842088460922241, 0.9847865104675293, 1.385364055633545, 1.7859418392181396, 2.1865196228027344, 2.58709716796875, 2.9876747131347656, 3.3882524967193604, 3.788830280303955, 4.189407825469971, 4.589985370635986, 4.99056339263916, 5.391140937805176, 5.791718482971191, 6.192296028137207, 6.592873573303223, 6.9934515953063965, 7.394029140472412, 7.794606685638428, 8.195184707641602, 8.595762252807617, 8.996339797973633, 9.396917343139648, 9.797494888305664, 10.19807243347168, 10.598649978637695, 10.999227523803711, 11.399806022644043, 11.800383567810059, 12.200961112976074]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 8.0, 9.0, 13.0, 12.0, 22.0, 27.0, 23.0, 27.0, 35.0, 31.0, 40.0, 32.0, 44.0, 48.0, 55.0, 47.0, 54.0, 47.0, 50.0, 49.0, 62.0, 49.0, 42.0, 30.0, 22.0, 23.0, 13.0, 21.0, 14.0, 8.0, 7.0, 9.0, 9.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1169586181640625, -1.075714111328125, -1.0344696044921875, -0.99322509765625, -0.9519805908203125, -0.910736083984375, -0.8694915771484375, -0.8282470703125, -0.7870025634765625, -0.745758056640625, -0.7045135498046875, -0.66326904296875, -0.6220245361328125, -0.580780029296875, -0.5395355224609375, -0.498291015625, -0.4570465087890625, -0.415802001953125, -0.3745574951171875, -0.33331298828125, -0.2920684814453125, -0.250823974609375, -0.2095794677734375, -0.1683349609375, -0.1270904541015625, -0.085845947265625, -0.0446014404296875, -0.00335693359375, 0.0378875732421875, 0.079132080078125, 0.1203765869140625, 0.16162109375, 0.2028656005859375, 0.244110107421875, 0.2853546142578125, 0.32659912109375, 0.3678436279296875, 0.409088134765625, 0.4503326416015625, 0.4915771484375, 0.5328216552734375, 0.574066162109375, 0.6153106689453125, 0.65655517578125, 0.6977996826171875, 0.739044189453125, 0.7802886962890625, 0.821533203125, 0.8627777099609375, 0.904022216796875, 0.9452667236328125, 0.98651123046875, 1.0277557373046875, 1.069000244140625, 1.1102447509765625, 1.1514892578125, 1.1927337646484375, 1.233978271484375, 1.2752227783203125, 1.31646728515625, 1.3577117919921875, 1.398956298828125, 1.4402008056640625, 1.4814453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 10.0, 9.0, 17.0, 27.0, 44.0, 80.0, 94.0, 166.0, 263.0, 421.0, 696.0, 1177.0, 2244.0, 4264.0, 8469.0, 19071.0, 53053.0, 249714.0, 2112948.0, 1506478.0, 162759.0, 40793.0, 15765.0, 7329.0, 3719.0, 1986.0, 1048.0, 644.0, 364.0, 229.0, 145.0, 86.0, 45.0, 37.0, 18.0, 17.0, 11.0, 7.0, 7.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.589996337890625, -2.50616455078125, -2.422332763671875, -2.3385009765625, -2.254669189453125, -2.17083740234375, -2.087005615234375, -2.003173828125, -1.919342041015625, -1.83551025390625, -1.751678466796875, -1.6678466796875, -1.584014892578125, -1.50018310546875, -1.416351318359375, -1.33251953125, -1.248687744140625, -1.16485595703125, -1.081024169921875, -0.9971923828125, -0.913360595703125, -0.82952880859375, -0.745697021484375, -0.661865234375, -0.578033447265625, -0.49420166015625, -0.410369873046875, -0.3265380859375, -0.242706298828125, -0.15887451171875, -0.075042724609375, 0.0087890625, 0.092620849609375, 0.17645263671875, 0.260284423828125, 0.3441162109375, 0.427947998046875, 0.51177978515625, 0.595611572265625, 0.679443359375, 0.763275146484375, 0.84710693359375, 0.930938720703125, 1.0147705078125, 1.098602294921875, 1.18243408203125, 1.266265869140625, 1.35009765625, 1.433929443359375, 1.51776123046875, 1.601593017578125, 1.6854248046875, 1.769256591796875, 1.85308837890625, 1.936920166015625, 2.020751953125, 2.104583740234375, 2.18841552734375, 2.272247314453125, 2.3560791015625, 2.439910888671875, 2.52374267578125, 2.607574462890625, 2.69140625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 16.0, 9.0, 20.0, 19.0, 26.0, 48.0, 69.0, 73.0, 100.0, 161.0, 279.0, 399.0, 610.0, 656.0, 539.0, 360.0, 231.0, 140.0, 83.0, 68.0, 51.0, 30.0, 23.0, 12.0, 17.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.174713134765625, -3.07012939453125, -2.965545654296875, -2.8609619140625, -2.756378173828125, -2.65179443359375, -2.547210693359375, -2.442626953125, -2.338043212890625, -2.23345947265625, -2.128875732421875, -2.0242919921875, -1.919708251953125, -1.81512451171875, -1.710540771484375, -1.60595703125, -1.501373291015625, -1.39678955078125, -1.292205810546875, -1.1876220703125, -1.083038330078125, -0.97845458984375, -0.873870849609375, -0.769287109375, -0.664703369140625, -0.56011962890625, -0.455535888671875, -0.3509521484375, -0.246368408203125, -0.14178466796875, -0.037200927734375, 0.0673828125, 0.171966552734375, 0.27655029296875, 0.381134033203125, 0.4857177734375, 0.590301513671875, 0.69488525390625, 0.799468994140625, 0.904052734375, 1.008636474609375, 1.11322021484375, 1.217803955078125, 1.3223876953125, 1.426971435546875, 1.53155517578125, 1.636138916015625, 1.74072265625, 1.845306396484375, 1.94989013671875, 2.054473876953125, 2.1590576171875, 2.263641357421875, 2.36822509765625, 2.472808837890625, 2.577392578125, 2.681976318359375, 2.78656005859375, 2.891143798828125, 2.9957275390625, 3.100311279296875, 3.20489501953125, 3.309478759765625, 3.4140625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 8.0, 10.0, 4.0, 5.0, 10.0, 19.0, 26.0, 38.0, 55.0, 94.0, 143.0, 198.0, 365.0, 615.0, 1099.0, 2136.0, 4358.0, 9587.0, 23335.0, 64683.0, 243754.0, 1746819.0, 1746482.0, 243759.0, 64905.0, 23245.0, 9475.0, 4248.0, 2116.0, 1075.0, 641.0, 337.0, 227.0, 141.0, 90.0, 50.0, 39.0, 21.0, 17.0, 11.0, 11.0, 6.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.751953125, -3.63470458984375, -3.5174560546875, -3.40020751953125, -3.282958984375, -3.16571044921875, -3.0484619140625, -2.93121337890625, -2.81396484375, -2.69671630859375, -2.5794677734375, -2.46221923828125, -2.344970703125, -2.22772216796875, -2.1104736328125, -1.99322509765625, -1.8759765625, -1.75872802734375, -1.6414794921875, -1.52423095703125, -1.406982421875, -1.28973388671875, -1.1724853515625, -1.05523681640625, -0.93798828125, -0.82073974609375, -0.7034912109375, -0.58624267578125, -0.468994140625, -0.35174560546875, -0.2344970703125, -0.11724853515625, 0.0, 0.11724853515625, 0.2344970703125, 0.35174560546875, 0.468994140625, 0.58624267578125, 0.7034912109375, 0.82073974609375, 0.93798828125, 1.05523681640625, 1.1724853515625, 1.28973388671875, 1.406982421875, 1.52423095703125, 1.6414794921875, 1.75872802734375, 1.8759765625, 1.99322509765625, 2.1104736328125, 2.22772216796875, 2.344970703125, 2.46221923828125, 2.5794677734375, 2.69671630859375, 2.81396484375, 2.93121337890625, 3.0484619140625, 3.16571044921875, 3.282958984375, 3.40020751953125, 3.5174560546875, 3.63470458984375, 3.751953125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 27.0, 43.0, 83.0, 123.0, 203.0, 220.0, 157.0, 85.0, 36.0, 14.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3842716217041, -24.446584701538086, -23.508895874023438, -22.571208953857422, -21.633522033691406, -20.69583511352539, -19.758148193359375, -18.820459365844727, -17.88277244567871, -16.945085525512695, -16.007396697998047, -15.069709777832031, -14.132022857666016, -13.1943359375, -12.256648063659668, -11.318960189819336, -10.38127326965332, -9.443586349487305, -8.505898475646973, -7.568211078643799, -6.630523681640625, -5.692836284637451, -4.755148887634277, -3.8174614906311035, -2.8797740936279297, -1.9420866966247559, -1.004399299621582, -0.0667119026184082, 0.8709754943847656, 1.8086628913879395, 2.7463502883911133, 3.684037685394287, 4.621726989746094, 5.559414386749268, 6.497101783752441, 7.434789180755615, 8.372476577758789, 9.310163497924805, 10.247851371765137, 11.185539245605469, 12.123226165771484, 13.0609130859375, 13.998600959777832, 14.936288833618164, 15.87397575378418, 16.811662673950195, 17.749351501464844, 18.68703842163086, 19.624725341796875, 20.56241226196289, 21.500099182128906, 22.437788009643555, 23.37547492980957, 24.313161849975586, 25.250850677490234, 26.18853759765625, 27.126224517822266, 28.06391143798828, 29.001598358154297, 29.939287185668945, 30.87697410583496, 31.814661026000977, 32.752349853515625, 33.69003677368164, 34.627723693847656]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 13.0, 12.0, 7.0, 18.0, 15.0, 27.0, 17.0, 24.0, 21.0, 29.0, 24.0, 33.0, 35.0, 37.0, 38.0, 39.0, 32.0, 43.0, 32.0, 42.0, 31.0, 39.0, 41.0, 30.0, 28.0, 32.0, 34.0, 22.0, 24.0, 26.0, 18.0, 20.0, 12.0, 18.0, 9.0, 16.0, 3.0, 8.0, 7.0, 5.0, 4.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.944015026092529, -7.674643039703369, -7.405271053314209, -7.135899066925049, -6.866527080535889, -6.5971550941467285, -6.327783107757568, -6.058411121368408, -5.789039134979248, -5.519667148590088, -5.250295162200928, -4.980923175811768, -4.711551189422607, -4.442179203033447, -4.172807216644287, -3.903435230255127, -3.634063243865967, -3.3646912574768066, -3.0953192710876465, -2.8259472846984863, -2.556575298309326, -2.287203311920166, -2.017831325531006, -1.7484593391418457, -1.4790873527526855, -1.2097153663635254, -0.9403433799743652, -0.6709713935852051, -0.4015994071960449, -0.13222742080688477, 0.1371445655822754, 0.40651655197143555, 0.6758880615234375, 0.9452600479125977, 1.2146320343017578, 1.484004020690918, 1.7533760070800781, 2.0227479934692383, 2.2921199798583984, 2.5614919662475586, 2.8308639526367188, 3.100235939025879, 3.369607925415039, 3.638979911804199, 3.9083518981933594, 4.1777238845825195, 4.44709587097168, 4.71646785736084, 4.98583984375, 5.25521183013916, 5.52458381652832, 5.7939558029174805, 6.063327789306641, 6.332699775695801, 6.602071762084961, 6.871443748474121, 7.140815734863281, 7.410187721252441, 7.679559707641602, 7.948931694030762, 8.218303680419922, 8.487675666809082, 8.757047653198242, 9.026419639587402, 9.295791625976562]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 4.0, 9.0, 8.0, 7.0, 6.0, 9.0, 17.0, 26.0, 22.0, 22.0, 23.0, 33.0, 39.0, 39.0, 46.0, 42.0, 52.0, 51.0, 68.0, 52.0, 57.0, 48.0, 45.0, 35.0, 35.0, 30.0, 30.0, 27.0, 28.0, 23.0, 17.0, 9.0, 8.0, 7.0, 7.0, 12.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3330078125, -1.2921142578125, -1.251220703125, -1.2103271484375, -1.16943359375, -1.1285400390625, -1.087646484375, -1.0467529296875, -1.005859375, -0.9649658203125, -0.924072265625, -0.8831787109375, -0.84228515625, -0.8013916015625, -0.760498046875, -0.7196044921875, -0.6787109375, -0.6378173828125, -0.596923828125, -0.5560302734375, -0.51513671875, -0.4742431640625, -0.433349609375, -0.3924560546875, -0.3515625, -0.3106689453125, -0.269775390625, -0.2288818359375, -0.18798828125, -0.1470947265625, -0.106201171875, -0.0653076171875, -0.0244140625, 0.0164794921875, 0.057373046875, 0.0982666015625, 0.13916015625, 0.1800537109375, 0.220947265625, 0.2618408203125, 0.302734375, 0.3436279296875, 0.384521484375, 0.4254150390625, 0.46630859375, 0.5072021484375, 0.548095703125, 0.5889892578125, 0.6298828125, 0.6707763671875, 0.711669921875, 0.7525634765625, 0.79345703125, 0.8343505859375, 0.875244140625, 0.9161376953125, 0.95703125, 0.9979248046875, 1.038818359375, 1.0797119140625, 1.12060546875, 1.1614990234375, 1.202392578125, 1.2432861328125, 1.2841796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 9.0, 13.0, 19.0, 24.0, 66.0, 77.0, 100.0, 179.0, 277.0, 405.0, 664.0, 1006.0, 1648.0, 2646.0, 4369.0, 7140.0, 11869.0, 19718.0, 32518.0, 51973.0, 79943.0, 114080.0, 142926.0, 153150.0, 134617.0, 103150.0, 70423.0, 44803.0, 27524.0, 16989.0, 10154.0, 6145.0, 3798.0, 2268.0, 1447.0, 855.0, 526.0, 377.0, 240.0, 153.0, 84.0, 58.0, 46.0, 23.0, 26.0, 8.0, 11.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7539596557617188, -0.7291107177734375, -0.7042617797851562, -0.679412841796875, -0.6545639038085938, -0.6297149658203125, -0.6048660278320312, -0.58001708984375, -0.5551681518554688, -0.5303192138671875, -0.5054702758789062, -0.480621337890625, -0.45577239990234375, -0.4309234619140625, -0.40607452392578125, -0.3812255859375, -0.35637664794921875, -0.3315277099609375, -0.30667877197265625, -0.281829833984375, -0.25698089599609375, -0.2321319580078125, -0.20728302001953125, -0.18243408203125, -0.15758514404296875, -0.1327362060546875, -0.10788726806640625, -0.083038330078125, -0.05818939208984375, -0.0333404541015625, -0.00849151611328125, 0.016357421875, 0.04120635986328125, 0.0660552978515625, 0.09090423583984375, 0.115753173828125, 0.14060211181640625, 0.1654510498046875, 0.19029998779296875, 0.21514892578125, 0.23999786376953125, 0.2648468017578125, 0.28969573974609375, 0.314544677734375, 0.33939361572265625, 0.3642425537109375, 0.38909149169921875, 0.4139404296875, 0.43878936767578125, 0.4636383056640625, 0.48848724365234375, 0.513336181640625, 0.5381851196289062, 0.5630340576171875, 0.5878829956054688, 0.61273193359375, 0.6375808715820312, 0.6624298095703125, 0.6872787475585938, 0.712127685546875, 0.7369766235351562, 0.7618255615234375, 0.7866744995117188, 0.8115234375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 12.0, 3.0, 6.0, 9.0, 9.0, 14.0, 21.0, 17.0, 19.0, 27.0, 31.0, 39.0, 38.0, 38.0, 49.0, 42.0, 41.0, 42.0, 1070.0, 40.0, 48.0, 44.0, 41.0, 43.0, 36.0, 44.0, 31.0, 30.0, 22.0, 19.0, 18.0, 18.0, 14.0, 19.0, 6.0, 13.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2398223876953125, -1.199371337890625, -1.1589202880859375, -1.11846923828125, -1.0780181884765625, -1.037567138671875, -0.9971160888671875, -0.9566650390625, -0.9162139892578125, -0.875762939453125, -0.8353118896484375, -0.79486083984375, -0.7544097900390625, -0.713958740234375, -0.6735076904296875, -0.633056640625, -0.5926055908203125, -0.552154541015625, -0.5117034912109375, -0.47125244140625, -0.4308013916015625, -0.390350341796875, -0.3498992919921875, -0.3094482421875, -0.2689971923828125, -0.228546142578125, -0.1880950927734375, -0.14764404296875, -0.1071929931640625, -0.066741943359375, -0.0262908935546875, 0.01416015625, 0.0546112060546875, 0.095062255859375, 0.1355133056640625, 0.17596435546875, 0.2164154052734375, 0.256866455078125, 0.2973175048828125, 0.3377685546875, 0.3782196044921875, 0.418670654296875, 0.4591217041015625, 0.49957275390625, 0.5400238037109375, 0.580474853515625, 0.6209259033203125, 0.661376953125, 0.7018280029296875, 0.742279052734375, 0.7827301025390625, 0.82318115234375, 0.8636322021484375, 0.904083251953125, 0.9445343017578125, 0.9849853515625, 1.0254364013671875, 1.065887451171875, 1.1063385009765625, 1.14678955078125, 1.1872406005859375, 1.227691650390625, 1.2681427001953125, 1.30859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 14.0, 17.0, 17.0, 39.0, 61.0, 84.0, 114.0, 175.0, 221.0, 361.0, 519.0, 845.0, 1208.0, 1868.0, 2752.0, 4387.0, 6774.0, 10654.0, 17978.0, 34997.0, 133542.0, 1558892.0, 223651.0, 43912.0, 20384.0, 11874.0, 7635.0, 4814.0, 3184.0, 2051.0, 1372.0, 896.0, 620.0, 372.0, 262.0, 162.0, 127.0, 88.0, 58.0, 53.0, 29.0, 23.0, 14.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0363006591796875, -1.001312255859375, -0.9663238525390625, -0.93133544921875, -0.8963470458984375, -0.861358642578125, -0.8263702392578125, -0.7913818359375, -0.7563934326171875, -0.721405029296875, -0.6864166259765625, -0.65142822265625, -0.6164398193359375, -0.581451416015625, -0.5464630126953125, -0.511474609375, -0.4764862060546875, -0.441497802734375, -0.4065093994140625, -0.37152099609375, -0.3365325927734375, -0.301544189453125, -0.2665557861328125, -0.2315673828125, -0.1965789794921875, -0.161590576171875, -0.1266021728515625, -0.09161376953125, -0.0566253662109375, -0.021636962890625, 0.0133514404296875, 0.04833984375, 0.0833282470703125, 0.118316650390625, 0.1533050537109375, 0.18829345703125, 0.2232818603515625, 0.258270263671875, 0.2932586669921875, 0.3282470703125, 0.3632354736328125, 0.398223876953125, 0.4332122802734375, 0.46820068359375, 0.5031890869140625, 0.538177490234375, 0.5731658935546875, 0.608154296875, 0.6431427001953125, 0.678131103515625, 0.7131195068359375, 0.74810791015625, 0.7830963134765625, 0.818084716796875, 0.8530731201171875, 0.8880615234375, 0.9230499267578125, 0.958038330078125, 0.9930267333984375, 1.02801513671875, 1.0630035400390625, 1.097991943359375, 1.1329803466796875, 1.16796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 3.0, 12.0, 13.0, 15.0, 21.0, 14.0, 23.0, 31.0, 26.0, 30.0, 45.0, 58.0, 62.0, 69.0, 52.0, 58.0, 64.0, 61.0, 47.0, 45.0, 48.0, 30.0, 21.0, 32.0, 23.0, 15.0, 11.0, 18.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10654544830322266, -0.10243415832519531, -0.09832286834716797, -0.09421157836914062, -0.09010028839111328, -0.08598899841308594, -0.0818777084350586, -0.07776641845703125, -0.0736551284790039, -0.06954383850097656, -0.06543254852294922, -0.061321258544921875, -0.05720996856689453, -0.05309867858886719, -0.048987388610839844, -0.0448760986328125, -0.040764808654785156, -0.03665351867675781, -0.03254222869873047, -0.028430938720703125, -0.02431964874267578, -0.020208358764648438, -0.016097068786621094, -0.01198577880859375, -0.007874488830566406, -0.0037631988525390625, 0.00034809112548828125, 0.004459381103515625, 0.008570671081542969, 0.012681961059570312, 0.016793251037597656, 0.020904541015625, 0.025015830993652344, 0.029127120971679688, 0.03323841094970703, 0.037349700927734375, 0.04146099090576172, 0.04557228088378906, 0.049683570861816406, 0.05379486083984375, 0.057906150817871094, 0.06201744079589844, 0.06612873077392578, 0.07024002075195312, 0.07435131072998047, 0.07846260070800781, 0.08257389068603516, 0.0866851806640625, 0.09079647064208984, 0.09490776062011719, 0.09901905059814453, 0.10313034057617188, 0.10724163055419922, 0.11135292053222656, 0.1154642105102539, 0.11957550048828125, 0.1236867904663086, 0.12779808044433594, 0.13190937042236328, 0.13602066040039062, 0.14013195037841797, 0.1442432403564453, 0.14835453033447266, 0.1524658203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 9.0, 14.0, 7.0, 21.0, 22.0, 28.0, 43.0, 64.0, 94.0, 163.0, 340.0, 1043.0, 6582.0, 81715.0, 878114.0, 72385.0, 6079.0, 984.0, 333.0, 163.0, 104.0, 56.0, 47.0, 38.0, 26.0, 14.0, 21.0, 5.0, 9.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.42144775390625, -2.3585205078125, -2.29559326171875, -2.232666015625, -2.16973876953125, -2.1068115234375, -2.04388427734375, -1.98095703125, -1.91802978515625, -1.8551025390625, -1.79217529296875, -1.729248046875, -1.66632080078125, -1.6033935546875, -1.54046630859375, -1.4775390625, -1.41461181640625, -1.3516845703125, -1.28875732421875, -1.225830078125, -1.16290283203125, -1.0999755859375, -1.03704833984375, -0.97412109375, -0.91119384765625, -0.8482666015625, -0.78533935546875, -0.722412109375, -0.65948486328125, -0.5965576171875, -0.53363037109375, -0.470703125, -0.40777587890625, -0.3448486328125, -0.28192138671875, -0.218994140625, -0.15606689453125, -0.0931396484375, -0.03021240234375, 0.03271484375, 0.09564208984375, 0.1585693359375, 0.22149658203125, 0.284423828125, 0.34735107421875, 0.4102783203125, 0.47320556640625, 0.5361328125, 0.59906005859375, 0.6619873046875, 0.72491455078125, 0.787841796875, 0.85076904296875, 0.9136962890625, 0.97662353515625, 1.03955078125, 1.10247802734375, 1.1654052734375, 1.22833251953125, 1.291259765625, 1.35418701171875, 1.4171142578125, 1.48004150390625, 1.54296875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 14.0, 33.0, 95.0, 191.0, 301.0, 200.0, 89.0, 40.0, 17.0, 11.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8741536140441895, -2.807976007461548, -2.7417984008789062, -2.6756210327148438, -2.609443426132202, -2.5432658195495605, -2.477088212966919, -2.4109106063842773, -2.344733238220215, -2.2785556316375732, -2.2123780250549316, -2.146200656890869, -2.0800230503082275, -2.013845443725586, -1.9476678371429443, -1.8814902305603027, -1.8153126239776611, -1.7491350173950195, -1.6829575300216675, -1.6167799234390259, -1.5506024360656738, -1.4844248294830322, -1.4182472229003906, -1.352069616317749, -1.285892128944397, -1.2197145223617554, -1.1535370349884033, -1.0873594284057617, -1.0211818218231201, -0.9550043344497681, -0.8888267278671265, -0.8226491808891296, -0.7564716339111328, -0.690294086933136, -0.6241165399551392, -0.5579389333724976, -0.49176138639450073, -0.4255838394165039, -0.3594062626361847, -0.2932286858558655, -0.22705113887786865, -0.16087357699871063, -0.09469601511955261, -0.028518453240394592, 0.03765910863876343, 0.10383665561676025, 0.17001423239707947, 0.23619180917739868, 0.3023693561553955, 0.36854690313339233, 0.43472447991371155, 0.5009020566940308, 0.5670796036720276, 0.6332571506500244, 0.699434757232666, 0.7656123042106628, 0.8317898511886597, 0.8979673981666565, 0.9641449451446533, 1.030322551727295, 1.0965001583099365, 1.1626776456832886, 1.2288552522659302, 1.2950327396392822, 1.3612103462219238]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 12.0, 14.0, 6.0, 10.0, 17.0, 23.0, 37.0, 40.0, 32.0, 28.0, 39.0, 28.0, 51.0, 45.0, 61.0, 45.0, 53.0, 53.0, 50.0, 40.0, 43.0, 40.0, 39.0, 30.0, 25.0, 25.0, 28.0, 21.0, 11.0, 17.0, 7.0, 6.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.500812292098999, -0.4838857054710388, -0.4669591188430786, -0.4500325322151184, -0.4331059455871582, -0.416179358959198, -0.3992527723312378, -0.3823261857032776, -0.3653995990753174, -0.3484730124473572, -0.331546425819397, -0.31461983919143677, -0.29769325256347656, -0.28076666593551636, -0.26384007930755615, -0.24691349267959595, -0.22998690605163574, -0.21306031942367554, -0.19613373279571533, -0.17920714616775513, -0.16228055953979492, -0.14535397291183472, -0.1284273862838745, -0.1115007996559143, -0.0945742130279541, -0.0776476263999939, -0.06072103977203369, -0.043794453144073486, -0.02686786651611328, -0.009941279888153076, 0.006985306739807129, 0.023911893367767334, 0.04083847999572754, 0.057765066623687744, 0.07469165325164795, 0.09161823987960815, 0.10854482650756836, 0.12547141313552856, 0.14239799976348877, 0.15932458639144897, 0.17625117301940918, 0.19317775964736938, 0.2101043462753296, 0.2270309329032898, 0.24395751953125, 0.2608841061592102, 0.2778106927871704, 0.2947372794151306, 0.3116638660430908, 0.328590452671051, 0.34551703929901123, 0.36244362592697144, 0.37937021255493164, 0.39629679918289185, 0.41322338581085205, 0.43014997243881226, 0.44707655906677246, 0.46400314569473267, 0.48092973232269287, 0.4978563189506531, 0.5147829055786133, 0.5317094922065735, 0.5486360788345337, 0.5655626654624939, 0.5824892520904541]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 5.0, 6.0, 13.0, 12.0, 19.0, 29.0, 35.0, 36.0, 34.0, 45.0, 46.0, 40.0, 56.0, 64.0, 64.0, 63.0, 55.0, 54.0, 46.0, 45.0, 41.0, 31.0, 29.0, 27.0, 23.0, 17.0, 23.0, 9.0, 10.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.533203125, -1.4862213134765625, -1.439239501953125, -1.3922576904296875, -1.34527587890625, -1.2982940673828125, -1.251312255859375, -1.2043304443359375, -1.1573486328125, -1.1103668212890625, -1.063385009765625, -1.0164031982421875, -0.96942138671875, -0.9224395751953125, -0.875457763671875, -0.8284759521484375, -0.781494140625, -0.7345123291015625, -0.687530517578125, -0.6405487060546875, -0.59356689453125, -0.5465850830078125, -0.499603271484375, -0.4526214599609375, -0.4056396484375, -0.3586578369140625, -0.311676025390625, -0.2646942138671875, -0.21771240234375, -0.1707305908203125, -0.123748779296875, -0.0767669677734375, -0.02978515625, 0.0171966552734375, 0.064178466796875, 0.1111602783203125, 0.15814208984375, 0.2051239013671875, 0.252105712890625, 0.2990875244140625, 0.3460693359375, 0.3930511474609375, 0.440032958984375, 0.4870147705078125, 0.53399658203125, 0.5809783935546875, 0.627960205078125, 0.6749420166015625, 0.721923828125, 0.7689056396484375, 0.815887451171875, 0.8628692626953125, 0.90985107421875, 0.9568328857421875, 1.003814697265625, 1.0507965087890625, 1.0977783203125, 1.1447601318359375, 1.191741943359375, 1.2387237548828125, 1.28570556640625, 1.3326873779296875, 1.379669189453125, 1.4266510009765625, 1.4736328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 14.0, 27.0, 39.0, 69.0, 99.0, 189.0, 310.0, 505.0, 906.0, 1630.0, 2959.0, 5679.0, 11486.0, 26618.0, 79182.0, 394857.0, 393615.0, 79777.0, 26389.0, 11675.0, 5681.0, 2946.0, 1686.0, 957.0, 522.0, 297.0, 163.0, 99.0, 62.0, 29.0, 22.0, 19.0, 14.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51171875, -2.4332275390625, -2.354736328125, -2.2762451171875, -2.19775390625, -2.1192626953125, -2.040771484375, -1.9622802734375, -1.8837890625, -1.8052978515625, -1.726806640625, -1.6483154296875, -1.56982421875, -1.4913330078125, -1.412841796875, -1.3343505859375, -1.255859375, -1.1773681640625, -1.098876953125, -1.0203857421875, -0.94189453125, -0.8634033203125, -0.784912109375, -0.7064208984375, -0.6279296875, -0.5494384765625, -0.470947265625, -0.3924560546875, -0.31396484375, -0.2354736328125, -0.156982421875, -0.0784912109375, 0.0, 0.0784912109375, 0.156982421875, 0.2354736328125, 0.31396484375, 0.3924560546875, 0.470947265625, 0.5494384765625, 0.6279296875, 0.7064208984375, 0.784912109375, 0.8634033203125, 0.94189453125, 1.0203857421875, 1.098876953125, 1.1773681640625, 1.255859375, 1.3343505859375, 1.412841796875, 1.4913330078125, 1.56982421875, 1.6483154296875, 1.726806640625, 1.8052978515625, 1.8837890625, 1.9622802734375, 2.040771484375, 2.1192626953125, 2.19775390625, 2.2762451171875, 2.354736328125, 2.4332275390625, 2.51171875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 10.0, 3.0, 8.0, 7.0, 9.0, 7.0, 13.0, 25.0, 31.0, 33.0, 26.0, 48.0, 55.0, 50.0, 79.0, 95.0, 169.0, 378.0, 1378.0, 143.0, 100.0, 81.0, 46.0, 54.0, 50.0, 28.0, 22.0, 27.0, 16.0, 16.0, 8.0, 11.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.57293701171875, -4.4036865234375, -4.23443603515625, -4.065185546875, -3.89593505859375, -3.7266845703125, -3.55743408203125, -3.38818359375, -3.21893310546875, -3.0496826171875, -2.88043212890625, -2.711181640625, -2.54193115234375, -2.3726806640625, -2.20343017578125, -2.0341796875, -1.86492919921875, -1.6956787109375, -1.52642822265625, -1.357177734375, -1.18792724609375, -1.0186767578125, -0.84942626953125, -0.68017578125, -0.51092529296875, -0.3416748046875, -0.17242431640625, -0.003173828125, 0.16607666015625, 0.3353271484375, 0.50457763671875, 0.673828125, 0.84307861328125, 1.0123291015625, 1.18157958984375, 1.350830078125, 1.52008056640625, 1.6893310546875, 1.85858154296875, 2.02783203125, 2.19708251953125, 2.3663330078125, 2.53558349609375, 2.704833984375, 2.87408447265625, 3.0433349609375, 3.21258544921875, 3.3818359375, 3.55108642578125, 3.7203369140625, 3.88958740234375, 4.058837890625, 4.22808837890625, 4.3973388671875, 4.56658935546875, 4.73583984375, 4.90509033203125, 5.0743408203125, 5.24359130859375, 5.412841796875, 5.58209228515625, 5.7513427734375, 5.92059326171875, 6.08984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 7.0, 11.0, 12.0, 17.0, 16.0, 32.0, 48.0, 55.0, 90.0, 156.0, 288.0, 553.0, 1544.0, 7326.0, 73949.0, 2789426.0, 252390.0, 15464.0, 2631.0, 761.0, 336.0, 205.0, 123.0, 78.0, 48.0, 36.0, 25.0, 15.0, 11.0, 17.0, 11.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.6273193359375, -9.332763671875, -9.0382080078125, -8.74365234375, -8.4490966796875, -8.154541015625, -7.8599853515625, -7.5654296875, -7.2708740234375, -6.976318359375, -6.6817626953125, -6.38720703125, -6.0926513671875, -5.798095703125, -5.5035400390625, -5.208984375, -4.9144287109375, -4.619873046875, -4.3253173828125, -4.03076171875, -3.7362060546875, -3.441650390625, -3.1470947265625, -2.8525390625, -2.5579833984375, -2.263427734375, -1.9688720703125, -1.67431640625, -1.3797607421875, -1.085205078125, -0.7906494140625, -0.49609375, -0.2015380859375, 0.093017578125, 0.3875732421875, 0.68212890625, 0.9766845703125, 1.271240234375, 1.5657958984375, 1.8603515625, 2.1549072265625, 2.449462890625, 2.7440185546875, 3.03857421875, 3.3331298828125, 3.627685546875, 3.9222412109375, 4.216796875, 4.5113525390625, 4.805908203125, 5.1004638671875, 5.39501953125, 5.6895751953125, 5.984130859375, 6.2786865234375, 6.5732421875, 6.8677978515625, 7.162353515625, 7.4569091796875, 7.75146484375, 8.0460205078125, 8.340576171875, 8.6351318359375, 8.9296875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 40.0, 290.0, 536.0, 130.0, 17.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.43467712402344, -72.67379760742188, -70.91292572021484, -69.15204620361328, -67.39116668701172, -65.63029479980469, -63.869415283203125, -62.10853576660156, -60.347660064697266, -58.58678436279297, -56.825904846191406, -55.06502914428711, -53.30415344238281, -51.54327392578125, -49.78239822387695, -48.021522521972656, -46.260643005371094, -44.4997673034668, -42.738887786865234, -40.97801208496094, -39.21713638305664, -37.45625686645508, -35.69538116455078, -33.93450164794922, -32.17362976074219, -30.412752151489258, -28.65187644958496, -26.89099884033203, -25.1301212310791, -23.369243621826172, -21.608367919921875, -19.847490310668945, -18.086612701416016, -16.325735092163086, -14.564858436584473, -12.80398178100586, -11.04310417175293, -9.282227516174316, -7.521350860595703, -5.760473251342773, -3.99959659576416, -2.2387194633483887, -0.4778425693511963, 1.283034324645996, 3.0439114570617676, 4.804788589477539, 6.565665245056152, 8.326542854309082, 10.087419509887695, 11.848296165466309, 13.609173774719238, 15.370050430297852, 17.13092803955078, 18.891803741455078, 20.652681350708008, 22.413558959960938, 24.174434661865234, 25.935312271118164, 27.69618797302246, 29.45706558227539, 31.21794319152832, 32.97882080078125, 34.73969650268555, 36.500572204589844, 38.261451721191406]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 9.0, 10.0, 12.0, 10.0, 14.0, 17.0, 16.0, 22.0, 31.0, 31.0, 29.0, 28.0, 30.0, 22.0, 36.0, 36.0, 33.0, 46.0, 30.0, 34.0, 46.0, 50.0, 35.0, 42.0, 27.0, 37.0, 26.0, 25.0, 34.0, 23.0, 20.0, 26.0, 17.0, 19.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.29312801361084, -9.966480255126953, -9.639832496643066, -9.31318473815918, -8.98653793334961, -8.659890174865723, -8.333242416381836, -8.00659465789795, -7.6799468994140625, -7.353299140930176, -7.026651382446289, -6.7000041007995605, -6.373356342315674, -6.046708583831787, -5.720061302185059, -5.393413543701172, -5.066765785217285, -4.740118026733398, -4.413470268249512, -4.086822986602783, -3.7601752281188965, -3.4335274696350098, -3.106879949569702, -2.7802324295043945, -2.453584671020508, -2.126936912536621, -1.8002893924713135, -1.4736417531967163, -1.1469941139221191, -0.820346474647522, -0.4936988353729248, -0.1670513153076172, 0.15959548950195312, 0.4862431287765503, 0.8128907680511475, 1.1395384073257446, 1.4661860466003418, 1.792833685874939, 2.119481325149536, 2.4461288452148438, 2.7727766036987305, 3.099424362182617, 3.426071882247925, 3.7527194023132324, 4.079367160797119, 4.406014919281006, 4.732662200927734, 5.059309959411621, 5.385957717895508, 5.7126054763793945, 6.039253234863281, 6.36590051651001, 6.6925482749938965, 7.019196033477783, 7.345843315124512, 7.672491073608398, 7.999138832092285, 8.325786590576172, 8.652434349060059, 8.979082107543945, 9.305728912353516, 9.632376670837402, 9.959024429321289, 10.285672187805176, 10.612319946289062]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 9.0, 8.0, 16.0, 14.0, 27.0, 24.0, 24.0, 30.0, 30.0, 35.0, 50.0, 39.0, 40.0, 60.0, 56.0, 51.0, 56.0, 65.0, 56.0, 40.0, 35.0, 37.0, 27.0, 24.0, 24.0, 20.0, 16.0, 16.0, 13.0, 8.0, 5.0, 5.0, 2.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.392578125, -1.3492279052734375, -1.305877685546875, -1.2625274658203125, -1.21917724609375, -1.1758270263671875, -1.132476806640625, -1.0891265869140625, -1.0457763671875, -1.0024261474609375, -0.959075927734375, -0.9157257080078125, -0.87237548828125, -0.8290252685546875, -0.785675048828125, -0.7423248291015625, -0.698974609375, -0.6556243896484375, -0.612274169921875, -0.5689239501953125, -0.52557373046875, -0.4822235107421875, -0.438873291015625, -0.3955230712890625, -0.3521728515625, -0.3088226318359375, -0.265472412109375, -0.2221221923828125, -0.17877197265625, -0.1354217529296875, -0.092071533203125, -0.0487213134765625, -0.00537109375, 0.0379791259765625, 0.081329345703125, 0.1246795654296875, 0.16802978515625, 0.2113800048828125, 0.254730224609375, 0.2980804443359375, 0.3414306640625, 0.3847808837890625, 0.428131103515625, 0.4714813232421875, 0.51483154296875, 0.5581817626953125, 0.601531982421875, 0.6448822021484375, 0.688232421875, 0.7315826416015625, 0.774932861328125, 0.8182830810546875, 0.86163330078125, 0.9049835205078125, 0.948333740234375, 0.9916839599609375, 1.0350341796875, 1.0783843994140625, 1.121734619140625, 1.1650848388671875, 1.20843505859375, 1.2517852783203125, 1.295135498046875, 1.3384857177734375, 1.3818359375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 10.0, 9.0, 21.0, 26.0, 28.0, 38.0, 53.0, 49.0, 104.0, 170.0, 357.0, 816.0, 2196.0, 6318.0, 23345.0, 150239.0, 2792422.0, 1130931.0, 65058.0, 14454.0, 4576.0, 1607.0, 702.0, 308.0, 151.0, 86.0, 50.0, 38.0, 24.0, 20.0, 15.0, 13.0, 8.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4765625, -4.34417724609375, -4.2117919921875, -4.07940673828125, -3.947021484375, -3.81463623046875, -3.6822509765625, -3.54986572265625, -3.41748046875, -3.28509521484375, -3.1527099609375, -3.02032470703125, -2.887939453125, -2.75555419921875, -2.6231689453125, -2.49078369140625, -2.3583984375, -2.22601318359375, -2.0936279296875, -1.96124267578125, -1.828857421875, -1.69647216796875, -1.5640869140625, -1.43170166015625, -1.29931640625, -1.16693115234375, -1.0345458984375, -0.90216064453125, -0.769775390625, -0.63739013671875, -0.5050048828125, -0.37261962890625, -0.240234375, -0.10784912109375, 0.0245361328125, 0.15692138671875, 0.289306640625, 0.42169189453125, 0.5540771484375, 0.68646240234375, 0.81884765625, 0.95123291015625, 1.0836181640625, 1.21600341796875, 1.348388671875, 1.48077392578125, 1.6131591796875, 1.74554443359375, 1.8779296875, 2.01031494140625, 2.1427001953125, 2.27508544921875, 2.407470703125, 2.53985595703125, 2.6722412109375, 2.80462646484375, 2.93701171875, 3.06939697265625, 3.2017822265625, 3.33416748046875, 3.466552734375, 3.59893798828125, 3.7313232421875, 3.86370849609375, 3.99609375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 4.0, 9.0, 13.0, 14.0, 19.0, 23.0, 35.0, 37.0, 60.0, 79.0, 86.0, 142.0, 170.0, 252.0, 362.0, 497.0, 566.0, 497.0, 370.0, 238.0, 151.0, 112.0, 73.0, 58.0, 50.0, 31.0, 26.0, 22.0, 21.0, 12.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.00390625, -2.916412353515625, -2.82891845703125, -2.741424560546875, -2.6539306640625, -2.566436767578125, -2.47894287109375, -2.391448974609375, -2.303955078125, -2.216461181640625, -2.12896728515625, -2.041473388671875, -1.9539794921875, -1.866485595703125, -1.77899169921875, -1.691497802734375, -1.60400390625, -1.516510009765625, -1.42901611328125, -1.341522216796875, -1.2540283203125, -1.166534423828125, -1.07904052734375, -0.991546630859375, -0.904052734375, -0.816558837890625, -0.72906494140625, -0.641571044921875, -0.5540771484375, -0.466583251953125, -0.37908935546875, -0.291595458984375, -0.2041015625, -0.116607666015625, -0.02911376953125, 0.058380126953125, 0.1458740234375, 0.233367919921875, 0.32086181640625, 0.408355712890625, 0.495849609375, 0.583343505859375, 0.67083740234375, 0.758331298828125, 0.8458251953125, 0.933319091796875, 1.02081298828125, 1.108306884765625, 1.19580078125, 1.283294677734375, 1.37078857421875, 1.458282470703125, 1.5457763671875, 1.633270263671875, 1.72076416015625, 1.808258056640625, 1.895751953125, 1.983245849609375, 2.07073974609375, 2.158233642578125, 2.2457275390625, 2.333221435546875, 2.42071533203125, 2.508209228515625, 2.595703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 10.0, 22.0, 24.0, 37.0, 42.0, 72.0, 125.0, 233.0, 550.0, 1289.0, 3959.0, 16782.0, 107224.0, 2402782.0, 1560249.0, 81754.0, 13508.0, 3408.0, 1134.0, 468.0, 229.0, 122.0, 79.0, 50.0, 29.0, 18.0, 15.0, 12.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.76995849609375, -6.5438232421875, -6.31768798828125, -6.091552734375, -5.86541748046875, -5.6392822265625, -5.41314697265625, -5.18701171875, -4.96087646484375, -4.7347412109375, -4.50860595703125, -4.282470703125, -4.05633544921875, -3.8302001953125, -3.60406494140625, -3.3779296875, -3.15179443359375, -2.9256591796875, -2.69952392578125, -2.473388671875, -2.24725341796875, -2.0211181640625, -1.79498291015625, -1.56884765625, -1.34271240234375, -1.1165771484375, -0.89044189453125, -0.664306640625, -0.43817138671875, -0.2120361328125, 0.01409912109375, 0.240234375, 0.46636962890625, 0.6925048828125, 0.91864013671875, 1.144775390625, 1.37091064453125, 1.5970458984375, 1.82318115234375, 2.04931640625, 2.27545166015625, 2.5015869140625, 2.72772216796875, 2.953857421875, 3.17999267578125, 3.4061279296875, 3.63226318359375, 3.8583984375, 4.08453369140625, 4.3106689453125, 4.53680419921875, 4.762939453125, 4.98907470703125, 5.2152099609375, 5.44134521484375, 5.66748046875, 5.89361572265625, 6.1197509765625, 6.34588623046875, 6.572021484375, 6.79815673828125, 7.0242919921875, 7.25042724609375, 7.4765625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 15.0, 26.0, 54.0, 108.0, 185.0, 208.0, 186.0, 120.0, 60.0, 25.0, 13.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.76798629760742, -31.846311569213867, -30.92463493347168, -30.002960205078125, -29.08128547668457, -28.159608840942383, -27.237934112548828, -26.31625747680664, -25.394582748413086, -24.47290802001953, -23.551231384277344, -22.62955665588379, -21.707881927490234, -20.786205291748047, -19.864530563354492, -18.942855834960938, -18.02117919921875, -17.099504470825195, -16.177827835083008, -15.256153106689453, -14.334477424621582, -13.412801742553711, -12.491127014160156, -11.569451332092285, -10.647777557373047, -9.726101875305176, -8.804427146911621, -7.88275146484375, -6.961075782775879, -6.039400577545166, -5.117725372314453, -4.196049690246582, -3.274374008178711, -2.352698564529419, -1.4310232400894165, -0.5093479156494141, 0.41232752799987793, 1.33400297164917, 2.255678176879883, 3.177353858947754, 4.099029064178467, 5.02070426940918, 5.942379951477051, 6.864055156707764, 7.785730361938477, 8.707406044006348, 9.629081726074219, 10.550756454467773, 11.472432136535645, 12.394107818603516, 13.31578254699707, 14.237458229064941, 15.159133911132812, 16.080808639526367, 17.002483367919922, 17.92416000366211, 18.845834732055664, 19.76750946044922, 20.689186096191406, 21.61086082458496, 22.532535552978516, 23.454212188720703, 24.375886917114258, 25.297561645507812, 26.21923828125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 14.0, 11.0, 12.0, 6.0, 13.0, 15.0, 26.0, 21.0, 26.0, 27.0, 27.0, 32.0, 36.0, 46.0, 40.0, 45.0, 50.0, 26.0, 32.0, 33.0, 46.0, 41.0, 39.0, 39.0, 23.0, 39.0, 26.0, 31.0, 30.0, 28.0, 24.0, 6.0, 19.0, 12.0, 11.0, 8.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.187625885009766, -8.903886795043945, -8.620147705078125, -8.336409568786621, -8.0526704788208, -7.7689313888549805, -7.485192775726318, -7.201454162597656, -6.917715072631836, -6.633975982666016, -6.3502373695373535, -6.066498756408691, -5.782759666442871, -5.499020576477051, -5.215281963348389, -4.931543350219727, -4.647804260253906, -4.364065170288086, -4.080326557159424, -3.7965877056121826, -3.5128488540649414, -3.2291100025177, -2.945371150970459, -2.6616322994232178, -2.3778934478759766, -2.0941545963287354, -1.8104157447814941, -1.526676893234253, -1.2429380416870117, -0.9591991901397705, -0.6754603385925293, -0.3917214870452881, -0.10798168182373047, 0.17575716972351074, 0.45949602127075195, 0.7432348728179932, 1.0269737243652344, 1.3107125759124756, 1.5944514274597168, 1.878190279006958, 2.161929130554199, 2.4456679821014404, 2.7294068336486816, 3.013145685195923, 3.296884536743164, 3.5806233882904053, 3.8643622398376465, 4.148100852966309, 4.431839942932129, 4.715579032897949, 4.999317646026611, 5.283056259155273, 5.566795349121094, 5.850534439086914, 6.134273052215576, 6.418011665344238, 6.701750755310059, 6.985489845275879, 7.269228458404541, 7.552967071533203, 7.836706161499023, 8.120445251464844, 8.404184341430664, 8.687922477722168, 8.971661567687988]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 7.0, 12.0, 14.0, 27.0, 14.0, 38.0, 36.0, 39.0, 48.0, 46.0, 59.0, 57.0, 62.0, 75.0, 74.0, 68.0, 62.0, 42.0, 39.0, 32.0, 31.0, 29.0, 24.0, 22.0, 8.0, 14.0, 7.0, 5.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.08984375, -2.0339508056640625, -1.978057861328125, -1.9221649169921875, -1.86627197265625, -1.8103790283203125, -1.754486083984375, -1.6985931396484375, -1.6427001953125, -1.5868072509765625, -1.530914306640625, -1.4750213623046875, -1.41912841796875, -1.3632354736328125, -1.307342529296875, -1.2514495849609375, -1.195556640625, -1.1396636962890625, -1.083770751953125, -1.0278778076171875, -0.97198486328125, -0.9160919189453125, -0.860198974609375, -0.8043060302734375, -0.7484130859375, -0.6925201416015625, -0.636627197265625, -0.5807342529296875, -0.52484130859375, -0.4689483642578125, -0.413055419921875, -0.3571624755859375, -0.30126953125, -0.2453765869140625, -0.189483642578125, -0.1335906982421875, -0.07769775390625, -0.0218048095703125, 0.034088134765625, 0.0899810791015625, 0.1458740234375, 0.2017669677734375, 0.257659912109375, 0.3135528564453125, 0.36944580078125, 0.4253387451171875, 0.481231689453125, 0.5371246337890625, 0.593017578125, 0.6489105224609375, 0.704803466796875, 0.7606964111328125, 0.81658935546875, 0.8724822998046875, 0.928375244140625, 0.9842681884765625, 1.0401611328125, 1.0960540771484375, 1.151947021484375, 1.2078399658203125, 1.26373291015625, 1.3196258544921875, 1.375518798828125, 1.4314117431640625, 1.4873046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 3.0, 6.0, 11.0, 15.0, 15.0, 36.0, 36.0, 64.0, 87.0, 154.0, 264.0, 438.0, 718.0, 1299.0, 2248.0, 4107.0, 7536.0, 13287.0, 24447.0, 43571.0, 73575.0, 114728.0, 155522.0, 174763.0, 153221.0, 112237.0, 71395.0, 42030.0, 23483.0, 13017.0, 7115.0, 3940.0, 2085.0, 1284.0, 744.0, 413.0, 237.0, 179.0, 76.0, 47.0, 48.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.939453125, -0.9095993041992188, -0.8797454833984375, -0.8498916625976562, -0.820037841796875, -0.7901840209960938, -0.7603302001953125, -0.7304763793945312, -0.70062255859375, -0.6707687377929688, -0.6409149169921875, -0.6110610961914062, -0.581207275390625, -0.5513534545898438, -0.5214996337890625, -0.49164581298828125, -0.4617919921875, -0.43193817138671875, -0.4020843505859375, -0.37223052978515625, -0.342376708984375, -0.31252288818359375, -0.2826690673828125, -0.25281524658203125, -0.22296142578125, -0.19310760498046875, -0.1632537841796875, -0.13339996337890625, -0.103546142578125, -0.07369232177734375, -0.0438385009765625, -0.01398468017578125, 0.015869140625, 0.04572296142578125, 0.0755767822265625, 0.10543060302734375, 0.135284423828125, 0.16513824462890625, 0.1949920654296875, 0.22484588623046875, 0.25469970703125, 0.28455352783203125, 0.3144073486328125, 0.34426116943359375, 0.374114990234375, 0.40396881103515625, 0.4338226318359375, 0.46367645263671875, 0.4935302734375, 0.5233840942382812, 0.5532379150390625, 0.5830917358398438, 0.612945556640625, 0.6427993774414062, 0.6726531982421875, 0.7025070190429688, 0.73236083984375, 0.7622146606445312, 0.7920684814453125, 0.8219223022460938, 0.851776123046875, 0.8816299438476562, 0.9114837646484375, 0.9413375854492188, 0.97119140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 8.0, 11.0, 8.0, 11.0, 18.0, 28.0, 25.0, 44.0, 28.0, 39.0, 43.0, 35.0, 43.0, 44.0, 46.0, 1065.0, 53.0, 39.0, 58.0, 41.0, 40.0, 35.0, 41.0, 25.0, 25.0, 30.0, 22.0, 14.0, 23.0, 13.0, 11.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4771270751953125, -1.435699462890625, -1.3942718505859375, -1.35284423828125, -1.3114166259765625, -1.269989013671875, -1.2285614013671875, -1.1871337890625, -1.1457061767578125, -1.104278564453125, -1.0628509521484375, -1.02142333984375, -0.9799957275390625, -0.938568115234375, -0.8971405029296875, -0.855712890625, -0.8142852783203125, -0.772857666015625, -0.7314300537109375, -0.69000244140625, -0.6485748291015625, -0.607147216796875, -0.5657196044921875, -0.5242919921875, -0.4828643798828125, -0.441436767578125, -0.4000091552734375, -0.35858154296875, -0.3171539306640625, -0.275726318359375, -0.2342987060546875, -0.19287109375, -0.1514434814453125, -0.110015869140625, -0.0685882568359375, -0.02716064453125, 0.0142669677734375, 0.055694580078125, 0.0971221923828125, 0.1385498046875, 0.1799774169921875, 0.221405029296875, 0.2628326416015625, 0.30426025390625, 0.3456878662109375, 0.387115478515625, 0.4285430908203125, 0.469970703125, 0.5113983154296875, 0.552825927734375, 0.5942535400390625, 0.63568115234375, 0.6771087646484375, 0.718536376953125, 0.7599639892578125, 0.8013916015625, 0.8428192138671875, 0.884246826171875, 0.9256744384765625, 0.96710205078125, 1.0085296630859375, 1.049957275390625, 1.0913848876953125, 1.1328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 13.0, 11.0, 20.0, 29.0, 40.0, 49.0, 64.0, 120.0, 154.0, 251.0, 310.0, 431.0, 666.0, 887.0, 1275.0, 1878.0, 2652.0, 3862.0, 5764.0, 8390.0, 12789.0, 20996.0, 42141.0, 159470.0, 1458562.0, 255442.0, 53562.0, 23845.0, 14327.0, 9197.0, 6277.0, 4165.0, 2828.0, 1961.0, 1450.0, 932.0, 647.0, 497.0, 338.0, 245.0, 180.0, 116.0, 87.0, 64.0, 32.0, 36.0, 21.0, 11.0, 13.0, 17.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.93408203125, -0.904541015625, -0.875, -0.845458984375, -0.81591796875, -0.786376953125, -0.7568359375, -0.727294921875, -0.69775390625, -0.668212890625, -0.638671875, -0.609130859375, -0.57958984375, -0.550048828125, -0.5205078125, -0.490966796875, -0.46142578125, -0.431884765625, -0.40234375, -0.372802734375, -0.34326171875, -0.313720703125, -0.2841796875, -0.254638671875, -0.22509765625, -0.195556640625, -0.166015625, -0.136474609375, -0.10693359375, -0.077392578125, -0.0478515625, -0.018310546875, 0.01123046875, 0.040771484375, 0.0703125, 0.099853515625, 0.12939453125, 0.158935546875, 0.1884765625, 0.218017578125, 0.24755859375, 0.277099609375, 0.306640625, 0.336181640625, 0.36572265625, 0.395263671875, 0.4248046875, 0.454345703125, 0.48388671875, 0.513427734375, 0.54296875, 0.572509765625, 0.60205078125, 0.631591796875, 0.6611328125, 0.690673828125, 0.72021484375, 0.749755859375, 0.779296875, 0.808837890625, 0.83837890625, 0.867919921875, 0.8974609375, 0.927001953125, 0.95654296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 9.0, 5.0, 3.0, 10.0, 20.0, 24.0, 35.0, 39.0, 61.0, 79.0, 82.0, 115.0, 118.0, 111.0, 72.0, 48.0, 45.0, 32.0, 20.0, 19.0, 9.0, 7.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2119140625, -0.20529937744140625, -0.1986846923828125, -0.19207000732421875, -0.185455322265625, -0.17884063720703125, -0.1722259521484375, -0.16561126708984375, -0.15899658203125, -0.15238189697265625, -0.1457672119140625, -0.13915252685546875, -0.132537841796875, -0.12592315673828125, -0.1193084716796875, -0.11269378662109375, -0.1060791015625, -0.09946441650390625, -0.0928497314453125, -0.08623504638671875, -0.079620361328125, -0.07300567626953125, -0.0663909912109375, -0.05977630615234375, -0.05316162109375, -0.04654693603515625, -0.0399322509765625, -0.03331756591796875, -0.026702880859375, -0.02008819580078125, -0.0134735107421875, -0.00685882568359375, -0.000244140625, 0.00637054443359375, 0.0129852294921875, 0.01959991455078125, 0.026214599609375, 0.03282928466796875, 0.0394439697265625, 0.04605865478515625, 0.05267333984375, 0.05928802490234375, 0.0659027099609375, 0.07251739501953125, 0.079132080078125, 0.08574676513671875, 0.0923614501953125, 0.09897613525390625, 0.1055908203125, 0.11220550537109375, 0.1188201904296875, 0.12543487548828125, 0.132049560546875, 0.13866424560546875, 0.1452789306640625, 0.15189361572265625, 0.15850830078125, 0.16512298583984375, 0.1717376708984375, 0.17835235595703125, 0.184967041015625, 0.19158172607421875, 0.1981964111328125, 0.20481109619140625, 0.21142578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 6.0, 7.0, 8.0, 8.0, 15.0, 17.0, 24.0, 42.0, 96.0, 192.0, 572.0, 2126.0, 11882.0, 822747.0, 201999.0, 6593.0, 1438.0, 430.0, 137.0, 76.0, 44.0, 22.0, 21.0, 14.0, 8.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.021240234375, -2.92333984375, -2.825439453125, -2.7275390625, -2.629638671875, -2.53173828125, -2.433837890625, -2.3359375, -2.238037109375, -2.14013671875, -2.042236328125, -1.9443359375, -1.846435546875, -1.74853515625, -1.650634765625, -1.552734375, -1.454833984375, -1.35693359375, -1.259033203125, -1.1611328125, -1.063232421875, -0.96533203125, -0.867431640625, -0.76953125, -0.671630859375, -0.57373046875, -0.475830078125, -0.3779296875, -0.280029296875, -0.18212890625, -0.084228515625, 0.013671875, 0.111572265625, 0.20947265625, 0.307373046875, 0.4052734375, 0.503173828125, 0.60107421875, 0.698974609375, 0.796875, 0.894775390625, 0.99267578125, 1.090576171875, 1.1884765625, 1.286376953125, 1.38427734375, 1.482177734375, 1.580078125, 1.677978515625, 1.77587890625, 1.873779296875, 1.9716796875, 2.069580078125, 2.16748046875, 2.265380859375, 2.36328125, 2.461181640625, 2.55908203125, 2.656982421875, 2.7548828125, 2.852783203125, 2.95068359375, 3.048583984375, 3.146484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 28.0, 58.0, 100.0, 192.0, 269.0, 164.0, 87.0, 46.0, 20.0, 9.0, 6.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.608473539352417, -2.5345613956451416, -2.4606494903564453, -2.38673734664917, -2.3128254413604736, -2.2389132976531982, -2.165001392364502, -2.0910892486572266, -2.017177104949951, -1.9432650804519653, -1.8693530559539795, -1.7954410314559937, -1.7215290069580078, -1.6476168632507324, -1.5737048387527466, -1.4997928142547607, -1.4258809089660645, -1.3519688844680786, -1.2780568599700928, -1.204144835472107, -1.130232810974121, -1.0563206672668457, -0.9824086427688599, -0.908496618270874, -0.8345845937728882, -0.7606725692749023, -0.6867605447769165, -0.6128484606742859, -0.5389364361763, -0.4650244116783142, -0.391112357378006, -0.31720030307769775, -0.24328827857971191, -0.16937623918056488, -0.09546419978141785, -0.021552160382270813, 0.05235987901687622, 0.12627190351486206, 0.2001839578151703, 0.2740960121154785, 0.34800803661346436, 0.4219200611114502, 0.4958321154117584, 0.5697441697120667, 0.6436561942100525, 0.7175682187080383, 0.791480302810669, 0.8653923273086548, 0.9393043518066406, 1.0132163763046265, 1.0871284008026123, 1.1610404253005981, 1.234952449798584, 1.3088645935058594, 1.3827766180038452, 1.456688642501831, 1.530600666999817, 1.6045126914978027, 1.6784247159957886, 1.7523367404937744, 1.8262488842010498, 1.900160789489746, 1.9740729331970215, 2.047985076904297, 2.121896982192993]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 14.0, 9.0, 17.0, 25.0, 34.0, 41.0, 54.0, 43.0, 37.0, 50.0, 53.0, 50.0, 65.0, 53.0, 65.0, 56.0, 48.0, 45.0, 31.0, 32.0, 32.0, 21.0, 23.0, 22.0, 11.0, 15.0, 3.0, 13.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8811373114585876, -0.8552358150482178, -0.8293343186378479, -0.803432822227478, -0.7775313854217529, -0.7516298890113831, -0.7257283926010132, -0.6998268961906433, -0.6739253997802734, -0.6480239033699036, -0.6221224069595337, -0.5962209701538086, -0.5703194737434387, -0.5444179773330688, -0.518516480922699, -0.4926149845123291, -0.466713547706604, -0.44081205129623413, -0.41491058468818665, -0.3890090882778168, -0.3631076216697693, -0.3372061252593994, -0.31130462884902954, -0.28540313243865967, -0.2595016658306122, -0.2336001843214035, -0.20769870281219482, -0.18179720640182495, -0.15589572489261627, -0.1299942433834076, -0.10409274697303772, -0.07819126546382904, -0.05228978395462036, -0.026388298720121384, -0.000486813485622406, 0.02541467547416687, 0.05131615698337555, 0.07721763849258423, 0.1031191349029541, 0.12902061641216278, 0.15492209792137146, 0.18082357943058014, 0.20672506093978882, 0.2326265573501587, 0.25852805376052856, 0.28442952036857605, 0.3103310167789459, 0.3362324833869934, 0.3621339797973633, 0.38803547620773315, 0.41393694281578064, 0.4398384392261505, 0.465739905834198, 0.49164140224456787, 0.5175428986549377, 0.5434443950653076, 0.5693458318710327, 0.5952473282814026, 0.6211488246917725, 0.6470502614974976, 0.6729517579078674, 0.6988532543182373, 0.7247547507286072, 0.750656247138977, 0.7765577435493469]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 13.0, 13.0, 20.0, 28.0, 36.0, 37.0, 49.0, 46.0, 43.0, 45.0, 66.0, 56.0, 74.0, 76.0, 62.0, 51.0, 56.0, 35.0, 34.0, 24.0, 35.0, 18.0, 18.0, 17.0, 16.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.06640625, -2.012451171875, -1.95849609375, -1.904541015625, -1.8505859375, -1.796630859375, -1.74267578125, -1.688720703125, -1.634765625, -1.580810546875, -1.52685546875, -1.472900390625, -1.4189453125, -1.364990234375, -1.31103515625, -1.257080078125, -1.203125, -1.149169921875, -1.09521484375, -1.041259765625, -0.9873046875, -0.933349609375, -0.87939453125, -0.825439453125, -0.771484375, -0.717529296875, -0.66357421875, -0.609619140625, -0.5556640625, -0.501708984375, -0.44775390625, -0.393798828125, -0.33984375, -0.285888671875, -0.23193359375, -0.177978515625, -0.1240234375, -0.070068359375, -0.01611328125, 0.037841796875, 0.091796875, 0.145751953125, 0.19970703125, 0.253662109375, 0.3076171875, 0.361572265625, 0.41552734375, 0.469482421875, 0.5234375, 0.577392578125, 0.63134765625, 0.685302734375, 0.7392578125, 0.793212890625, 0.84716796875, 0.901123046875, 0.955078125, 1.009033203125, 1.06298828125, 1.116943359375, 1.1708984375, 1.224853515625, 1.27880859375, 1.332763671875, 1.38671875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 12.0, 14.0, 26.0, 29.0, 59.0, 100.0, 170.0, 297.0, 531.0, 1092.0, 2199.0, 5277.0, 13608.0, 40056.0, 142718.0, 498398.0, 246286.0, 64039.0, 20199.0, 7354.0, 3096.0, 1410.0, 697.0, 360.0, 222.0, 126.0, 70.0, 41.0, 21.0, 16.0, 11.0, 7.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.052276611328125, -1.98541259765625, -1.918548583984375, -1.8516845703125, -1.784820556640625, -1.71795654296875, -1.651092529296875, -1.584228515625, -1.517364501953125, -1.45050048828125, -1.383636474609375, -1.3167724609375, -1.249908447265625, -1.18304443359375, -1.116180419921875, -1.04931640625, -0.982452392578125, -0.91558837890625, -0.848724365234375, -0.7818603515625, -0.714996337890625, -0.64813232421875, -0.581268310546875, -0.514404296875, -0.447540283203125, -0.38067626953125, -0.313812255859375, -0.2469482421875, -0.180084228515625, -0.11322021484375, -0.046356201171875, 0.0205078125, 0.087371826171875, 0.15423583984375, 0.221099853515625, 0.2879638671875, 0.354827880859375, 0.42169189453125, 0.488555908203125, 0.555419921875, 0.622283935546875, 0.68914794921875, 0.756011962890625, 0.8228759765625, 0.889739990234375, 0.95660400390625, 1.023468017578125, 1.09033203125, 1.157196044921875, 1.22406005859375, 1.290924072265625, 1.3577880859375, 1.424652099609375, 1.49151611328125, 1.558380126953125, 1.625244140625, 1.692108154296875, 1.75897216796875, 1.825836181640625, 1.8927001953125, 1.959564208984375, 2.02642822265625, 2.093292236328125, 2.16015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 12.0, 10.0, 11.0, 13.0, 13.0, 22.0, 23.0, 31.0, 36.0, 35.0, 38.0, 39.0, 51.0, 60.0, 85.0, 111.0, 204.0, 1449.0, 216.0, 110.0, 70.0, 87.0, 56.0, 27.0, 39.0, 30.0, 26.0, 26.0, 28.0, 18.0, 17.0, 12.0, 7.0, 2.0, 3.0, 4.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.310791015625, -4.16455078125, -4.018310546875, -3.8720703125, -3.725830078125, -3.57958984375, -3.433349609375, -3.287109375, -3.140869140625, -2.99462890625, -2.848388671875, -2.7021484375, -2.555908203125, -2.40966796875, -2.263427734375, -2.1171875, -1.970947265625, -1.82470703125, -1.678466796875, -1.5322265625, -1.385986328125, -1.23974609375, -1.093505859375, -0.947265625, -0.801025390625, -0.65478515625, -0.508544921875, -0.3623046875, -0.216064453125, -0.06982421875, 0.076416015625, 0.22265625, 0.368896484375, 0.51513671875, 0.661376953125, 0.8076171875, 0.953857421875, 1.10009765625, 1.246337890625, 1.392578125, 1.538818359375, 1.68505859375, 1.831298828125, 1.9775390625, 2.123779296875, 2.27001953125, 2.416259765625, 2.5625, 2.708740234375, 2.85498046875, 3.001220703125, 3.1474609375, 3.293701171875, 3.43994140625, 3.586181640625, 3.732421875, 3.878662109375, 4.02490234375, 4.171142578125, 4.3173828125, 4.463623046875, 4.60986328125, 4.756103515625, 4.90234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 19.0, 24.0, 27.0, 42.0, 100.0, 120.0, 199.0, 354.0, 865.0, 2773.0, 26514.0, 2829568.0, 275007.0, 7227.0, 1539.0, 524.0, 280.0, 190.0, 109.0, 62.0, 36.0, 36.0, 23.0, 13.0, 10.0, 13.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.318603515625, -10.97314453125, -10.627685546875, -10.2822265625, -9.936767578125, -9.59130859375, -9.245849609375, -8.900390625, -8.554931640625, -8.20947265625, -7.864013671875, -7.5185546875, -7.173095703125, -6.82763671875, -6.482177734375, -6.13671875, -5.791259765625, -5.44580078125, -5.100341796875, -4.7548828125, -4.409423828125, -4.06396484375, -3.718505859375, -3.373046875, -3.027587890625, -2.68212890625, -2.336669921875, -1.9912109375, -1.645751953125, -1.30029296875, -0.954833984375, -0.609375, -0.263916015625, 0.08154296875, 0.427001953125, 0.7724609375, 1.117919921875, 1.46337890625, 1.808837890625, 2.154296875, 2.499755859375, 2.84521484375, 3.190673828125, 3.5361328125, 3.881591796875, 4.22705078125, 4.572509765625, 4.91796875, 5.263427734375, 5.60888671875, 5.954345703125, 6.2998046875, 6.645263671875, 6.99072265625, 7.336181640625, 7.681640625, 8.027099609375, 8.37255859375, 8.718017578125, 9.0634765625, 9.408935546875, 9.75439453125, 10.099853515625, 10.4453125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 147.0, 748.0, 112.0, 5.0, 2.0, 0.0, 2.0], "bins": [-133.59580993652344, -131.31063842773438, -129.02548217773438, -126.74031066894531, -124.45513916015625, -122.16997528076172, -119.88480377197266, -117.59963989257812, -115.31446838378906, -113.02930450439453, -110.74413299560547, -108.45896911621094, -106.17379760742188, -103.88863372802734, -101.60346221923828, -99.31829833984375, -97.03312683105469, -94.74796295166016, -92.4627914428711, -90.17762756347656, -87.8924560546875, -85.60729217529297, -83.3221206665039, -81.03695678710938, -78.75179290771484, -76.46662902832031, -74.18145751953125, -71.89629364013672, -69.61112213134766, -67.32595825195312, -65.04078674316406, -62.75562286376953, -60.4704475402832, -58.185279846191406, -55.90011215209961, -53.61494445800781, -51.329776763916016, -49.04460906982422, -46.75944519042969, -44.474273681640625, -42.189109802246094, -39.9039421081543, -37.6187744140625, -35.3336067199707, -33.048439025878906, -30.76327133178711, -28.478105545043945, -26.19293785095215, -23.90776824951172, -21.622600555419922, -19.337432861328125, -17.052265167236328, -14.767098426818848, -12.48193073272705, -10.19676399230957, -7.911596298217773, -5.626428604125977, -3.341261148452759, -1.056093692779541, 1.2290735244750977, 3.5142412185668945, 5.799408912658691, 8.084575653076172, 10.369743347167969, 12.654911041259766]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 9.0, 2.0, 11.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 21.0, 20.0, 20.0, 28.0, 39.0, 27.0, 31.0, 33.0, 23.0, 47.0, 28.0, 36.0, 36.0, 30.0, 39.0, 32.0, 41.0, 29.0, 29.0, 56.0, 33.0, 21.0, 27.0, 26.0, 18.0, 19.0, 17.0, 14.0, 23.0, 13.0, 9.0, 4.0, 10.0, 8.0, 6.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21320915222168, -9.859966278076172, -9.50672435760498, -9.153481483459473, -8.800239562988281, -8.446996688842773, -8.093753814697266, -7.740511894226074, -7.387269020080566, -7.034026622772217, -6.680784225463867, -6.327541351318359, -5.97429895401001, -5.62105655670166, -5.2678141593933105, -4.914571762084961, -4.561329364776611, -4.208086967468262, -3.854844331741333, -3.5016019344329834, -3.1483592987060547, -2.795116901397705, -2.4418745040893555, -2.0886318683624268, -1.7353894710540771, -1.382146954536438, -1.0289044380187988, -0.6756620407104492, -0.32241952419281006, 0.0308229923248291, 0.3840653896331787, 0.7373080253601074, 1.090550422668457, 1.4437929391860962, 1.7970354557037354, 2.150277853012085, 2.5035204887390137, 2.8567628860473633, 3.210005283355713, 3.5632479190826416, 3.916490316390991, 4.26973295211792, 4.6229753494262695, 4.976217746734619, 5.329460144042969, 5.682703018188477, 6.035944938659668, 6.389187812805176, 6.742430210113525, 7.095672607421875, 7.448915004730225, 7.802157402038574, 8.155400276184082, 8.508642196655273, 8.861885070800781, 9.215127944946289, 9.56836986541748, 9.921612739562988, 10.27485466003418, 10.628097534179688, 10.981339454650879, 11.334582328796387, 11.687824249267578, 12.041067123413086, 12.394309997558594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 6.0, 6.0, 15.0, 17.0, 18.0, 25.0, 38.0, 36.0, 36.0, 39.0, 62.0, 57.0, 71.0, 70.0, 57.0, 67.0, 64.0, 53.0, 51.0, 47.0, 39.0, 23.0, 30.0, 21.0, 15.0, 11.0, 7.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0407257080078125, -1.983795166015625, -1.9268646240234375, -1.86993408203125, -1.8130035400390625, -1.756072998046875, -1.6991424560546875, -1.6422119140625, -1.5852813720703125, -1.528350830078125, -1.4714202880859375, -1.41448974609375, -1.3575592041015625, -1.300628662109375, -1.2436981201171875, -1.186767578125, -1.1298370361328125, -1.072906494140625, -1.0159759521484375, -0.95904541015625, -0.9021148681640625, -0.845184326171875, -0.7882537841796875, -0.7313232421875, -0.6743927001953125, -0.617462158203125, -0.5605316162109375, -0.50360107421875, -0.4466705322265625, -0.389739990234375, -0.3328094482421875, -0.27587890625, -0.2189483642578125, -0.162017822265625, -0.1050872802734375, -0.04815673828125, 0.0087738037109375, 0.065704345703125, 0.1226348876953125, 0.1795654296875, 0.2364959716796875, 0.293426513671875, 0.3503570556640625, 0.40728759765625, 0.4642181396484375, 0.521148681640625, 0.5780792236328125, 0.635009765625, 0.6919403076171875, 0.748870849609375, 0.8058013916015625, 0.86273193359375, 0.9196624755859375, 0.976593017578125, 1.0335235595703125, 1.0904541015625, 1.1473846435546875, 1.204315185546875, 1.2612457275390625, 1.31817626953125, 1.3751068115234375, 1.432037353515625, 1.4889678955078125, 1.5458984375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 12.0, 13.0, 24.0, 27.0, 31.0, 45.0, 77.0, 124.0, 185.0, 323.0, 544.0, 970.0, 1852.0, 3608.0, 7954.0, 19946.0, 66148.0, 439576.0, 2722782.0, 788509.0, 95233.0, 27063.0, 10002.0, 4473.0, 2143.0, 1136.0, 640.0, 314.0, 196.0, 112.0, 76.0, 45.0, 30.0, 21.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.18359375, -4.08306884765625, -3.9825439453125, -3.88201904296875, -3.781494140625, -3.68096923828125, -3.5804443359375, -3.47991943359375, -3.37939453125, -3.27886962890625, -3.1783447265625, -3.07781982421875, -2.977294921875, -2.87677001953125, -2.7762451171875, -2.67572021484375, -2.5751953125, -2.47467041015625, -2.3741455078125, -2.27362060546875, -2.173095703125, -2.07257080078125, -1.9720458984375, -1.87152099609375, -1.77099609375, -1.67047119140625, -1.5699462890625, -1.46942138671875, -1.368896484375, -1.26837158203125, -1.1678466796875, -1.06732177734375, -0.966796875, -0.86627197265625, -0.7657470703125, -0.66522216796875, -0.564697265625, -0.46417236328125, -0.3636474609375, -0.26312255859375, -0.16259765625, -0.06207275390625, 0.0384521484375, 0.13897705078125, 0.239501953125, 0.34002685546875, 0.4405517578125, 0.54107666015625, 0.6416015625, 0.74212646484375, 0.8426513671875, 0.94317626953125, 1.043701171875, 1.14422607421875, 1.2447509765625, 1.34527587890625, 1.44580078125, 1.54632568359375, 1.6468505859375, 1.74737548828125, 1.847900390625, 1.94842529296875, 2.0489501953125, 2.14947509765625, 2.25]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 11.0, 14.0, 16.0, 18.0, 28.0, 40.0, 54.0, 80.0, 94.0, 176.0, 208.0, 309.0, 459.0, 555.0, 584.0, 428.0, 253.0, 209.0, 140.0, 102.0, 68.0, 53.0, 42.0, 34.0, 16.0, 12.0, 12.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.595001220703125, -2.49859619140625, -2.402191162109375, -2.3057861328125, -2.209381103515625, -2.11297607421875, -2.016571044921875, -1.920166015625, -1.823760986328125, -1.72735595703125, -1.630950927734375, -1.5345458984375, -1.438140869140625, -1.34173583984375, -1.245330810546875, -1.14892578125, -1.052520751953125, -0.95611572265625, -0.859710693359375, -0.7633056640625, -0.666900634765625, -0.57049560546875, -0.474090576171875, -0.377685546875, -0.281280517578125, -0.18487548828125, -0.088470458984375, 0.0079345703125, 0.104339599609375, 0.20074462890625, 0.297149658203125, 0.3935546875, 0.489959716796875, 0.58636474609375, 0.682769775390625, 0.7791748046875, 0.875579833984375, 0.97198486328125, 1.068389892578125, 1.164794921875, 1.261199951171875, 1.35760498046875, 1.454010009765625, 1.5504150390625, 1.646820068359375, 1.74322509765625, 1.839630126953125, 1.93603515625, 2.032440185546875, 2.12884521484375, 2.225250244140625, 2.3216552734375, 2.418060302734375, 2.51446533203125, 2.610870361328125, 2.707275390625, 2.803680419921875, 2.90008544921875, 2.996490478515625, 3.0928955078125, 3.189300537109375, 3.28570556640625, 3.382110595703125, 3.478515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 4.0, 12.0, 20.0, 31.0, 57.0, 74.0, 118.0, 236.0, 452.0, 985.0, 2209.0, 5658.0, 16059.0, 53341.0, 270262.0, 2631415.0, 1041641.0, 123812.0, 30978.0, 10156.0, 3672.0, 1549.0, 754.0, 330.0, 187.0, 96.0, 48.0, 35.0, 22.0, 13.0, 12.0, 3.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.67578125, -5.521484375, -5.3671875, -5.212890625, -5.05859375, -4.904296875, -4.75, -4.595703125, -4.44140625, -4.287109375, -4.1328125, -3.978515625, -3.82421875, -3.669921875, -3.515625, -3.361328125, -3.20703125, -3.052734375, -2.8984375, -2.744140625, -2.58984375, -2.435546875, -2.28125, -2.126953125, -1.97265625, -1.818359375, -1.6640625, -1.509765625, -1.35546875, -1.201171875, -1.046875, -0.892578125, -0.73828125, -0.583984375, -0.4296875, -0.275390625, -0.12109375, 0.033203125, 0.1875, 0.341796875, 0.49609375, 0.650390625, 0.8046875, 0.958984375, 1.11328125, 1.267578125, 1.421875, 1.576171875, 1.73046875, 1.884765625, 2.0390625, 2.193359375, 2.34765625, 2.501953125, 2.65625, 2.810546875, 2.96484375, 3.119140625, 3.2734375, 3.427734375, 3.58203125, 3.736328125, 3.890625, 4.044921875, 4.19921875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 7.0, 3.0, 7.0, 19.0, 19.0, 21.0, 37.0, 44.0, 46.0, 62.0, 83.0, 83.0, 89.0, 92.0, 55.0, 76.0, 60.0, 56.0, 32.0, 30.0, 21.0, 14.0, 16.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.79543685913086, -9.430390357971191, -9.065343856811523, -8.700298309326172, -8.335251808166504, -7.970205307006836, -7.605158805847168, -7.2401123046875, -6.87506628036499, -6.510019779205322, -6.1449737548828125, -5.7799272537231445, -5.414880752563477, -5.049834728240967, -4.684788227081299, -4.319742202758789, -3.954695701599121, -3.5896494388580322, -3.2246031761169434, -2.8595566749572754, -2.4945104122161865, -2.1294641494750977, -1.7644176483154297, -1.3993713855743408, -1.034325122833252, -0.6692788004875183, -0.30423247814178467, 0.06081390380859375, 0.4258601665496826, 0.7909064292907715, 1.1559529304504395, 1.5209991931915283, 1.8860445022583008, 2.2510907649993896, 2.6161370277404785, 2.9811835289001465, 3.3462297916412354, 3.711276054382324, 4.076322555541992, 4.44136905670166, 4.80641508102417, 5.171461582183838, 5.536507606506348, 5.901554107666016, 6.266600608825684, 6.631646633148193, 6.996693134307861, 7.361739158630371, 7.726785659790039, 8.091832160949707, 8.456878662109375, 8.821924209594727, 9.186970710754395, 9.552017211914062, 9.91706371307373, 10.282110214233398, 10.64715576171875, 11.012202262878418, 11.377248764038086, 11.742294311523438, 12.107340812683105, 12.472387313842773, 12.837433815002441, 13.20248031616211, 13.567526817321777]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 5.0, 12.0, 14.0, 24.0, 19.0, 21.0, 24.0, 25.0, 24.0, 27.0, 33.0, 31.0, 38.0, 22.0, 47.0, 42.0, 43.0, 33.0, 37.0, 39.0, 40.0, 34.0, 45.0, 28.0, 35.0, 38.0, 34.0, 29.0, 15.0, 19.0, 18.0, 12.0, 18.0, 18.0, 6.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.779570579528809, -8.490565299987793, -8.201559066772461, -7.912553787231445, -7.62354850769043, -7.334542751312256, -7.045536994934082, -6.756531715393066, -6.467525959014893, -6.178520202636719, -5.889514923095703, -5.600509166717529, -5.3115034103393555, -5.02249813079834, -4.733492374420166, -4.444486618041992, -4.155481338500977, -3.866475820541382, -3.577470302581787, -3.2884645462036133, -2.9994590282440186, -2.710453510284424, -2.42144775390625, -2.1324422359466553, -1.8434367179870605, -1.5544312000274658, -1.2654255628585815, -0.976419985294342, -0.6874144077301025, -0.3984088897705078, -0.10940325260162354, 0.17960238456726074, 0.46860694885253906, 0.7576125264167786, 1.046618103981018, 1.3356237411499023, 1.624629259109497, 1.9136347770690918, 2.2026405334472656, 2.4916460514068604, 2.780651569366455, 3.06965708732605, 3.3586626052856445, 3.6476683616638184, 3.936673879623413, 4.225679397583008, 4.514685153961182, 4.8036909103393555, 5.092696189880371, 5.381701946258545, 5.6707072257995605, 5.959712982177734, 6.24871826171875, 6.537724018096924, 6.826729774475098, 7.115735054016113, 7.404740810394287, 7.693746566772461, 7.982751846313477, 8.271757125854492, 8.560763359069824, 8.84976863861084, 9.138773918151855, 9.427780151367188, 9.716785430908203]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 16.0, 14.0, 19.0, 27.0, 28.0, 46.0, 47.0, 49.0, 59.0, 68.0, 58.0, 71.0, 66.0, 66.0, 61.0, 52.0, 52.0, 40.0, 31.0, 31.0, 32.0, 16.0, 11.0, 7.0, 11.0, 8.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.6070556640625, -2.546142578125, -2.4852294921875, -2.42431640625, -2.3634033203125, -2.302490234375, -2.2415771484375, -2.1806640625, -2.1197509765625, -2.058837890625, -1.9979248046875, -1.93701171875, -1.8760986328125, -1.815185546875, -1.7542724609375, -1.693359375, -1.6324462890625, -1.571533203125, -1.5106201171875, -1.44970703125, -1.3887939453125, -1.327880859375, -1.2669677734375, -1.2060546875, -1.1451416015625, -1.084228515625, -1.0233154296875, -0.96240234375, -0.9014892578125, -0.840576171875, -0.7796630859375, -0.71875, -0.6578369140625, -0.596923828125, -0.5360107421875, -0.47509765625, -0.4141845703125, -0.353271484375, -0.2923583984375, -0.2314453125, -0.1705322265625, -0.109619140625, -0.0487060546875, 0.01220703125, 0.0731201171875, 0.134033203125, 0.1949462890625, 0.255859375, 0.3167724609375, 0.377685546875, 0.4385986328125, 0.49951171875, 0.5604248046875, 0.621337890625, 0.6822509765625, 0.7431640625, 0.8040771484375, 0.864990234375, 0.9259033203125, 0.98681640625, 1.0477294921875, 1.108642578125, 1.1695556640625, 1.23046875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 3.0, 3.0, 9.0, 10.0, 31.0, 19.0, 26.0, 52.0, 90.0, 149.0, 293.0, 500.0, 917.0, 1769.0, 3591.0, 7182.0, 14368.0, 28092.0, 53690.0, 98080.0, 156681.0, 202403.0, 188521.0, 131079.0, 77468.0, 40825.0, 21101.0, 10578.0, 5326.0, 2665.0, 1393.0, 719.0, 392.0, 184.0, 126.0, 77.0, 44.0, 20.0, 26.0, 15.0, 9.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.1015625, -1.0669097900390625, -1.032257080078125, -0.9976043701171875, -0.96295166015625, -0.9282989501953125, -0.893646240234375, -0.8589935302734375, -0.8243408203125, -0.7896881103515625, -0.755035400390625, -0.7203826904296875, -0.68572998046875, -0.6510772705078125, -0.616424560546875, -0.5817718505859375, -0.547119140625, -0.5124664306640625, -0.477813720703125, -0.4431610107421875, -0.40850830078125, -0.3738555908203125, -0.339202880859375, -0.3045501708984375, -0.2698974609375, -0.2352447509765625, -0.200592041015625, -0.1659393310546875, -0.13128662109375, -0.0966339111328125, -0.061981201171875, -0.0273284912109375, 0.00732421875, 0.0419769287109375, 0.076629638671875, 0.1112823486328125, 0.14593505859375, 0.1805877685546875, 0.215240478515625, 0.2498931884765625, 0.2845458984375, 0.3191986083984375, 0.353851318359375, 0.3885040283203125, 0.42315673828125, 0.4578094482421875, 0.492462158203125, 0.5271148681640625, 0.561767578125, 0.5964202880859375, 0.631072998046875, 0.6657257080078125, 0.70037841796875, 0.7350311279296875, 0.769683837890625, 0.8043365478515625, 0.8389892578125, 0.8736419677734375, 0.908294677734375, 0.9429473876953125, 0.97760009765625, 1.0122528076171875, 1.046905517578125, 1.0815582275390625, 1.1162109375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 5.0, 11.0, 3.0, 6.0, 12.0, 12.0, 11.0, 12.0, 21.0, 21.0, 16.0, 19.0, 34.0, 23.0, 23.0, 28.0, 31.0, 28.0, 29.0, 32.0, 39.0, 38.0, 31.0, 1057.0, 25.0, 38.0, 42.0, 32.0, 38.0, 35.0, 27.0, 22.0, 31.0, 26.0, 24.0, 12.0, 19.0, 12.0, 22.0, 6.0, 14.0, 16.0, 5.0, 8.0, 15.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93310546875, -0.9011154174804688, -0.8691253662109375, -0.8371353149414062, -0.805145263671875, -0.7731552124023438, -0.7411651611328125, -0.7091751098632812, -0.67718505859375, -0.6451950073242188, -0.6132049560546875, -0.5812149047851562, -0.549224853515625, -0.5172348022460938, -0.4852447509765625, -0.45325469970703125, -0.4212646484375, -0.38927459716796875, -0.3572845458984375, -0.32529449462890625, -0.293304443359375, -0.26131439208984375, -0.2293243408203125, -0.19733428955078125, -0.16534423828125, -0.13335418701171875, -0.1013641357421875, -0.06937408447265625, -0.037384033203125, -0.00539398193359375, 0.0265960693359375, 0.05858612060546875, 0.090576171875, 0.12256622314453125, 0.1545562744140625, 0.18654632568359375, 0.218536376953125, 0.25052642822265625, 0.2825164794921875, 0.31450653076171875, 0.34649658203125, 0.37848663330078125, 0.4104766845703125, 0.44246673583984375, 0.474456787109375, 0.5064468383789062, 0.5384368896484375, 0.5704269409179688, 0.6024169921875, 0.6344070434570312, 0.6663970947265625, 0.6983871459960938, 0.730377197265625, 0.7623672485351562, 0.7943572998046875, 0.8263473510742188, 0.85833740234375, 0.8903274536132812, 0.9223175048828125, 0.9543075561523438, 0.986297607421875, 1.0182876586914062, 1.0502777099609375, 1.0822677612304688, 1.1142578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 11.0, 6.0, 25.0, 23.0, 55.0, 68.0, 106.0, 166.0, 271.0, 403.0, 576.0, 838.0, 1332.0, 1825.0, 2898.0, 4384.0, 6490.0, 10504.0, 16617.0, 30937.0, 86697.0, 958819.0, 814710.0, 83083.0, 30116.0, 16661.0, 10082.0, 6632.0, 4292.0, 2895.0, 1859.0, 1265.0, 855.0, 578.0, 362.0, 224.0, 149.0, 101.0, 72.0, 46.0, 29.0, 25.0, 20.0, 14.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.0018463134765625, -0.969512939453125, -0.9371795654296875, -0.90484619140625, -0.8725128173828125, -0.840179443359375, -0.8078460693359375, -0.7755126953125, -0.7431793212890625, -0.710845947265625, -0.6785125732421875, -0.64617919921875, -0.6138458251953125, -0.581512451171875, -0.5491790771484375, -0.516845703125, -0.4845123291015625, -0.452178955078125, -0.4198455810546875, -0.38751220703125, -0.3551788330078125, -0.322845458984375, -0.2905120849609375, -0.2581787109375, -0.2258453369140625, -0.193511962890625, -0.1611785888671875, -0.12884521484375, -0.0965118408203125, -0.064178466796875, -0.0318450927734375, 0.00048828125, 0.0328216552734375, 0.065155029296875, 0.0974884033203125, 0.12982177734375, 0.1621551513671875, 0.194488525390625, 0.2268218994140625, 0.2591552734375, 0.2914886474609375, 0.323822021484375, 0.3561553955078125, 0.38848876953125, 0.4208221435546875, 0.453155517578125, 0.4854888916015625, 0.517822265625, 0.5501556396484375, 0.582489013671875, 0.6148223876953125, 0.64715576171875, 0.6794891357421875, 0.711822509765625, 0.7441558837890625, 0.7764892578125, 0.8088226318359375, 0.841156005859375, 0.8734893798828125, 0.90582275390625, 0.9381561279296875, 0.970489501953125, 1.0028228759765625, 1.03515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 11.0, 10.0, 15.0, 16.0, 26.0, 29.0, 40.0, 42.0, 58.0, 79.0, 68.0, 93.0, 76.0, 100.0, 59.0, 46.0, 35.0, 24.0, 23.0, 17.0, 14.0, 18.0, 10.0, 8.0, 12.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1748046875, -0.16961288452148438, -0.16442108154296875, -0.15922927856445312, -0.1540374755859375, -0.14884567260742188, -0.14365386962890625, -0.13846206665039062, -0.133270263671875, -0.12807846069335938, -0.12288665771484375, -0.11769485473632812, -0.1125030517578125, -0.10731124877929688, -0.10211944580078125, -0.09692764282226562, -0.09173583984375, -0.08654403686523438, -0.08135223388671875, -0.07616043090820312, -0.0709686279296875, -0.06577682495117188, -0.06058502197265625, -0.055393218994140625, -0.050201416015625, -0.045009613037109375, -0.03981781005859375, -0.034626007080078125, -0.0294342041015625, -0.024242401123046875, -0.01905059814453125, -0.013858795166015625, -0.0086669921875, -0.003475189208984375, 0.00171661376953125, 0.006908416748046875, 0.0121002197265625, 0.017292022705078125, 0.02248382568359375, 0.027675628662109375, 0.032867431640625, 0.038059234619140625, 0.04325103759765625, 0.048442840576171875, 0.0536346435546875, 0.058826446533203125, 0.06401824951171875, 0.06921005249023438, 0.07440185546875, 0.07959365844726562, 0.08478546142578125, 0.08997726440429688, 0.0951690673828125, 0.10036087036132812, 0.10555267333984375, 0.11074447631835938, 0.115936279296875, 0.12112808227539062, 0.12631988525390625, 0.13151168823242188, 0.1367034912109375, 0.14189529418945312, 0.14708709716796875, 0.15227890014648438, 0.157470703125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 0.0, 8.0, 13.0, 14.0, 11.0, 25.0, 35.0, 33.0, 40.0, 88.0, 180.0, 448.0, 1640.0, 7888.0, 71737.0, 902857.0, 54519.0, 6687.0, 1460.0, 410.0, 159.0, 81.0, 56.0, 30.0, 33.0, 15.0, 16.0, 12.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.40234375, -2.323455810546875, -2.24456787109375, -2.165679931640625, -2.0867919921875, -2.007904052734375, -1.92901611328125, -1.850128173828125, -1.771240234375, -1.692352294921875, -1.61346435546875, -1.534576416015625, -1.4556884765625, -1.376800537109375, -1.29791259765625, -1.219024658203125, -1.14013671875, -1.061248779296875, -0.98236083984375, -0.903472900390625, -0.8245849609375, -0.745697021484375, -0.66680908203125, -0.587921142578125, -0.509033203125, -0.430145263671875, -0.35125732421875, -0.272369384765625, -0.1934814453125, -0.114593505859375, -0.03570556640625, 0.043182373046875, 0.1220703125, 0.200958251953125, 0.27984619140625, 0.358734130859375, 0.4376220703125, 0.516510009765625, 0.59539794921875, 0.674285888671875, 0.753173828125, 0.832061767578125, 0.91094970703125, 0.989837646484375, 1.0687255859375, 1.147613525390625, 1.22650146484375, 1.305389404296875, 1.38427734375, 1.463165283203125, 1.54205322265625, 1.620941162109375, 1.6998291015625, 1.778717041015625, 1.85760498046875, 1.936492919921875, 2.015380859375, 2.094268798828125, 2.17315673828125, 2.252044677734375, 2.3309326171875, 2.409820556640625, 2.48870849609375, 2.567596435546875, 2.646484375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 14.0, 12.0, 19.0, 31.0, 33.0, 45.0, 49.0, 77.0, 139.0, 164.0, 113.0, 84.0, 59.0, 39.0, 23.0, 24.0, 13.0, 12.0, 9.0, 4.0, 5.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3291393518447876, -1.2866466045379639, -1.2441538572311401, -1.2016611099243164, -1.1591684818267822, -1.1166757345199585, -1.0741829872131348, -1.031690239906311, -0.9891974925994873, -0.9467047452926636, -0.9042119979858398, -0.8617193102836609, -0.8192265629768372, -0.7767338156700134, -0.7342411279678345, -0.6917483806610107, -0.649255633354187, -0.6067628860473633, -0.5642701387405396, -0.5217774510383606, -0.47928470373153687, -0.43679195642471313, -0.3942992389202118, -0.35180652141571045, -0.3093137741088867, -0.266821026802063, -0.22432830929756165, -0.1818355768918991, -0.13934284448623657, -0.09685011208057404, -0.0543573796749115, -0.011864662170410156, 0.030628204345703125, 0.07312093675136566, 0.1156136691570282, 0.15810640156269073, 0.20059913396835327, 0.2430918663740158, 0.28558459877967834, 0.3280773162841797, 0.3705700635910034, 0.41306281089782715, 0.4555555284023285, 0.49804824590682983, 0.5405409932136536, 0.5830337405204773, 0.6255264282226562, 0.66801917552948, 0.7105119228363037, 0.7530046701431274, 0.7954974174499512, 0.8379901051521301, 0.8804828524589539, 0.9229755997657776, 0.9654682874679565, 1.0079610347747803, 1.050453782081604, 1.0929465293884277, 1.1354392766952515, 1.1779320240020752, 1.2204246520996094, 1.262917399406433, 1.3054101467132568, 1.3479028940200806, 1.3903956413269043]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 13.0, 13.0, 17.0, 21.0, 14.0, 34.0, 33.0, 44.0, 52.0, 41.0, 49.0, 55.0, 54.0, 48.0, 54.0, 48.0, 63.0, 66.0, 47.0, 33.0, 29.0, 34.0, 33.0, 22.0, 14.0, 13.0, 15.0, 11.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.3303589820861816, -1.2977761030197144, -1.265193223953247, -1.2326103448867798, -1.2000274658203125, -1.1674445867538452, -1.134861707687378, -1.102278709411621, -1.0696959495544434, -1.037113070487976, -1.0045301914215088, -0.9719473123550415, -0.9393644332885742, -0.9067815542221069, -0.8741986155509949, -0.8416157364845276, -0.8090327978134155, -0.7764499187469482, -0.743867039680481, -0.7112841606140137, -0.6787012815475464, -0.6461184024810791, -0.613535463809967, -0.5809525847434998, -0.5483697056770325, -0.5157868266105652, -0.4832039475440979, -0.4506210386753082, -0.41803815960884094, -0.38545528054237366, -0.352872371673584, -0.3202894926071167, -0.28770655393600464, -0.25512367486953735, -0.22254078090190887, -0.1899578869342804, -0.1573750078678131, -0.12479212880134583, -0.09220923483371735, -0.05962634086608887, -0.027043461799621582, 0.0055394247174263, 0.03812231123447418, 0.07070519775152206, 0.10328808426856995, 0.13587096333503723, 0.1684538573026657, 0.2010367512702942, 0.23361963033676147, 0.26620250940322876, 0.29878538846969604, 0.3313682973384857, 0.363951176404953, 0.3965340554714203, 0.42911696434020996, 0.46169984340667725, 0.49428272247314453, 0.5268656015396118, 0.5594484806060791, 0.5920313596725464, 0.6246142387390137, 0.657197117805481, 0.689780056476593, 0.7223629355430603, 0.7549458146095276]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 10.0, 11.0, 16.0, 15.0, 24.0, 35.0, 39.0, 38.0, 52.0, 63.0, 64.0, 83.0, 79.0, 59.0, 74.0, 57.0, 60.0, 46.0, 34.0, 41.0, 24.0, 26.0, 19.0, 8.0, 8.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.557098388671875, -2.49114990234375, -2.425201416015625, -2.3592529296875, -2.293304443359375, -2.22735595703125, -2.161407470703125, -2.095458984375, -2.029510498046875, -1.96356201171875, -1.897613525390625, -1.8316650390625, -1.765716552734375, -1.69976806640625, -1.633819580078125, -1.56787109375, -1.501922607421875, -1.43597412109375, -1.370025634765625, -1.3040771484375, -1.238128662109375, -1.17218017578125, -1.106231689453125, -1.040283203125, -0.974334716796875, -0.90838623046875, -0.842437744140625, -0.7764892578125, -0.710540771484375, -0.64459228515625, -0.578643798828125, -0.5126953125, -0.446746826171875, -0.38079833984375, -0.314849853515625, -0.2489013671875, -0.182952880859375, -0.11700439453125, -0.051055908203125, 0.014892578125, 0.080841064453125, 0.14678955078125, 0.212738037109375, 0.2786865234375, 0.344635009765625, 0.41058349609375, 0.476531982421875, 0.54248046875, 0.608428955078125, 0.67437744140625, 0.740325927734375, 0.8062744140625, 0.872222900390625, 0.93817138671875, 1.004119873046875, 1.070068359375, 1.136016845703125, 1.20196533203125, 1.267913818359375, 1.3338623046875, 1.399810791015625, 1.46575927734375, 1.531707763671875, 1.59765625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 24.0, 44.0, 83.0, 153.0, 302.0, 586.0, 1324.0, 2991.0, 7953.0, 25307.0, 93628.0, 430188.0, 370591.0, 80893.0, 22081.0, 7154.0, 2769.0, 1295.0, 565.0, 290.0, 142.0, 69.0, 36.0, 23.0, 9.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.424652099609375, -3.29266357421875, -3.160675048828125, -3.0286865234375, -2.896697998046875, -2.76470947265625, -2.632720947265625, -2.500732421875, -2.368743896484375, -2.23675537109375, -2.104766845703125, -1.9727783203125, -1.840789794921875, -1.70880126953125, -1.576812744140625, -1.44482421875, -1.312835693359375, -1.18084716796875, -1.048858642578125, -0.9168701171875, -0.784881591796875, -0.65289306640625, -0.520904541015625, -0.388916015625, -0.256927490234375, -0.12493896484375, 0.007049560546875, 0.1390380859375, 0.271026611328125, 0.40301513671875, 0.535003662109375, 0.6669921875, 0.798980712890625, 0.93096923828125, 1.062957763671875, 1.1949462890625, 1.326934814453125, 1.45892333984375, 1.590911865234375, 1.722900390625, 1.854888916015625, 1.98687744140625, 2.118865966796875, 2.2508544921875, 2.382843017578125, 2.51483154296875, 2.646820068359375, 2.77880859375, 2.910797119140625, 3.04278564453125, 3.174774169921875, 3.3067626953125, 3.438751220703125, 3.57073974609375, 3.702728271484375, 3.834716796875, 3.966705322265625, 4.09869384765625, 4.230682373046875, 4.3626708984375, 4.494659423828125, 4.62664794921875, 4.758636474609375, 4.890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 7.0, 14.0, 17.0, 17.0, 23.0, 26.0, 31.0, 39.0, 40.0, 59.0, 52.0, 96.0, 134.0, 199.0, 1308.0, 256.0, 166.0, 111.0, 78.0, 64.0, 48.0, 43.0, 34.0, 33.0, 22.0, 17.0, 19.0, 21.0, 16.0, 4.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.58837890625, -4.4345703125, -4.28076171875, -4.126953125, -3.97314453125, -3.8193359375, -3.66552734375, -3.51171875, -3.35791015625, -3.2041015625, -3.05029296875, -2.896484375, -2.74267578125, -2.5888671875, -2.43505859375, -2.28125, -2.12744140625, -1.9736328125, -1.81982421875, -1.666015625, -1.51220703125, -1.3583984375, -1.20458984375, -1.05078125, -0.89697265625, -0.7431640625, -0.58935546875, -0.435546875, -0.28173828125, -0.1279296875, 0.02587890625, 0.1796875, 0.33349609375, 0.4873046875, 0.64111328125, 0.794921875, 0.94873046875, 1.1025390625, 1.25634765625, 1.41015625, 1.56396484375, 1.7177734375, 1.87158203125, 2.025390625, 2.17919921875, 2.3330078125, 2.48681640625, 2.640625, 2.79443359375, 2.9482421875, 3.10205078125, 3.255859375, 3.40966796875, 3.5634765625, 3.71728515625, 3.87109375, 4.02490234375, 4.1787109375, 4.33251953125, 4.486328125, 4.64013671875, 4.7939453125, 4.94775390625, 5.1015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 4.0, 14.0, 18.0, 12.0, 16.0, 24.0, 35.0, 34.0, 54.0, 74.0, 99.0, 127.0, 230.0, 360.0, 670.0, 1558.0, 4066.0, 16232.0, 114621.0, 2133656.0, 803997.0, 54300.0, 9905.0, 2945.0, 1176.0, 540.0, 282.0, 162.0, 126.0, 73.0, 74.0, 44.0, 31.0, 26.0, 26.0, 23.0, 12.0, 12.0, 4.0, 7.0, 5.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.48046875, -7.2454833984375, -7.010498046875, -6.7755126953125, -6.54052734375, -6.3055419921875, -6.070556640625, -5.8355712890625, -5.6005859375, -5.3656005859375, -5.130615234375, -4.8956298828125, -4.66064453125, -4.4256591796875, -4.190673828125, -3.9556884765625, -3.720703125, -3.4857177734375, -3.250732421875, -3.0157470703125, -2.78076171875, -2.5457763671875, -2.310791015625, -2.0758056640625, -1.8408203125, -1.6058349609375, -1.370849609375, -1.1358642578125, -0.90087890625, -0.6658935546875, -0.430908203125, -0.1959228515625, 0.0390625, 0.2740478515625, 0.509033203125, 0.7440185546875, 0.97900390625, 1.2139892578125, 1.448974609375, 1.6839599609375, 1.9189453125, 2.1539306640625, 2.388916015625, 2.6239013671875, 2.85888671875, 3.0938720703125, 3.328857421875, 3.5638427734375, 3.798828125, 4.0338134765625, 4.268798828125, 4.5037841796875, 4.73876953125, 4.9737548828125, 5.208740234375, 5.4437255859375, 5.6787109375, 5.9136962890625, 6.148681640625, 6.3836669921875, 6.61865234375, 6.8536376953125, 7.088623046875, 7.3236083984375, 7.55859375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 9.0, 44.0, 201.0, 371.0, 297.0, 80.0, 12.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.52214813232422, -59.07243347167969, -57.622718811035156, -56.173004150390625, -54.723289489746094, -53.27357482910156, -51.82386016845703, -50.3741455078125, -48.92443084716797, -47.47471618652344, -46.025001525878906, -44.575286865234375, -43.125572204589844, -41.67585754394531, -40.22614288330078, -38.77642822265625, -37.326717376708984, -35.87700271606445, -34.42728805541992, -32.97757339477539, -31.52785873413086, -30.078144073486328, -28.62843132019043, -27.1787166595459, -25.729001998901367, -24.279287338256836, -22.829572677612305, -21.379859924316406, -19.930145263671875, -18.480430603027344, -17.030715942382812, -15.581001281738281, -14.13128662109375, -12.681571960449219, -11.231857299804688, -9.782143592834473, -8.332428932189941, -6.88271427154541, -5.433000564575195, -3.983285903930664, -2.533571243286133, -1.0838568210601807, 0.3658576011657715, 1.8155717849731445, 3.265286445617676, 4.715001106262207, 6.164714813232422, 7.614429473876953, 9.064144134521484, 10.513858795166016, 11.963573455810547, 13.413287162780762, 14.863001823425293, 16.31271743774414, 17.76243019104004, 19.21214485168457, 20.6618595123291, 22.111574172973633, 23.561288833618164, 25.011001586914062, 26.460716247558594, 27.910430908203125, 29.360145568847656, 30.809860229492188, 32.25957489013672]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 1.0, 12.0, 11.0, 10.0, 12.0, 16.0, 27.0, 27.0, 24.0, 18.0, 25.0, 31.0, 28.0, 29.0, 42.0, 42.0, 52.0, 45.0, 44.0, 44.0, 35.0, 41.0, 48.0, 34.0, 32.0, 33.0, 28.0, 19.0, 24.0, 28.0, 20.0, 19.0, 13.0, 21.0, 5.0, 16.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-13.023686408996582, -12.636239051818848, -12.248790740966797, -11.861343383789062, -11.473895072937012, -11.086447715759277, -10.698999404907227, -10.311552047729492, -9.924104690551758, -9.536657333374023, -9.149209022521973, -8.761761665344238, -8.374313354492188, -7.986865997314453, -7.5994181632995605, -7.211970329284668, -6.824522018432617, -6.437074184417725, -6.049626350402832, -5.662178993225098, -5.274730682373047, -4.8872833251953125, -4.49983549118042, -4.112387657165527, -3.7249398231506348, -3.337491989135742, -2.9500441551208496, -2.562596559524536, -2.1751487255096436, -1.787700891494751, -1.4002532958984375, -1.012805461883545, -0.6253576278686523, -0.23790985345840454, 0.14953792095184326, 0.5369856357574463, 0.9244334697723389, 1.3118813037872314, 1.699328899383545, 2.0867767333984375, 2.47422456741333, 2.8616724014282227, 3.2491202354431152, 3.6365678310394287, 4.024015426635742, 4.411463737487793, 4.798911094665527, 5.18635892868042, 5.5738067626953125, 5.961254596710205, 6.348702430725098, 6.736149787902832, 7.123598098754883, 7.511045455932617, 7.89849328994751, 8.285941123962402, 8.673389434814453, 9.060836791992188, 9.448285102844238, 9.835732460021973, 10.223180770874023, 10.610628128051758, 10.998075485229492, 11.385523796081543, 11.772971153259277]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 7.0, 8.0, 10.0, 18.0, 13.0, 14.0, 17.0, 27.0, 33.0, 35.0, 20.0, 37.0, 39.0, 48.0, 36.0, 51.0, 61.0, 39.0, 48.0, 40.0, 40.0, 49.0, 36.0, 40.0, 30.0, 24.0, 24.0, 20.0, 16.0, 17.0, 14.0, 20.0, 7.0, 12.0, 3.0, 6.0, 8.0, 8.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4677734375, -1.4225311279296875, -1.377288818359375, -1.3320465087890625, -1.28680419921875, -1.2415618896484375, -1.196319580078125, -1.1510772705078125, -1.1058349609375, -1.0605926513671875, -1.015350341796875, -0.9701080322265625, -0.92486572265625, -0.8796234130859375, -0.834381103515625, -0.7891387939453125, -0.743896484375, -0.6986541748046875, -0.653411865234375, -0.6081695556640625, -0.56292724609375, -0.5176849365234375, -0.472442626953125, -0.4272003173828125, -0.3819580078125, -0.3367156982421875, -0.291473388671875, -0.2462310791015625, -0.20098876953125, -0.1557464599609375, -0.110504150390625, -0.0652618408203125, -0.02001953125, 0.0252227783203125, 0.070465087890625, 0.1157073974609375, 0.16094970703125, 0.2061920166015625, 0.251434326171875, 0.2966766357421875, 0.3419189453125, 0.3871612548828125, 0.432403564453125, 0.4776458740234375, 0.52288818359375, 0.5681304931640625, 0.613372802734375, 0.6586151123046875, 0.703857421875, 0.7490997314453125, 0.794342041015625, 0.8395843505859375, 0.88482666015625, 0.9300689697265625, 0.975311279296875, 1.0205535888671875, 1.0657958984375, 1.1110382080078125, 1.156280517578125, 1.2015228271484375, 1.24676513671875, 1.2920074462890625, 1.337249755859375, 1.3824920654296875, 1.427734375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 10.0, 9.0, 13.0, 7.0, 9.0, 30.0, 40.0, 66.0, 91.0, 98.0, 165.0, 267.0, 507.0, 1008.0, 1998.0, 4322.0, 11191.0, 37678.0, 281296.0, 2876667.0, 876481.0, 71756.0, 17831.0, 6505.0, 2851.0, 1502.0, 762.0, 414.0, 244.0, 125.0, 95.0, 73.0, 47.0, 31.0, 21.0, 18.0, 8.0, 9.0, 5.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.65325927734375, -3.5213623046875, -3.38946533203125, -3.257568359375, -3.12567138671875, -2.9937744140625, -2.86187744140625, -2.72998046875, -2.59808349609375, -2.4661865234375, -2.33428955078125, -2.202392578125, -2.07049560546875, -1.9385986328125, -1.80670166015625, -1.6748046875, -1.54290771484375, -1.4110107421875, -1.27911376953125, -1.147216796875, -1.01531982421875, -0.8834228515625, -0.75152587890625, -0.61962890625, -0.48773193359375, -0.3558349609375, -0.22393798828125, -0.092041015625, 0.03985595703125, 0.1717529296875, 0.30364990234375, 0.435546875, 0.56744384765625, 0.6993408203125, 0.83123779296875, 0.963134765625, 1.09503173828125, 1.2269287109375, 1.35882568359375, 1.49072265625, 1.62261962890625, 1.7545166015625, 1.88641357421875, 2.018310546875, 2.15020751953125, 2.2821044921875, 2.41400146484375, 2.5458984375, 2.67779541015625, 2.8096923828125, 2.94158935546875, 3.073486328125, 3.20538330078125, 3.3372802734375, 3.46917724609375, 3.60107421875, 3.73297119140625, 3.8648681640625, 3.99676513671875, 4.128662109375, 4.26055908203125, 4.3924560546875, 4.52435302734375, 4.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 9.0, 8.0, 9.0, 13.0, 17.0, 29.0, 37.0, 48.0, 70.0, 105.0, 165.0, 196.0, 325.0, 442.0, 554.0, 556.0, 450.0, 325.0, 207.0, 111.0, 90.0, 84.0, 67.0, 29.0, 26.0, 20.0, 20.0, 14.0, 7.0, 8.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.611328125, -3.51104736328125, -3.4107666015625, -3.31048583984375, -3.210205078125, -3.10992431640625, -3.0096435546875, -2.90936279296875, -2.80908203125, -2.70880126953125, -2.6085205078125, -2.50823974609375, -2.407958984375, -2.30767822265625, -2.2073974609375, -2.10711669921875, -2.0068359375, -1.90655517578125, -1.8062744140625, -1.70599365234375, -1.605712890625, -1.50543212890625, -1.4051513671875, -1.30487060546875, -1.20458984375, -1.10430908203125, -1.0040283203125, -0.90374755859375, -0.803466796875, -0.70318603515625, -0.6029052734375, -0.50262451171875, -0.40234375, -0.30206298828125, -0.2017822265625, -0.10150146484375, -0.001220703125, 0.09906005859375, 0.1993408203125, 0.29962158203125, 0.39990234375, 0.50018310546875, 0.6004638671875, 0.70074462890625, 0.801025390625, 0.90130615234375, 1.0015869140625, 1.10186767578125, 1.2021484375, 1.30242919921875, 1.4027099609375, 1.50299072265625, 1.603271484375, 1.70355224609375, 1.8038330078125, 1.90411376953125, 2.00439453125, 2.10467529296875, 2.2049560546875, 2.30523681640625, 2.405517578125, 2.50579833984375, 2.6060791015625, 2.70635986328125, 2.806640625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 17.0, 19.0, 31.0, 35.0, 48.0, 89.0, 159.0, 278.0, 543.0, 1112.0, 2426.0, 6668.0, 21830.0, 103640.0, 1238227.0, 2588820.0, 182906.0, 32347.0, 9172.0, 3132.0, 1332.0, 631.0, 321.0, 205.0, 87.0, 62.0, 29.0, 28.0, 20.0, 19.0, 10.0, 7.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.1124267578125, -4.924072265625, -4.7357177734375, -4.54736328125, -4.3590087890625, -4.170654296875, -3.9822998046875, -3.7939453125, -3.6055908203125, -3.417236328125, -3.2288818359375, -3.04052734375, -2.8521728515625, -2.663818359375, -2.4754638671875, -2.287109375, -2.0987548828125, -1.910400390625, -1.7220458984375, -1.53369140625, -1.3453369140625, -1.156982421875, -0.9686279296875, -0.7802734375, -0.5919189453125, -0.403564453125, -0.2152099609375, -0.02685546875, 0.1614990234375, 0.349853515625, 0.5382080078125, 0.7265625, 0.9149169921875, 1.103271484375, 1.2916259765625, 1.47998046875, 1.6683349609375, 1.856689453125, 2.0450439453125, 2.2333984375, 2.4217529296875, 2.610107421875, 2.7984619140625, 2.98681640625, 3.1751708984375, 3.363525390625, 3.5518798828125, 3.740234375, 3.9285888671875, 4.116943359375, 4.3052978515625, 4.49365234375, 4.6820068359375, 4.870361328125, 5.0587158203125, 5.2470703125, 5.4354248046875, 5.623779296875, 5.8121337890625, 6.00048828125, 6.1888427734375, 6.377197265625, 6.5655517578125, 6.75390625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 10.0, 4.0, 7.0, 19.0, 18.0, 18.0, 34.0, 38.0, 54.0, 60.0, 64.0, 99.0, 87.0, 94.0, 86.0, 86.0, 65.0, 43.0, 33.0, 27.0, 18.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.854825019836426, -12.424972534179688, -11.99512004852295, -11.565267562866211, -11.135414123535156, -10.705561637878418, -10.27570915222168, -9.845856666564941, -9.416004180908203, -8.986151695251465, -8.556299209594727, -8.126445770263672, -7.696593761444092, -7.266740798950195, -6.836888313293457, -6.407035827636719, -5.977182865142822, -5.547330379486084, -5.1174774169921875, -4.687624931335449, -4.257772445678711, -3.8279197216033936, -3.398066997528076, -2.968214511871338, -2.5383617877960205, -2.108509063720703, -1.6786565780639648, -1.2488038539886475, -0.8189512491226196, -0.3890986442565918, 0.040754079818725586, 0.47060656547546387, 0.9004592895507812, 1.330311894416809, 1.760164499282837, 2.1900172233581543, 2.6198697090148926, 3.04972243309021, 3.4795751571655273, 3.9094276428222656, 4.339280128479004, 4.769132614135742, 5.198985576629639, 5.628838062286377, 6.058690547943115, 6.488543510437012, 6.91839599609375, 7.348248481750488, 7.778101444244385, 8.207954406738281, 8.63780689239502, 9.067659378051758, 9.497511863708496, 9.927364349365234, 10.357217788696289, 10.787069320678711, 11.216922760009766, 11.646775245666504, 12.076627731323242, 12.506481170654297, 12.936333656311035, 13.366186141967773, 13.796038627624512, 14.22589111328125, 14.655743598937988]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 9.0, 8.0, 14.0, 18.0, 12.0, 11.0, 18.0, 13.0, 21.0, 30.0, 26.0, 34.0, 26.0, 37.0, 43.0, 38.0, 38.0, 30.0, 38.0, 40.0, 29.0, 40.0, 36.0, 38.0, 39.0, 38.0, 36.0, 21.0, 27.0, 21.0, 19.0, 15.0, 23.0, 19.0, 17.0, 21.0, 11.0, 9.0, 8.0, 10.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0], "bins": [-10.632645606994629, -10.340533256530762, -10.048420906066895, -9.756307601928711, -9.464195251464844, -9.172082901000977, -8.87997055053711, -8.587858200073242, -8.295744895935059, -8.003632545471191, -7.711519718170166, -7.419407367706299, -7.127294540405273, -6.835182189941406, -6.543069839477539, -6.250957012176514, -5.9588446617126465, -5.666732311248779, -5.374619483947754, -5.082507133483887, -4.790394306182861, -4.498281955718994, -4.206169128417969, -3.9140567779541016, -3.6219441890716553, -3.329831600189209, -3.0377190113067627, -2.7456064224243164, -2.453494071960449, -2.161381244659424, -1.8692688941955566, -1.5771563053131104, -1.285043716430664, -0.9929311275482178, -0.7008185982704163, -0.40870606899261475, -0.11659348011016846, 0.17551910877227783, 0.46763157844543457, 0.7597441673278809, 1.0518567562103271, 1.3439693450927734, 1.6360819339752197, 1.9281944036483765, 2.220306873321533, 2.5124197006225586, 2.804532051086426, 3.096644639968872, 3.3887572288513184, 3.6808698177337646, 3.972982406616211, 4.265094757080078, 4.5572075843811035, 4.849319934844971, 5.141432762145996, 5.433545112609863, 5.7256574630737305, 6.017769813537598, 6.309882640838623, 6.60199499130249, 6.894107818603516, 7.186220169067383, 7.47833251953125, 7.770445346832275, 8.0625581741333]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 8.0, 16.0, 15.0, 15.0, 19.0, 26.0, 24.0, 26.0, 24.0, 39.0, 33.0, 44.0, 42.0, 59.0, 39.0, 44.0, 49.0, 68.0, 56.0, 37.0, 46.0, 39.0, 22.0, 39.0, 22.0, 27.0, 18.0, 18.0, 13.0, 14.0, 11.0, 10.0, 7.0, 7.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.697265625, -1.6486968994140625, -1.600128173828125, -1.5515594482421875, -1.50299072265625, -1.4544219970703125, -1.405853271484375, -1.3572845458984375, -1.3087158203125, -1.2601470947265625, -1.211578369140625, -1.1630096435546875, -1.11444091796875, -1.0658721923828125, -1.017303466796875, -0.9687347412109375, -0.920166015625, -0.8715972900390625, -0.823028564453125, -0.7744598388671875, -0.72589111328125, -0.6773223876953125, -0.628753662109375, -0.5801849365234375, -0.5316162109375, -0.4830474853515625, -0.434478759765625, -0.3859100341796875, -0.33734130859375, -0.2887725830078125, -0.240203857421875, -0.1916351318359375, -0.14306640625, -0.0944976806640625, -0.045928955078125, 0.0026397705078125, 0.05120849609375, 0.0997772216796875, 0.148345947265625, 0.1969146728515625, 0.2454833984375, 0.2940521240234375, 0.342620849609375, 0.3911895751953125, 0.43975830078125, 0.4883270263671875, 0.536895751953125, 0.5854644775390625, 0.634033203125, 0.6826019287109375, 0.731170654296875, 0.7797393798828125, 0.82830810546875, 0.8768768310546875, 0.925445556640625, 0.9740142822265625, 1.0225830078125, 1.0711517333984375, 1.119720458984375, 1.1682891845703125, 1.21685791015625, 1.2654266357421875, 1.313995361328125, 1.3625640869140625, 1.4111328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 13.0, 21.0, 24.0, 38.0, 64.0, 96.0, 132.0, 240.0, 412.0, 593.0, 993.0, 1696.0, 2824.0, 4729.0, 8118.0, 13967.0, 24226.0, 40895.0, 66488.0, 103969.0, 150387.0, 181974.0, 157042.0, 110075.0, 71912.0, 44387.0, 26386.0, 15328.0, 8865.0, 5093.0, 2986.0, 1743.0, 1048.0, 665.0, 411.0, 249.0, 149.0, 107.0, 75.0, 32.0, 33.0, 21.0, 10.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9072113037109375, -0.879364013671875, -0.8515167236328125, -0.82366943359375, -0.7958221435546875, -0.767974853515625, -0.7401275634765625, -0.7122802734375, -0.6844329833984375, -0.656585693359375, -0.6287384033203125, -0.60089111328125, -0.5730438232421875, -0.545196533203125, -0.5173492431640625, -0.489501953125, -0.4616546630859375, -0.433807373046875, -0.4059600830078125, -0.37811279296875, -0.3502655029296875, -0.322418212890625, -0.2945709228515625, -0.2667236328125, -0.2388763427734375, -0.211029052734375, -0.1831817626953125, -0.15533447265625, -0.1274871826171875, -0.099639892578125, -0.0717926025390625, -0.0439453125, -0.0160980224609375, 0.011749267578125, 0.0395965576171875, 0.06744384765625, 0.0952911376953125, 0.123138427734375, 0.1509857177734375, 0.1788330078125, 0.2066802978515625, 0.234527587890625, 0.2623748779296875, 0.29022216796875, 0.3180694580078125, 0.345916748046875, 0.3737640380859375, 0.401611328125, 0.4294586181640625, 0.457305908203125, 0.4851531982421875, 0.51300048828125, 0.5408477783203125, 0.568695068359375, 0.5965423583984375, 0.6243896484375, 0.6522369384765625, 0.680084228515625, 0.7079315185546875, 0.73577880859375, 0.7636260986328125, 0.791473388671875, 0.8193206787109375, 0.84716796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 18.0, 16.0, 10.0, 13.0, 9.0, 16.0, 25.0, 17.0, 23.0, 32.0, 36.0, 35.0, 38.0, 25.0, 40.0, 42.0, 37.0, 36.0, 1060.0, 45.0, 40.0, 39.0, 36.0, 30.0, 32.0, 27.0, 17.0, 29.0, 25.0, 25.0, 18.0, 16.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1083984375, -1.0740509033203125, -1.039703369140625, -1.0053558349609375, -0.97100830078125, -0.9366607666015625, -0.902313232421875, -0.8679656982421875, -0.8336181640625, -0.7992706298828125, -0.764923095703125, -0.7305755615234375, -0.69622802734375, -0.6618804931640625, -0.627532958984375, -0.5931854248046875, -0.558837890625, -0.5244903564453125, -0.490142822265625, -0.4557952880859375, -0.42144775390625, -0.3871002197265625, -0.352752685546875, -0.3184051513671875, -0.2840576171875, -0.2497100830078125, -0.215362548828125, -0.1810150146484375, -0.14666748046875, -0.1123199462890625, -0.077972412109375, -0.0436248779296875, -0.00927734375, 0.0250701904296875, 0.059417724609375, 0.0937652587890625, 0.12811279296875, 0.1624603271484375, 0.196807861328125, 0.2311553955078125, 0.2655029296875, 0.2998504638671875, 0.334197998046875, 0.3685455322265625, 0.40289306640625, 0.4372406005859375, 0.471588134765625, 0.5059356689453125, 0.540283203125, 0.5746307373046875, 0.608978271484375, 0.6433258056640625, 0.67767333984375, 0.7120208740234375, 0.746368408203125, 0.7807159423828125, 0.8150634765625, 0.8494110107421875, 0.883758544921875, 0.9181060791015625, 0.95245361328125, 0.9868011474609375, 1.021148681640625, 1.0554962158203125, 1.08984375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 23.0, 36.0, 54.0, 63.0, 100.0, 132.0, 215.0, 306.0, 407.0, 597.0, 933.0, 1320.0, 1940.0, 2878.0, 4258.0, 6208.0, 9379.0, 14858.0, 25536.0, 65595.0, 425459.0, 1350686.0, 103735.0, 32565.0, 17091.0, 10596.0, 7081.0, 4807.0, 3199.0, 2275.0, 1476.0, 1037.0, 719.0, 443.0, 290.0, 254.0, 190.0, 112.0, 76.0, 59.0, 41.0, 17.0, 17.0, 12.0, 13.0, 1.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.96875, -0.938629150390625, -0.90850830078125, -0.878387451171875, -0.8482666015625, -0.818145751953125, -0.78802490234375, -0.757904052734375, -0.727783203125, -0.697662353515625, -0.66754150390625, -0.637420654296875, -0.6072998046875, -0.577178955078125, -0.54705810546875, -0.516937255859375, -0.48681640625, -0.456695556640625, -0.42657470703125, -0.396453857421875, -0.3663330078125, -0.336212158203125, -0.30609130859375, -0.275970458984375, -0.245849609375, -0.215728759765625, -0.18560791015625, -0.155487060546875, -0.1253662109375, -0.095245361328125, -0.06512451171875, -0.035003662109375, -0.0048828125, 0.025238037109375, 0.05535888671875, 0.085479736328125, 0.1156005859375, 0.145721435546875, 0.17584228515625, 0.205963134765625, 0.236083984375, 0.266204833984375, 0.29632568359375, 0.326446533203125, 0.3565673828125, 0.386688232421875, 0.41680908203125, 0.446929931640625, 0.47705078125, 0.507171630859375, 0.53729248046875, 0.567413330078125, 0.5975341796875, 0.627655029296875, 0.65777587890625, 0.687896728515625, 0.718017578125, 0.748138427734375, 0.77825927734375, 0.808380126953125, 0.8385009765625, 0.868621826171875, 0.89874267578125, 0.928863525390625, 0.958984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 12.0, 15.0, 17.0, 14.0, 21.0, 38.0, 33.0, 46.0, 49.0, 46.0, 83.0, 77.0, 98.0, 66.0, 62.0, 57.0, 42.0, 35.0, 38.0, 29.0, 14.0, 17.0, 8.0, 12.0, 12.0, 5.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.12310791015625, -0.11988067626953125, -0.1166534423828125, -0.11342620849609375, -0.110198974609375, -0.10697174072265625, -0.1037445068359375, -0.10051727294921875, -0.0972900390625, -0.09406280517578125, -0.0908355712890625, -0.08760833740234375, -0.084381103515625, -0.08115386962890625, -0.0779266357421875, -0.07469940185546875, -0.07147216796875, -0.06824493408203125, -0.0650177001953125, -0.06179046630859375, -0.058563232421875, -0.05533599853515625, -0.0521087646484375, -0.04888153076171875, -0.045654296875, -0.04242706298828125, -0.0391998291015625, -0.03597259521484375, -0.032745361328125, -0.02951812744140625, -0.0262908935546875, -0.02306365966796875, -0.01983642578125, -0.01660919189453125, -0.0133819580078125, -0.01015472412109375, -0.006927490234375, -0.00370025634765625, -0.0004730224609375, 0.00275421142578125, 0.0059814453125, 0.00920867919921875, 0.0124359130859375, 0.01566314697265625, 0.018890380859375, 0.02211761474609375, 0.0253448486328125, 0.02857208251953125, 0.03179931640625, 0.03502655029296875, 0.0382537841796875, 0.04148101806640625, 0.044708251953125, 0.04793548583984375, 0.0511627197265625, 0.05438995361328125, 0.0576171875, 0.06084442138671875, 0.0640716552734375, 0.06729888916015625, 0.070526123046875, 0.07375335693359375, 0.0769805908203125, 0.08020782470703125, 0.08343505859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 12.0, 12.0, 30.0, 24.0, 50.0, 83.0, 128.0, 281.0, 1032.0, 6918.0, 170311.0, 847865.0, 18855.0, 2072.0, 379.0, 163.0, 86.0, 57.0, 41.0, 23.0, 28.0, 16.0, 10.0, 8.0, 10.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4230194091796875, -1.366546630859375, -1.3100738525390625, -1.25360107421875, -1.1971282958984375, -1.140655517578125, -1.0841827392578125, -1.0277099609375, -0.9712371826171875, -0.914764404296875, -0.8582916259765625, -0.80181884765625, -0.7453460693359375, -0.688873291015625, -0.6324005126953125, -0.575927734375, -0.5194549560546875, -0.462982177734375, -0.4065093994140625, -0.35003662109375, -0.2935638427734375, -0.237091064453125, -0.1806182861328125, -0.1241455078125, -0.0676727294921875, -0.011199951171875, 0.0452728271484375, 0.10174560546875, 0.1582183837890625, 0.214691162109375, 0.2711639404296875, 0.32763671875, 0.3841094970703125, 0.440582275390625, 0.4970550537109375, 0.55352783203125, 0.6100006103515625, 0.666473388671875, 0.7229461669921875, 0.7794189453125, 0.8358917236328125, 0.892364501953125, 0.9488372802734375, 1.00531005859375, 1.0617828369140625, 1.118255615234375, 1.1747283935546875, 1.231201171875, 1.2876739501953125, 1.344146728515625, 1.4006195068359375, 1.45709228515625, 1.5135650634765625, 1.570037841796875, 1.6265106201171875, 1.6829833984375, 1.7394561767578125, 1.795928955078125, 1.8524017333984375, 1.90887451171875, 1.9653472900390625, 2.021820068359375, 2.0782928466796875, 2.134765625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 10.0, 17.0, 32.0, 49.0, 50.0, 90.0, 136.0, 155.0, 138.0, 106.0, 64.0, 34.0, 33.0, 24.0, 16.0, 10.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9815634489059448, -0.9584847688674927, -0.9354060292243958, -0.9123273491859436, -0.8892486095428467, -0.8661699295043945, -0.8430912494659424, -0.8200125694274902, -0.7969338297843933, -0.7738551497459412, -0.7507764101028442, -0.7276977300643921, -0.7046190500259399, -0.681540310382843, -0.6584616303443909, -0.635382890701294, -0.6123042106628418, -0.5892255306243896, -0.5661467909812927, -0.5430681109428406, -0.5199893712997437, -0.4969106912612915, -0.47383201122283936, -0.4507533013820648, -0.4276745915412903, -0.40459588170051575, -0.3815171718597412, -0.35843849182128906, -0.3353597819805145, -0.31228107213974, -0.28920239210128784, -0.2661236822605133, -0.24304494261741638, -0.21996623277664185, -0.1968875378370285, -0.17380884289741516, -0.15073013305664062, -0.1276514232158661, -0.10457272827625275, -0.0814940333366394, -0.05841532349586487, -0.03533662110567093, -0.01225791871547699, 0.01082078367471695, 0.03389948606491089, 0.05697818845510483, 0.08005689084529877, 0.10313558578491211, 0.12621429562568665, 0.14929300546646118, 0.17237170040607452, 0.19545039534568787, 0.2185291051864624, 0.24160781502723694, 0.2646865248680115, 0.2877652049064636, 0.31084391474723816, 0.3339226245880127, 0.35700130462646484, 0.3800800144672394, 0.4031587243080139, 0.42623743414878845, 0.449316143989563, 0.47239482402801514, 0.4954735338687897]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 8.0, 5.0, 14.0, 18.0, 27.0, 40.0, 35.0, 42.0, 45.0, 50.0, 70.0, 57.0, 80.0, 77.0, 57.0, 56.0, 59.0, 43.0, 56.0, 38.0, 28.0, 27.0, 24.0, 14.0, 9.0, 10.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7357281446456909, -0.7173859477043152, -0.6990438103675842, -0.6807016134262085, -0.6623594164848328, -0.644017219543457, -0.6256750822067261, -0.6073328852653503, -0.5889906883239746, -0.5706484913825989, -0.5523063540458679, -0.5339641571044922, -0.5156219601631165, -0.4972797930240631, -0.47893762588500977, -0.46059542894363403, -0.4422532618045807, -0.42391109466552734, -0.4055688977241516, -0.38722673058509827, -0.36888453364372253, -0.3505423665046692, -0.33220016956329346, -0.3138580024242401, -0.29551583528518677, -0.2771736681461334, -0.2588314712047577, -0.24048930406570435, -0.2221471071243286, -0.20380493998527527, -0.18546275794506073, -0.1671205759048462, -0.14877837896347046, -0.13043619692325592, -0.11209401488304138, -0.09375184029340744, -0.0754096582531929, -0.05706747621297836, -0.03872530162334442, -0.020383119583129883, -0.0020409375429153442, 0.016301242634654045, 0.034643422812223434, 0.052985601127147675, 0.07132778316736221, 0.08966996520757675, 0.1080121397972107, 0.12635432183742523, 0.14469650387763977, 0.1630386859178543, 0.18138086795806885, 0.1997230350971222, 0.21806523203849792, 0.23640739917755127, 0.254749596118927, 0.27309176325798035, 0.2914339303970337, 0.30977609753608704, 0.32811829447746277, 0.3464604616165161, 0.36480265855789185, 0.3831448256969452, 0.40148699283599854, 0.41982918977737427, 0.43817138671875]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 30.0, 20.0, 30.0, 41.0, 53.0, 49.0, 52.0, 51.0, 72.0, 76.0, 72.0, 75.0, 67.0, 58.0, 46.0, 46.0, 31.0, 22.0, 29.0, 17.0, 14.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0], "bins": [-3.1796875, -3.1104736328125, -3.041259765625, -2.9720458984375, -2.90283203125, -2.8336181640625, -2.764404296875, -2.6951904296875, -2.6259765625, -2.5567626953125, -2.487548828125, -2.4183349609375, -2.34912109375, -2.2799072265625, -2.210693359375, -2.1414794921875, -2.072265625, -2.0030517578125, -1.933837890625, -1.8646240234375, -1.79541015625, -1.7261962890625, -1.656982421875, -1.5877685546875, -1.5185546875, -1.4493408203125, -1.380126953125, -1.3109130859375, -1.24169921875, -1.1724853515625, -1.103271484375, -1.0340576171875, -0.96484375, -0.8956298828125, -0.826416015625, -0.7572021484375, -0.68798828125, -0.6187744140625, -0.549560546875, -0.4803466796875, -0.4111328125, -0.3419189453125, -0.272705078125, -0.2034912109375, -0.13427734375, -0.0650634765625, 0.004150390625, 0.0733642578125, 0.142578125, 0.2117919921875, 0.281005859375, 0.3502197265625, 0.41943359375, 0.4886474609375, 0.557861328125, 0.6270751953125, 0.6962890625, 0.7655029296875, 0.834716796875, 0.9039306640625, 0.97314453125, 1.0423583984375, 1.111572265625, 1.1807861328125, 1.25]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 9.0, 19.0, 23.0, 41.0, 56.0, 98.0, 162.0, 235.0, 417.0, 765.0, 1401.0, 2709.0, 5753.0, 13653.0, 38859.0, 144011.0, 524645.0, 226741.0, 55827.0, 18486.0, 7447.0, 3371.0, 1735.0, 894.0, 453.0, 295.0, 156.0, 95.0, 60.0, 43.0, 31.0, 15.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.837890625, -2.735260009765625, -2.63262939453125, -2.529998779296875, -2.4273681640625, -2.324737548828125, -2.22210693359375, -2.119476318359375, -2.016845703125, -1.914215087890625, -1.81158447265625, -1.708953857421875, -1.6063232421875, -1.503692626953125, -1.40106201171875, -1.298431396484375, -1.19580078125, -1.093170166015625, -0.99053955078125, -0.887908935546875, -0.7852783203125, -0.682647705078125, -0.58001708984375, -0.477386474609375, -0.374755859375, -0.272125244140625, -0.16949462890625, -0.066864013671875, 0.0357666015625, 0.138397216796875, 0.24102783203125, 0.343658447265625, 0.4462890625, 0.548919677734375, 0.65155029296875, 0.754180908203125, 0.8568115234375, 0.959442138671875, 1.06207275390625, 1.164703369140625, 1.267333984375, 1.369964599609375, 1.47259521484375, 1.575225830078125, 1.6778564453125, 1.780487060546875, 1.88311767578125, 1.985748291015625, 2.08837890625, 2.191009521484375, 2.29364013671875, 2.396270751953125, 2.4989013671875, 2.601531982421875, 2.70416259765625, 2.806793212890625, 2.909423828125, 3.012054443359375, 3.11468505859375, 3.217315673828125, 3.3199462890625, 3.422576904296875, 3.52520751953125, 3.627838134765625, 3.73046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 25.0, 14.0, 22.0, 25.0, 17.0, 16.0, 26.0, 21.0, 35.0, 40.0, 68.0, 68.0, 94.0, 147.0, 286.0, 1343.0, 198.0, 89.0, 74.0, 58.0, 29.0, 39.0, 33.0, 33.0, 26.0, 26.0, 19.0, 23.0, 20.0, 15.0, 8.0, 10.0, 13.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.955078125, -3.827789306640625, -3.70050048828125, -3.573211669921875, -3.4459228515625, -3.318634033203125, -3.19134521484375, -3.064056396484375, -2.936767578125, -2.809478759765625, -2.68218994140625, -2.554901123046875, -2.4276123046875, -2.300323486328125, -2.17303466796875, -2.045745849609375, -1.91845703125, -1.791168212890625, -1.66387939453125, -1.536590576171875, -1.4093017578125, -1.282012939453125, -1.15472412109375, -1.027435302734375, -0.900146484375, -0.772857666015625, -0.64556884765625, -0.518280029296875, -0.3909912109375, -0.263702392578125, -0.13641357421875, -0.009124755859375, 0.1181640625, 0.245452880859375, 0.37274169921875, 0.500030517578125, 0.6273193359375, 0.754608154296875, 0.88189697265625, 1.009185791015625, 1.136474609375, 1.263763427734375, 1.39105224609375, 1.518341064453125, 1.6456298828125, 1.772918701171875, 1.90020751953125, 2.027496337890625, 2.15478515625, 2.282073974609375, 2.40936279296875, 2.536651611328125, 2.6639404296875, 2.791229248046875, 2.91851806640625, 3.045806884765625, 3.173095703125, 3.300384521484375, 3.42767333984375, 3.554962158203125, 3.6822509765625, 3.809539794921875, 3.93682861328125, 4.064117431640625, 4.19140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 3.0, 2.0, 11.0, 1.0, 16.0, 15.0, 17.0, 21.0, 25.0, 30.0, 41.0, 52.0, 53.0, 68.0, 94.0, 111.0, 208.0, 350.0, 655.0, 1977.0, 9764.0, 99632.0, 2627056.0, 378176.0, 21618.0, 3466.0, 979.0, 403.0, 234.0, 139.0, 131.0, 75.0, 53.0, 47.0, 35.0, 27.0, 27.0, 15.0, 23.0, 10.0, 9.0, 3.0, 7.0, 11.0, 5.0, 6.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.16436767578125, -7.9146728515625, -7.66497802734375, -7.415283203125, -7.16558837890625, -6.9158935546875, -6.66619873046875, -6.41650390625, -6.16680908203125, -5.9171142578125, -5.66741943359375, -5.417724609375, -5.16802978515625, -4.9183349609375, -4.66864013671875, -4.4189453125, -4.16925048828125, -3.9195556640625, -3.66986083984375, -3.420166015625, -3.17047119140625, -2.9207763671875, -2.67108154296875, -2.42138671875, -2.17169189453125, -1.9219970703125, -1.67230224609375, -1.422607421875, -1.17291259765625, -0.9232177734375, -0.67352294921875, -0.423828125, -0.17413330078125, 0.0755615234375, 0.32525634765625, 0.574951171875, 0.82464599609375, 1.0743408203125, 1.32403564453125, 1.57373046875, 1.82342529296875, 2.0731201171875, 2.32281494140625, 2.572509765625, 2.82220458984375, 3.0718994140625, 3.32159423828125, 3.5712890625, 3.82098388671875, 4.0706787109375, 4.32037353515625, 4.570068359375, 4.81976318359375, 5.0694580078125, 5.31915283203125, 5.56884765625, 5.81854248046875, 6.0682373046875, 6.31793212890625, 6.567626953125, 6.81732177734375, 7.0670166015625, 7.31671142578125, 7.56640625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 308.0, 705.0, 1.0, 1.0], "bins": [-339.839599609375, -334.2760925292969, -328.7126159667969, -323.14910888671875, -317.58563232421875, -312.0221252441406, -306.4586181640625, -300.8951416015625, -295.3316345214844, -289.76812744140625, -284.20465087890625, -278.6411437988281, -273.07763671875, -267.51416015625, -261.9506530761719, -256.3871765136719, -250.82366943359375, -245.2601776123047, -239.69668579101562, -234.1331787109375, -228.56968688964844, -223.00619506835938, -217.44268798828125, -211.8791961669922, -206.31570434570312, -200.75221252441406, -195.188720703125, -189.62521362304688, -184.0617218017578, -178.49822998046875, -172.93472290039062, -167.37123107910156, -161.8077392578125, -156.24424743652344, -150.68075561523438, -145.11724853515625, -139.5537567138672, -133.99026489257812, -128.4267578125, -122.86326599121094, -117.29977416992188, -111.73628234863281, -106.17278289794922, -100.60928344726562, -95.04579162597656, -89.4822998046875, -83.9188003540039, -78.35530090332031, -72.79180908203125, -67.22831726074219, -61.664817810058594, -56.101322174072266, -50.53782653808594, -44.97433090209961, -39.41083526611328, -33.84733963012695, -28.28384017944336, -22.72034454345703, -17.156848907470703, -11.593353271484375, -6.029857635498047, -0.46636199951171875, 5.097133636474609, 10.660629272460938, 16.224124908447266]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 4.0, 15.0, 3.0, 14.0, 19.0, 15.0, 13.0, 22.0, 28.0, 22.0, 26.0, 35.0, 37.0, 31.0, 42.0, 33.0, 34.0, 50.0, 50.0, 55.0, 42.0, 39.0, 47.0, 33.0, 33.0, 32.0, 33.0, 27.0, 35.0, 17.0, 22.0, 18.0, 11.0, 7.0, 10.0, 10.0, 7.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.351264953613281, -14.917603492736816, -14.483942031860352, -14.050280570983887, -13.616619110107422, -13.182957649230957, -12.749296188354492, -12.315633773803711, -11.881973266601562, -11.448311805725098, -11.014650344848633, -10.580988883972168, -10.147327423095703, -9.713665962219238, -9.280004501342773, -8.846342086791992, -8.412680625915527, -7.9790191650390625, -7.545357704162598, -7.111696243286133, -6.678034782409668, -6.244373321533203, -5.81071138381958, -5.377049922943115, -4.94338846206665, -4.5097270011901855, -4.076065540313721, -3.6424038410186768, -3.208742380142212, -2.775080919265747, -2.341419219970703, -1.9077577590942383, -1.4740962982177734, -1.0404348373413086, -0.6067732572555542, -0.1731116771697998, 0.26054978370666504, 0.6942112445831299, 1.1278729438781738, 1.5615344047546387, 1.9951958656311035, 2.4288573265075684, 2.862518787384033, 3.296180486679077, 3.729841947555542, 4.163503646850586, 4.597165107727051, 5.030826568603516, 5.4644880294799805, 5.898149490356445, 6.33181095123291, 6.765472412109375, 7.19913387298584, 7.632795333862305, 8.066457748413086, 8.500118255615234, 8.933780670166016, 9.36744213104248, 9.801103591918945, 10.23476505279541, 10.668426513671875, 11.10208797454834, 11.535749435424805, 11.969411849975586, 12.403072357177734]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 8.0, 14.0, 11.0, 19.0, 26.0, 25.0, 49.0, 40.0, 40.0, 57.0, 71.0, 53.0, 65.0, 61.0, 61.0, 68.0, 61.0, 45.0, 42.0, 38.0, 35.0, 31.0, 19.0, 11.0, 13.0, 13.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.025390625, -2.9557647705078125, -2.886138916015625, -2.8165130615234375, -2.74688720703125, -2.6772613525390625, -2.607635498046875, -2.5380096435546875, -2.4683837890625, -2.3987579345703125, -2.329132080078125, -2.2595062255859375, -2.18988037109375, -2.1202545166015625, -2.050628662109375, -1.9810028076171875, -1.911376953125, -1.8417510986328125, -1.772125244140625, -1.7024993896484375, -1.63287353515625, -1.5632476806640625, -1.493621826171875, -1.4239959716796875, -1.3543701171875, -1.2847442626953125, -1.215118408203125, -1.1454925537109375, -1.07586669921875, -1.0062408447265625, -0.936614990234375, -0.8669891357421875, -0.79736328125, -0.7277374267578125, -0.658111572265625, -0.5884857177734375, -0.51885986328125, -0.4492340087890625, -0.379608154296875, -0.3099822998046875, -0.2403564453125, -0.1707305908203125, -0.101104736328125, -0.0314788818359375, 0.03814697265625, 0.1077728271484375, 0.177398681640625, 0.2470245361328125, 0.316650390625, 0.3862762451171875, 0.455902099609375, 0.5255279541015625, 0.59515380859375, 0.6647796630859375, 0.734405517578125, 0.8040313720703125, 0.8736572265625, 0.9432830810546875, 1.012908935546875, 1.0825347900390625, 1.15216064453125, 1.2217864990234375, 1.291412353515625, 1.3610382080078125, 1.4306640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 12.0, 9.0, 9.0, 16.0, 29.0, 16.0, 45.0, 66.0, 93.0, 171.0, 379.0, 1046.0, 3059.0, 11998.0, 85074.0, 2615493.0, 1409480.0, 53984.0, 9261.0, 2489.0, 898.0, 303.0, 139.0, 81.0, 36.0, 30.0, 22.0, 14.0, 15.0, 6.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-9.234375, -9.01910400390625, -8.8038330078125, -8.58856201171875, -8.373291015625, -8.15802001953125, -7.9427490234375, -7.72747802734375, -7.51220703125, -7.29693603515625, -7.0816650390625, -6.86639404296875, -6.651123046875, -6.43585205078125, -6.2205810546875, -6.00531005859375, -5.7900390625, -5.57476806640625, -5.3594970703125, -5.14422607421875, -4.928955078125, -4.71368408203125, -4.4984130859375, -4.28314208984375, -4.06787109375, -3.85260009765625, -3.6373291015625, -3.42205810546875, -3.206787109375, -2.99151611328125, -2.7762451171875, -2.56097412109375, -2.345703125, -2.13043212890625, -1.9151611328125, -1.69989013671875, -1.484619140625, -1.26934814453125, -1.0540771484375, -0.83880615234375, -0.62353515625, -0.40826416015625, -0.1929931640625, 0.02227783203125, 0.237548828125, 0.45281982421875, 0.6680908203125, 0.88336181640625, 1.0986328125, 1.31390380859375, 1.5291748046875, 1.74444580078125, 1.959716796875, 2.17498779296875, 2.3902587890625, 2.60552978515625, 2.82080078125, 3.03607177734375, 3.2513427734375, 3.46661376953125, 3.681884765625, 3.89715576171875, 4.1124267578125, 4.32769775390625, 4.54296875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 9.0, 12.0, 12.0, 14.0, 31.0, 45.0, 51.0, 50.0, 88.0, 101.0, 122.0, 175.0, 257.0, 381.0, 501.0, 500.0, 456.0, 350.0, 218.0, 178.0, 139.0, 89.0, 60.0, 57.0, 36.0, 28.0, 21.0, 22.0, 15.0, 13.0, 8.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.56683349609375, -2.4656982421875, -2.36456298828125, -2.263427734375, -2.16229248046875, -2.0611572265625, -1.96002197265625, -1.85888671875, -1.75775146484375, -1.6566162109375, -1.55548095703125, -1.454345703125, -1.35321044921875, -1.2520751953125, -1.15093994140625, -1.0498046875, -0.94866943359375, -0.8475341796875, -0.74639892578125, -0.645263671875, -0.54412841796875, -0.4429931640625, -0.34185791015625, -0.24072265625, -0.13958740234375, -0.0384521484375, 0.06268310546875, 0.163818359375, 0.26495361328125, 0.3660888671875, 0.46722412109375, 0.568359375, 0.66949462890625, 0.7706298828125, 0.87176513671875, 0.972900390625, 1.07403564453125, 1.1751708984375, 1.27630615234375, 1.37744140625, 1.47857666015625, 1.5797119140625, 1.68084716796875, 1.781982421875, 1.88311767578125, 1.9842529296875, 2.08538818359375, 2.1865234375, 2.28765869140625, 2.3887939453125, 2.48992919921875, 2.591064453125, 2.69219970703125, 2.7933349609375, 2.89447021484375, 2.99560546875, 3.09674072265625, 3.1978759765625, 3.29901123046875, 3.400146484375, 3.50128173828125, 3.6024169921875, 3.70355224609375, 3.8046875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 5.0, 6.0, 9.0, 15.0, 21.0, 28.0, 19.0, 35.0, 50.0, 87.0, 107.0, 151.0, 283.0, 608.0, 2031.0, 10866.0, 95935.0, 2735552.0, 1281536.0, 57001.0, 7132.0, 1537.0, 509.0, 261.0, 122.0, 105.0, 62.0, 59.0, 42.0, 30.0, 16.0, 10.0, 16.0, 10.0, 5.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.291015625, -9.99609375, -9.701171875, -9.40625, -9.111328125, -8.81640625, -8.521484375, -8.2265625, -7.931640625, -7.63671875, -7.341796875, -7.046875, -6.751953125, -6.45703125, -6.162109375, -5.8671875, -5.572265625, -5.27734375, -4.982421875, -4.6875, -4.392578125, -4.09765625, -3.802734375, -3.5078125, -3.212890625, -2.91796875, -2.623046875, -2.328125, -2.033203125, -1.73828125, -1.443359375, -1.1484375, -0.853515625, -0.55859375, -0.263671875, 0.03125, 0.326171875, 0.62109375, 0.916015625, 1.2109375, 1.505859375, 1.80078125, 2.095703125, 2.390625, 2.685546875, 2.98046875, 3.275390625, 3.5703125, 3.865234375, 4.16015625, 4.455078125, 4.75, 5.044921875, 5.33984375, 5.634765625, 5.9296875, 6.224609375, 6.51953125, 6.814453125, 7.109375, 7.404296875, 7.69921875, 7.994140625, 8.2890625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 10.0, 14.0, 26.0, 45.0, 85.0, 150.0, 207.0, 193.0, 125.0, 74.0, 46.0, 23.0, 7.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.37080383300781, -37.41209030151367, -36.453372955322266, -35.494659423828125, -34.535945892333984, -33.57722854614258, -32.61851501464844, -31.659799575805664, -30.70108413696289, -29.742368698120117, -28.783655166625977, -27.824939727783203, -26.86622428894043, -25.907508850097656, -24.948795318603516, -23.990079879760742, -23.0313663482666, -22.072650909423828, -21.113937377929688, -20.155221939086914, -19.19650650024414, -18.23779296875, -17.279077529907227, -16.320362091064453, -15.361647605895996, -14.402933120727539, -13.444217681884766, -12.485503196716309, -11.526788711547852, -10.568073272705078, -9.609358787536621, -8.650644302368164, -7.691930770874023, -6.733215808868408, -5.774500846862793, -4.815786361694336, -3.8570713996887207, -2.8983564376831055, -1.9396419525146484, -0.9809269905090332, -0.02221202850341797, 0.9365028142929077, 1.8952176570892334, 2.8539323806762695, 3.8126473426818848, 4.7713623046875, 5.730076789855957, 6.688791751861572, 7.6475067138671875, 8.606221199035645, 9.564936637878418, 10.523651123046875, 11.482366561889648, 12.441081047058105, 13.399795532226562, 14.358510971069336, 15.317225456237793, 16.27593994140625, 17.234655380249023, 18.193370819091797, 19.152084350585938, 20.11079978942871, 21.069515228271484, 22.028228759765625, 22.9869441986084]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 9.0, 16.0, 16.0, 17.0, 11.0, 14.0, 26.0, 22.0, 23.0, 27.0, 25.0, 40.0, 31.0, 35.0, 36.0, 41.0, 41.0, 53.0, 29.0, 46.0, 33.0, 36.0, 36.0, 33.0, 27.0, 28.0, 27.0, 25.0, 26.0, 27.0, 14.0, 13.0, 10.0, 10.0, 9.0, 13.0, 6.0, 6.0, 13.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.077351570129395, -9.769559860229492, -9.461769104003906, -9.153977394104004, -8.846185684204102, -8.538394927978516, -8.230603218078613, -7.922811508178711, -7.615020275115967, -7.307229042053223, -6.99943733215332, -6.691646099090576, -6.383854866027832, -6.07606315612793, -5.7682719230651855, -5.460480690002441, -5.152688980102539, -4.844897747039795, -4.537106037139893, -4.229314804077148, -3.921523332595825, -3.613731861114502, -3.305940628051758, -2.9981491565704346, -2.6903576850891113, -2.382566213607788, -2.074774742126465, -1.7669835090637207, -1.4591920375823975, -1.1514005661010742, -0.8436092138290405, -0.5358178615570068, -0.2280254364013672, 0.07976597547531128, 0.38755738735198975, 0.6953487992286682, 1.0031402111053467, 1.31093168258667, 1.6187230348587036, 1.9265143871307373, 2.2343058586120605, 2.542097330093384, 2.849888801574707, 3.157680034637451, 3.4654715061187744, 3.7732629776000977, 4.081054210662842, 4.388845443725586, 4.696637153625488, 5.004428386688232, 5.312220096588135, 5.620011329650879, 5.927803039550781, 6.235594272613525, 6.5433855056762695, 6.851177215576172, 7.158968448638916, 7.46675968170166, 7.7745513916015625, 8.082343101501465, 8.39013385772705, 8.697925567626953, 9.005717277526855, 9.313508033752441, 9.621299743652344]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 17.0, 8.0, 12.0, 18.0, 24.0, 31.0, 31.0, 33.0, 39.0, 50.0, 65.0, 56.0, 58.0, 56.0, 57.0, 53.0, 60.0, 65.0, 46.0, 46.0, 34.0, 37.0, 29.0, 15.0, 20.0, 16.0, 4.0, 7.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0], "bins": [-2.7734375, -2.710174560546875, -2.64691162109375, -2.583648681640625, -2.5203857421875, -2.457122802734375, -2.39385986328125, -2.330596923828125, -2.267333984375, -2.204071044921875, -2.14080810546875, -2.077545166015625, -2.0142822265625, -1.951019287109375, -1.88775634765625, -1.824493408203125, -1.76123046875, -1.697967529296875, -1.63470458984375, -1.571441650390625, -1.5081787109375, -1.444915771484375, -1.38165283203125, -1.318389892578125, -1.255126953125, -1.191864013671875, -1.12860107421875, -1.065338134765625, -1.0020751953125, -0.938812255859375, -0.87554931640625, -0.812286376953125, -0.7490234375, -0.685760498046875, -0.62249755859375, -0.559234619140625, -0.4959716796875, -0.432708740234375, -0.36944580078125, -0.306182861328125, -0.242919921875, -0.179656982421875, -0.11639404296875, -0.053131103515625, 0.0101318359375, 0.073394775390625, 0.13665771484375, 0.199920654296875, 0.26318359375, 0.326446533203125, 0.38970947265625, 0.452972412109375, 0.5162353515625, 0.579498291015625, 0.64276123046875, 0.706024169921875, 0.769287109375, 0.832550048828125, 0.89581298828125, 0.959075927734375, 1.0223388671875, 1.085601806640625, 1.14886474609375, 1.212127685546875, 1.275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 14.0, 7.0, 12.0, 20.0, 44.0, 66.0, 144.0, 300.0, 616.0, 1715.0, 4784.0, 13293.0, 38175.0, 105157.0, 229050.0, 305972.0, 207756.0, 90395.0, 33169.0, 11267.0, 4024.0, 1497.0, 585.0, 229.0, 112.0, 44.0, 28.0, 27.0, 14.0, 8.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5215301513671875, -1.469818115234375, -1.4181060791015625, -1.36639404296875, -1.3146820068359375, -1.262969970703125, -1.2112579345703125, -1.1595458984375, -1.1078338623046875, -1.056121826171875, -1.0044097900390625, -0.95269775390625, -0.9009857177734375, -0.849273681640625, -0.7975616455078125, -0.745849609375, -0.6941375732421875, -0.642425537109375, -0.5907135009765625, -0.53900146484375, -0.4872894287109375, -0.435577392578125, -0.3838653564453125, -0.3321533203125, -0.2804412841796875, -0.228729248046875, -0.1770172119140625, -0.12530517578125, -0.0735931396484375, -0.021881103515625, 0.0298309326171875, 0.08154296875, 0.1332550048828125, 0.184967041015625, 0.2366790771484375, 0.28839111328125, 0.3401031494140625, 0.391815185546875, 0.4435272216796875, 0.4952392578125, 0.5469512939453125, 0.598663330078125, 0.6503753662109375, 0.70208740234375, 0.7537994384765625, 0.805511474609375, 0.8572235107421875, 0.908935546875, 0.9606475830078125, 1.012359619140625, 1.0640716552734375, 1.11578369140625, 1.1674957275390625, 1.219207763671875, 1.2709197998046875, 1.3226318359375, 1.3743438720703125, 1.426055908203125, 1.4777679443359375, 1.52947998046875, 1.5811920166015625, 1.632904052734375, 1.6846160888671875, 1.736328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 6.0, 5.0, 7.0, 15.0, 11.0, 18.0, 20.0, 21.0, 33.0, 35.0, 43.0, 35.0, 42.0, 44.0, 40.0, 47.0, 1066.0, 56.0, 54.0, 48.0, 49.0, 40.0, 43.0, 29.0, 29.0, 37.0, 24.0, 29.0, 16.0, 17.0, 18.0, 11.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32708740234375, -1.2840576171875, -1.24102783203125, -1.197998046875, -1.15496826171875, -1.1119384765625, -1.06890869140625, -1.02587890625, -0.98284912109375, -0.9398193359375, -0.89678955078125, -0.853759765625, -0.81072998046875, -0.7677001953125, -0.72467041015625, -0.681640625, -0.63861083984375, -0.5955810546875, -0.55255126953125, -0.509521484375, -0.46649169921875, -0.4234619140625, -0.38043212890625, -0.33740234375, -0.29437255859375, -0.2513427734375, -0.20831298828125, -0.165283203125, -0.12225341796875, -0.0792236328125, -0.03619384765625, 0.0068359375, 0.04986572265625, 0.0928955078125, 0.13592529296875, 0.178955078125, 0.22198486328125, 0.2650146484375, 0.30804443359375, 0.35107421875, 0.39410400390625, 0.4371337890625, 0.48016357421875, 0.523193359375, 0.56622314453125, 0.6092529296875, 0.65228271484375, 0.6953125, 0.73834228515625, 0.7813720703125, 0.82440185546875, 0.867431640625, 0.91046142578125, 0.9534912109375, 0.99652099609375, 1.03955078125, 1.08258056640625, 1.1256103515625, 1.16864013671875, 1.211669921875, 1.25469970703125, 1.2977294921875, 1.34075927734375, 1.3837890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 9.0, 5.0, 9.0, 17.0, 25.0, 29.0, 42.0, 84.0, 114.0, 197.0, 284.0, 452.0, 676.0, 1013.0, 1574.0, 2515.0, 3828.0, 5957.0, 9232.0, 14846.0, 26090.0, 72936.0, 1311719.0, 528616.0, 56340.0, 23145.0, 13476.0, 8493.0, 5540.0, 3542.0, 2270.0, 1411.0, 916.0, 610.0, 363.0, 268.0, 168.0, 112.0, 74.0, 41.0, 31.0, 24.0, 14.0, 9.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9939422607421875, -0.959564208984375, -0.9251861572265625, -0.89080810546875, -0.8564300537109375, -0.822052001953125, -0.7876739501953125, -0.7532958984375, -0.7189178466796875, -0.684539794921875, -0.6501617431640625, -0.61578369140625, -0.5814056396484375, -0.547027587890625, -0.5126495361328125, -0.478271484375, -0.4438934326171875, -0.409515380859375, -0.3751373291015625, -0.34075927734375, -0.3063812255859375, -0.272003173828125, -0.2376251220703125, -0.2032470703125, -0.1688690185546875, -0.134490966796875, -0.1001129150390625, -0.06573486328125, -0.0313568115234375, 0.003021240234375, 0.0373992919921875, 0.07177734375, 0.1061553955078125, 0.140533447265625, 0.1749114990234375, 0.20928955078125, 0.2436676025390625, 0.278045654296875, 0.3124237060546875, 0.3468017578125, 0.3811798095703125, 0.415557861328125, 0.4499359130859375, 0.48431396484375, 0.5186920166015625, 0.553070068359375, 0.5874481201171875, 0.621826171875, 0.6562042236328125, 0.690582275390625, 0.7249603271484375, 0.75933837890625, 0.7937164306640625, 0.828094482421875, 0.8624725341796875, 0.8968505859375, 0.9312286376953125, 0.965606689453125, 0.9999847412109375, 1.03436279296875, 1.0687408447265625, 1.103118896484375, 1.1374969482421875, 1.171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 6.0, 16.0, 4.0, 11.0, 25.0, 25.0, 37.0, 64.0, 80.0, 105.0, 116.0, 91.0, 97.0, 74.0, 64.0, 36.0, 27.0, 18.0, 20.0, 19.0, 7.0, 2.0, 4.0, 7.0, 2.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11663818359375, -0.11246013641357422, -0.10828208923339844, -0.10410404205322266, -0.09992599487304688, -0.0957479476928711, -0.09156990051269531, -0.08739185333251953, -0.08321380615234375, -0.07903575897216797, -0.07485771179199219, -0.0706796646118164, -0.06650161743164062, -0.062323570251464844, -0.05814552307128906, -0.05396747589111328, -0.0497894287109375, -0.04561138153076172, -0.04143333435058594, -0.037255287170410156, -0.033077239990234375, -0.028899192810058594, -0.024721145629882812, -0.02054309844970703, -0.01636505126953125, -0.012187004089355469, -0.008008956909179688, -0.0038309097290039062, 0.000347137451171875, 0.004525184631347656, 0.008703231811523438, 0.012881278991699219, 0.017059326171875, 0.02123737335205078, 0.025415420532226562, 0.029593467712402344, 0.033771514892578125, 0.037949562072753906, 0.04212760925292969, 0.04630565643310547, 0.05048370361328125, 0.05466175079345703, 0.05883979797363281, 0.0630178451538086, 0.06719589233398438, 0.07137393951416016, 0.07555198669433594, 0.07973003387451172, 0.0839080810546875, 0.08808612823486328, 0.09226417541503906, 0.09644222259521484, 0.10062026977539062, 0.1047983169555664, 0.10897636413574219, 0.11315441131591797, 0.11733245849609375, 0.12151050567626953, 0.1256885528564453, 0.1298666000366211, 0.13404464721679688, 0.13822269439697266, 0.14240074157714844, 0.14657878875732422, 0.1507568359375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 8.0, 6.0, 9.0, 7.0, 23.0, 15.0, 30.0, 34.0, 51.0, 73.0, 129.0, 279.0, 1245.0, 17482.0, 979857.0, 46290.0, 2200.0, 369.0, 160.0, 74.0, 56.0, 41.0, 16.0, 13.0, 18.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.50390625, -2.435516357421875, -2.36712646484375, -2.298736572265625, -2.2303466796875, -2.161956787109375, -2.09356689453125, -2.025177001953125, -1.956787109375, -1.888397216796875, -1.82000732421875, -1.751617431640625, -1.6832275390625, -1.614837646484375, -1.54644775390625, -1.478057861328125, -1.40966796875, -1.341278076171875, -1.27288818359375, -1.204498291015625, -1.1361083984375, -1.067718505859375, -0.99932861328125, -0.930938720703125, -0.862548828125, -0.794158935546875, -0.72576904296875, -0.657379150390625, -0.5889892578125, -0.520599365234375, -0.45220947265625, -0.383819580078125, -0.3154296875, -0.247039794921875, -0.17864990234375, -0.110260009765625, -0.0418701171875, 0.026519775390625, 0.09490966796875, 0.163299560546875, 0.231689453125, 0.300079345703125, 0.36846923828125, 0.436859130859375, 0.5052490234375, 0.573638916015625, 0.64202880859375, 0.710418701171875, 0.77880859375, 0.847198486328125, 0.91558837890625, 0.983978271484375, 1.0523681640625, 1.120758056640625, 1.18914794921875, 1.257537841796875, 1.325927734375, 1.394317626953125, 1.46270751953125, 1.531097412109375, 1.5994873046875, 1.667877197265625, 1.73626708984375, 1.804656982421875, 1.873046875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 34.0, 113.0, 447.0, 319.0, 78.0, 15.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3178937435150146, -1.2626017332077026, -1.2073097229003906, -1.1520177125930786, -1.0967257022857666, -1.0414336919784546, -0.9861416816711426, -0.9308496713638306, -0.8755576610565186, -0.8202656507492065, -0.7649736404418945, -0.7096816301345825, -0.6543896198272705, -0.5990976095199585, -0.5438055992126465, -0.4885135889053345, -0.43322157859802246, -0.37792956829071045, -0.32263755798339844, -0.2673455476760864, -0.21205353736877441, -0.1567615270614624, -0.10146951675415039, -0.04617750644683838, 0.009114503860473633, 0.06440651416778564, 0.11969852447509766, 0.17499053478240967, 0.23028254508972168, 0.2855745553970337, 0.3408665657043457, 0.3961585760116577, 0.4514505863189697, 0.5067425966262817, 0.5620346069335938, 0.6173266172409058, 0.6726186275482178, 0.7279106378555298, 0.7832026481628418, 0.8384946584701538, 0.8937866687774658, 0.9490786790847778, 1.0043706893920898, 1.0596626996994019, 1.1149547100067139, 1.1702467203140259, 1.225538730621338, 1.28083074092865, 1.336122751235962, 1.391414761543274, 1.446706771850586, 1.501998782157898, 1.55729079246521, 1.612582802772522, 1.667874813079834, 1.723166823387146, 1.778458833694458, 1.83375084400177, 1.889042854309082, 1.944334864616394, 1.999626874923706, 2.0549187660217285, 2.11021089553833, 2.1655030250549316, 2.220794916152954]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 5.0, 12.0, 14.0, 13.0, 22.0, 31.0, 39.0, 39.0, 31.0, 56.0, 55.0, 57.0, 60.0, 69.0, 68.0, 58.0, 53.0, 53.0, 49.0, 45.0, 39.0, 28.0, 29.0, 23.0, 15.0, 13.0, 5.0, 7.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.4890289306640625, -0.4769285023212433, -0.46482810378074646, -0.45272767543792725, -0.4406272768974304, -0.4285268485546112, -0.416426420211792, -0.40432602167129517, -0.39222559332847595, -0.38012516498565674, -0.3680247664451599, -0.3559243381023407, -0.34382393956184387, -0.33172351121902466, -0.31962311267852783, -0.3075226843357086, -0.2954222559928894, -0.2833218276500702, -0.27122142910957336, -0.25912100076675415, -0.24702058732509613, -0.2349201738834381, -0.2228197604417801, -0.21071934700012207, -0.19861894845962524, -0.18651853501796722, -0.1744181215763092, -0.16231769323349, -0.15021727979183197, -0.13811686635017395, -0.12601645290851593, -0.11391603201627731, -0.1018156111240387, -0.08971519768238068, -0.07761477679014206, -0.06551436334848404, -0.05341394618153572, -0.0413135290145874, -0.029213115572929382, -0.017112694680690765, -0.005012281239032745, 0.0070881349965929985, 0.019188551232218742, 0.03128896653652191, 0.04338938370347023, 0.05548980087041855, 0.06759021431207657, 0.07969063520431519, 0.0917910486459732, 0.10389146208763123, 0.11599188297986984, 0.12809228897094727, 0.14019271731376648, 0.1522931307554245, 0.16439354419708252, 0.17649397253990173, 0.18859437108039856, 0.20069478452205658, 0.2127951979637146, 0.2248956263065338, 0.23699603974819183, 0.24909645318984985, 0.2611968517303467, 0.2732972800731659, 0.2853977084159851]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 7.0, 15.0, 11.0, 15.0, 20.0, 26.0, 24.0, 37.0, 42.0, 35.0, 58.0, 57.0, 51.0, 51.0, 62.0, 40.0, 42.0, 54.0, 50.0, 51.0, 48.0, 37.0, 31.0, 27.0, 23.0, 24.0, 14.0, 16.0, 5.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-2.30078125, -2.243133544921875, -2.18548583984375, -2.127838134765625, -2.0701904296875, -2.012542724609375, -1.95489501953125, -1.897247314453125, -1.839599609375, -1.781951904296875, -1.72430419921875, -1.666656494140625, -1.6090087890625, -1.551361083984375, -1.49371337890625, -1.436065673828125, -1.37841796875, -1.320770263671875, -1.26312255859375, -1.205474853515625, -1.1478271484375, -1.090179443359375, -1.03253173828125, -0.974884033203125, -0.917236328125, -0.859588623046875, -0.80194091796875, -0.744293212890625, -0.6866455078125, -0.628997802734375, -0.57135009765625, -0.513702392578125, -0.4560546875, -0.398406982421875, -0.34075927734375, -0.283111572265625, -0.2254638671875, -0.167816162109375, -0.11016845703125, -0.052520751953125, 0.005126953125, 0.062774658203125, 0.12042236328125, 0.178070068359375, 0.2357177734375, 0.293365478515625, 0.35101318359375, 0.408660888671875, 0.46630859375, 0.523956298828125, 0.58160400390625, 0.639251708984375, 0.6968994140625, 0.754547119140625, 0.81219482421875, 0.869842529296875, 0.927490234375, 0.985137939453125, 1.04278564453125, 1.100433349609375, 1.1580810546875, 1.215728759765625, 1.27337646484375, 1.331024169921875, 1.388671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 10.0, 13.0, 15.0, 27.0, 22.0, 47.0, 65.0, 118.0, 155.0, 281.0, 486.0, 952.0, 1933.0, 4221.0, 10191.0, 30103.0, 105209.0, 394514.0, 360890.0, 94341.0, 27732.0, 9528.0, 3879.0, 1732.0, 924.0, 476.0, 236.0, 158.0, 92.0, 75.0, 42.0, 24.0, 22.0, 3.0, 8.0, 3.0, 8.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.791015625, -2.691192626953125, -2.59136962890625, -2.491546630859375, -2.3917236328125, -2.291900634765625, -2.19207763671875, -2.092254638671875, -1.992431640625, -1.892608642578125, -1.79278564453125, -1.692962646484375, -1.5931396484375, -1.493316650390625, -1.39349365234375, -1.293670654296875, -1.19384765625, -1.094024658203125, -0.99420166015625, -0.894378662109375, -0.7945556640625, -0.694732666015625, -0.59490966796875, -0.495086669921875, -0.395263671875, -0.295440673828125, -0.19561767578125, -0.095794677734375, 0.0040283203125, 0.103851318359375, 0.20367431640625, 0.303497314453125, 0.4033203125, 0.503143310546875, 0.60296630859375, 0.702789306640625, 0.8026123046875, 0.902435302734375, 1.00225830078125, 1.102081298828125, 1.201904296875, 1.301727294921875, 1.40155029296875, 1.501373291015625, 1.6011962890625, 1.701019287109375, 1.80084228515625, 1.900665283203125, 2.00048828125, 2.100311279296875, 2.20013427734375, 2.299957275390625, 2.3997802734375, 2.499603271484375, 2.59942626953125, 2.699249267578125, 2.799072265625, 2.898895263671875, 2.99871826171875, 3.098541259765625, 3.1983642578125, 3.298187255859375, 3.39801025390625, 3.497833251953125, 3.59765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 10.0, 15.0, 11.0, 22.0, 19.0, 37.0, 43.0, 28.0, 28.0, 68.0, 67.0, 74.0, 128.0, 213.0, 1423.0, 262.0, 151.0, 64.0, 63.0, 55.0, 31.0, 21.0, 31.0, 30.0, 23.0, 27.0, 17.0, 12.0, 16.0, 9.0, 6.0, 4.0, 4.0, 7.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.80859375, -5.64605712890625, -5.4835205078125, -5.32098388671875, -5.158447265625, -4.99591064453125, -4.8333740234375, -4.67083740234375, -4.50830078125, -4.34576416015625, -4.1832275390625, -4.02069091796875, -3.858154296875, -3.69561767578125, -3.5330810546875, -3.37054443359375, -3.2080078125, -3.04547119140625, -2.8829345703125, -2.72039794921875, -2.557861328125, -2.39532470703125, -2.2327880859375, -2.07025146484375, -1.90771484375, -1.74517822265625, -1.5826416015625, -1.42010498046875, -1.257568359375, -1.09503173828125, -0.9324951171875, -0.76995849609375, -0.607421875, -0.44488525390625, -0.2823486328125, -0.11981201171875, 0.042724609375, 0.20526123046875, 0.3677978515625, 0.53033447265625, 0.69287109375, 0.85540771484375, 1.0179443359375, 1.18048095703125, 1.343017578125, 1.50555419921875, 1.6680908203125, 1.83062744140625, 1.9931640625, 2.15570068359375, 2.3182373046875, 2.48077392578125, 2.643310546875, 2.80584716796875, 2.9683837890625, 3.13092041015625, 3.29345703125, 3.45599365234375, 3.6185302734375, 3.78106689453125, 3.943603515625, 4.10614013671875, 4.2686767578125, 4.43121337890625, 4.59375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 10.0, 17.0, 10.0, 22.0, 29.0, 40.0, 37.0, 77.0, 80.0, 103.0, 135.0, 156.0, 324.0, 761.0, 3720.0, 48759.0, 2769228.0, 310006.0, 9340.0, 1428.0, 482.0, 248.0, 179.0, 136.0, 87.0, 63.0, 40.0, 53.0, 31.0, 17.0, 20.0, 12.0, 12.0, 14.0, 5.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.0897216796875, -8.773193359375, -8.4566650390625, -8.14013671875, -7.8236083984375, -7.507080078125, -7.1905517578125, -6.8740234375, -6.5574951171875, -6.240966796875, -5.9244384765625, -5.60791015625, -5.2913818359375, -4.974853515625, -4.6583251953125, -4.341796875, -4.0252685546875, -3.708740234375, -3.3922119140625, -3.07568359375, -2.7591552734375, -2.442626953125, -2.1260986328125, -1.8095703125, -1.4930419921875, -1.176513671875, -0.8599853515625, -0.54345703125, -0.2269287109375, 0.089599609375, 0.4061279296875, 0.72265625, 1.0391845703125, 1.355712890625, 1.6722412109375, 1.98876953125, 2.3052978515625, 2.621826171875, 2.9383544921875, 3.2548828125, 3.5714111328125, 3.887939453125, 4.2044677734375, 4.52099609375, 4.8375244140625, 5.154052734375, 5.4705810546875, 5.787109375, 6.1036376953125, 6.420166015625, 6.7366943359375, 7.05322265625, 7.3697509765625, 7.686279296875, 8.0028076171875, 8.3193359375, 8.6358642578125, 8.952392578125, 9.2689208984375, 9.58544921875, 9.9019775390625, 10.218505859375, 10.5350341796875, 10.8515625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 90.0, 697.0, 216.0, 12.0], "bins": [-134.36468505859375, -132.18492126464844, -130.00514221191406, -127.82537841796875, -125.64561462402344, -123.4658432006836, -121.28607940673828, -119.10630798339844, -116.92654418945312, -114.74677276611328, -112.56700897216797, -110.38723754882812, -108.20747375488281, -106.02770233154297, -103.84793853759766, -101.66816711425781, -99.48839569091797, -97.30862426757812, -95.12886047363281, -92.94908905029297, -90.76932525634766, -88.58955383300781, -86.4097900390625, -84.23001861572266, -82.05024719238281, -79.87047576904297, -77.69071197509766, -75.51094055175781, -73.3311767578125, -71.15140533447266, -68.97164154052734, -66.7918701171875, -64.61210632324219, -62.43233871459961, -60.25257110595703, -58.07280349731445, -55.893035888671875, -53.71326446533203, -51.53349685668945, -49.353729248046875, -47.17395782470703, -44.99419021606445, -42.814422607421875, -40.6346549987793, -38.45488739013672, -36.275115966796875, -34.0953483581543, -31.91558074951172, -29.735815048217773, -27.556047439575195, -25.376277923583984, -23.196510314941406, -21.016742706298828, -18.83697509765625, -16.657207489013672, -14.477437973022461, -12.297670364379883, -10.117902755737305, -7.93813419342041, -5.758366107940674, -3.5785980224609375, -1.3988304138183594, 0.7809381484985352, 2.9607067108154297, 5.140474319458008]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 9.0, 7.0, 9.0, 10.0, 18.0, 13.0, 12.0, 13.0, 25.0, 29.0, 36.0, 27.0, 31.0, 35.0, 41.0, 42.0, 28.0, 35.0, 49.0, 45.0, 39.0, 41.0, 42.0, 30.0, 50.0, 36.0, 31.0, 37.0, 20.0, 23.0, 22.0, 12.0, 15.0, 24.0, 11.0, 9.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.524447441101074, -13.106252670288086, -12.688056945800781, -12.269862174987793, -11.851666450500488, -11.4334716796875, -11.015275955200195, -10.597081184387207, -10.178886413574219, -9.76069164276123, -9.342495918273926, -8.924301147460938, -8.506105422973633, -8.087910652160645, -7.669715404510498, -7.251520156860352, -6.833324909210205, -6.415129661560059, -5.996934413909912, -5.578739166259766, -5.160544395446777, -4.742349147796631, -4.324153900146484, -3.905958890914917, -3.4877636432647705, -3.069568395614624, -2.6513733863830566, -2.23317813873291, -1.8149830102920532, -1.3967878818511963, -0.9785926342010498, -0.5603976249694824, -0.14220237731933594, 0.2759927809238434, 0.6941879391670227, 1.1123831272125244, 1.5305782556533813, 1.9487733840942383, 2.3669686317443848, 2.785163640975952, 3.2033588886260986, 3.621554136276245, 4.0397491455078125, 4.457944393157959, 4.8761396408081055, 5.294334411621094, 5.712530136108398, 6.130724906921387, 6.548920154571533, 6.96711540222168, 7.385310649871826, 7.803505897521973, 8.221700668334961, 8.639896392822266, 9.058091163635254, 9.476285934448242, 9.894481658935547, 10.312676429748535, 10.73087215423584, 11.149066925048828, 11.567262649536133, 11.985457420349121, 12.40365219116211, 12.821847915649414, 13.240042686462402]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 13.0, 12.0, 15.0, 15.0, 27.0, 44.0, 37.0, 38.0, 50.0, 63.0, 55.0, 62.0, 58.0, 58.0, 53.0, 54.0, 71.0, 62.0, 26.0, 39.0, 28.0, 29.0, 17.0, 17.0, 19.0, 14.0, 5.0, 5.0, 9.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0], "bins": [-2.966796875, -2.8966064453125, -2.826416015625, -2.7562255859375, -2.68603515625, -2.6158447265625, -2.545654296875, -2.4754638671875, -2.4052734375, -2.3350830078125, -2.264892578125, -2.1947021484375, -2.12451171875, -2.0543212890625, -1.984130859375, -1.9139404296875, -1.84375, -1.7735595703125, -1.703369140625, -1.6331787109375, -1.56298828125, -1.4927978515625, -1.422607421875, -1.3524169921875, -1.2822265625, -1.2120361328125, -1.141845703125, -1.0716552734375, -1.00146484375, -0.9312744140625, -0.861083984375, -0.7908935546875, -0.720703125, -0.6505126953125, -0.580322265625, -0.5101318359375, -0.43994140625, -0.3697509765625, -0.299560546875, -0.2293701171875, -0.1591796875, -0.0889892578125, -0.018798828125, 0.0513916015625, 0.12158203125, 0.1917724609375, 0.261962890625, 0.3321533203125, 0.40234375, 0.4725341796875, 0.542724609375, 0.6129150390625, 0.68310546875, 0.7532958984375, 0.823486328125, 0.8936767578125, 0.9638671875, 1.0340576171875, 1.104248046875, 1.1744384765625, 1.24462890625, 1.3148193359375, 1.385009765625, 1.4552001953125, 1.525390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 16.0, 27.0, 37.0, 51.0, 114.0, 179.0, 333.0, 598.0, 1283.0, 2831.0, 6708.0, 19174.0, 74847.0, 624383.0, 2866093.0, 498922.0, 67850.0, 18894.0, 6712.0, 2723.0, 1237.0, 571.0, 306.0, 162.0, 82.0, 38.0, 35.0, 24.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.82867431640625, -4.6925048828125, -4.55633544921875, -4.420166015625, -4.28399658203125, -4.1478271484375, -4.01165771484375, -3.87548828125, -3.73931884765625, -3.6031494140625, -3.46697998046875, -3.330810546875, -3.19464111328125, -3.0584716796875, -2.92230224609375, -2.7861328125, -2.64996337890625, -2.5137939453125, -2.37762451171875, -2.241455078125, -2.10528564453125, -1.9691162109375, -1.83294677734375, -1.69677734375, -1.56060791015625, -1.4244384765625, -1.28826904296875, -1.152099609375, -1.01593017578125, -0.8797607421875, -0.74359130859375, -0.607421875, -0.47125244140625, -0.3350830078125, -0.19891357421875, -0.062744140625, 0.07342529296875, 0.2095947265625, 0.34576416015625, 0.48193359375, 0.61810302734375, 0.7542724609375, 0.89044189453125, 1.026611328125, 1.16278076171875, 1.2989501953125, 1.43511962890625, 1.5712890625, 1.70745849609375, 1.8436279296875, 1.97979736328125, 2.115966796875, 2.25213623046875, 2.3883056640625, 2.52447509765625, 2.66064453125, 2.79681396484375, 2.9329833984375, 3.06915283203125, 3.205322265625, 3.34149169921875, 3.4776611328125, 3.61383056640625, 3.75]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 3.0, 11.0, 8.0, 9.0, 12.0, 22.0, 25.0, 23.0, 55.0, 39.0, 60.0, 73.0, 116.0, 159.0, 208.0, 302.0, 445.0, 535.0, 538.0, 385.0, 272.0, 201.0, 138.0, 100.0, 86.0, 49.0, 36.0, 41.0, 25.0, 25.0, 11.0, 13.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-3.689453125, -3.58660888671875, -3.4837646484375, -3.38092041015625, -3.278076171875, -3.17523193359375, -3.0723876953125, -2.96954345703125, -2.86669921875, -2.76385498046875, -2.6610107421875, -2.55816650390625, -2.455322265625, -2.35247802734375, -2.2496337890625, -2.14678955078125, -2.0439453125, -1.94110107421875, -1.8382568359375, -1.73541259765625, -1.632568359375, -1.52972412109375, -1.4268798828125, -1.32403564453125, -1.22119140625, -1.11834716796875, -1.0155029296875, -0.91265869140625, -0.809814453125, -0.70697021484375, -0.6041259765625, -0.50128173828125, -0.3984375, -0.29559326171875, -0.1927490234375, -0.08990478515625, 0.012939453125, 0.11578369140625, 0.2186279296875, 0.32147216796875, 0.42431640625, 0.52716064453125, 0.6300048828125, 0.73284912109375, 0.835693359375, 0.93853759765625, 1.0413818359375, 1.14422607421875, 1.2470703125, 1.34991455078125, 1.4527587890625, 1.55560302734375, 1.658447265625, 1.76129150390625, 1.8641357421875, 1.96697998046875, 2.06982421875, 2.17266845703125, 2.2755126953125, 2.37835693359375, 2.481201171875, 2.58404541015625, 2.6868896484375, 2.78973388671875, 2.892578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 12.0, 15.0, 26.0, 22.0, 35.0, 56.0, 63.0, 101.0, 180.0, 306.0, 613.0, 1430.0, 5770.0, 36065.0, 530053.0, 3423588.0, 172690.0, 17536.0, 3443.0, 1094.0, 410.0, 244.0, 157.0, 89.0, 70.0, 40.0, 35.0, 31.0, 16.0, 16.0, 6.0, 10.0, 11.0, 4.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3046875, -8.011474609375, -7.71826171875, -7.425048828125, -7.1318359375, -6.838623046875, -6.54541015625, -6.252197265625, -5.958984375, -5.665771484375, -5.37255859375, -5.079345703125, -4.7861328125, -4.492919921875, -4.19970703125, -3.906494140625, -3.61328125, -3.320068359375, -3.02685546875, -2.733642578125, -2.4404296875, -2.147216796875, -1.85400390625, -1.560791015625, -1.267578125, -0.974365234375, -0.68115234375, -0.387939453125, -0.0947265625, 0.198486328125, 0.49169921875, 0.784912109375, 1.078125, 1.371337890625, 1.66455078125, 1.957763671875, 2.2509765625, 2.544189453125, 2.83740234375, 3.130615234375, 3.423828125, 3.717041015625, 4.01025390625, 4.303466796875, 4.5966796875, 4.889892578125, 5.18310546875, 5.476318359375, 5.76953125, 6.062744140625, 6.35595703125, 6.649169921875, 6.9423828125, 7.235595703125, 7.52880859375, 7.822021484375, 8.115234375, 8.408447265625, 8.70166015625, 8.994873046875, 9.2880859375, 9.581298828125, 9.87451171875, 10.167724609375, 10.4609375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 20.0, 46.0, 91.0, 180.0, 235.0, 205.0, 120.0, 62.0, 28.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.397518157958984, -32.31162643432617, -31.22573471069336, -30.139842987060547, -29.053951263427734, -27.968059539794922, -26.88216781616211, -25.796276092529297, -24.710384368896484, -23.624492645263672, -22.53860092163086, -21.452709197998047, -20.366817474365234, -19.280925750732422, -18.19503402709961, -17.109142303466797, -16.023250579833984, -14.937358856201172, -13.85146713256836, -12.765575408935547, -11.679683685302734, -10.593791961669922, -9.50790023803711, -8.422008514404297, -7.336116790771484, -6.250225067138672, -5.164333343505859, -4.078441619873047, -2.9925498962402344, -1.9066581726074219, -0.8207664489746094, 0.2651252746582031, 1.3510169982910156, 2.436908721923828, 3.5228004455566406, 4.608692169189453, 5.694583892822266, 6.780475616455078, 7.866367340087891, 8.952259063720703, 10.038150787353516, 11.124042510986328, 12.20993423461914, 13.295825958251953, 14.381717681884766, 15.467609405517578, 16.55350112915039, 17.639392852783203, 18.725284576416016, 19.811176300048828, 20.89706802368164, 21.982959747314453, 23.068851470947266, 24.154743194580078, 25.24063491821289, 26.326526641845703, 27.412418365478516, 28.498310089111328, 29.58420181274414, 30.670093536376953, 31.755985260009766, 32.84187698364258, 33.92776870727539, 35.0136604309082, 36.099552154541016]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 16.0, 12.0, 7.0, 14.0, 22.0, 30.0, 22.0, 29.0, 36.0, 40.0, 40.0, 49.0, 47.0, 56.0, 44.0, 54.0, 59.0, 55.0, 49.0, 34.0, 51.0, 44.0, 33.0, 33.0, 25.0, 19.0, 23.0, 16.0, 8.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.893991470336914, -16.441286087036133, -15.988581657409668, -15.535876274108887, -15.083171844482422, -14.63046646118164, -14.17776107788086, -13.725056648254395, -13.272351264953613, -12.819645881652832, -12.366941452026367, -11.914236068725586, -11.461531639099121, -11.00882625579834, -10.556121826171875, -10.103416442871094, -9.650711059570312, -9.198005676269531, -8.745301246643066, -8.292595863342285, -7.839890956878662, -7.387186050415039, -6.934481143951416, -6.481776237487793, -6.029071807861328, -5.576366901397705, -5.123661994934082, -4.670956611633301, -4.218251705169678, -3.7655467987060547, -3.3128418922424316, -2.8601367473602295, -2.4074316024780273, -1.9547265768051147, -1.5020215511322021, -1.049316644668579, -0.5966116189956665, -0.1439065933227539, 0.30879831314086914, 0.7615034580230713, 1.2142083644866943, 1.666913390159607, 2.1196184158325195, 2.5723233222961426, 3.0250282287597656, 3.4777333736419678, 3.930438280105591, 4.383143424987793, 4.835848331451416, 5.288553237915039, 5.741258144378662, 6.193963050842285, 6.646668434143066, 7.0993733406066895, 7.5520782470703125, 8.004783630371094, 8.457488059997559, 8.91019344329834, 9.362897872924805, 9.815603256225586, 10.26830768585205, 10.721013069152832, 11.173717498779297, 11.626422882080078, 12.07912826538086]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 14.0, 19.0, 28.0, 30.0, 36.0, 33.0, 54.0, 45.0, 55.0, 55.0, 70.0, 55.0, 58.0, 46.0, 68.0, 44.0, 53.0, 40.0, 34.0, 36.0, 22.0, 19.0, 17.0, 17.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.5405731201171875, -2.473724365234375, -2.4068756103515625, -2.34002685546875, -2.2731781005859375, -2.206329345703125, -2.1394805908203125, -2.0726318359375, -2.0057830810546875, -1.938934326171875, -1.8720855712890625, -1.80523681640625, -1.7383880615234375, -1.671539306640625, -1.6046905517578125, -1.537841796875, -1.4709930419921875, -1.404144287109375, -1.3372955322265625, -1.27044677734375, -1.2035980224609375, -1.136749267578125, -1.0699005126953125, -1.0030517578125, -0.9362030029296875, -0.869354248046875, -0.8025054931640625, -0.73565673828125, -0.6688079833984375, -0.601959228515625, -0.5351104736328125, -0.46826171875, -0.4014129638671875, -0.334564208984375, -0.2677154541015625, -0.20086669921875, -0.1340179443359375, -0.067169189453125, -0.0003204345703125, 0.0665283203125, 0.1333770751953125, 0.200225830078125, 0.2670745849609375, 0.33392333984375, 0.4007720947265625, 0.467620849609375, 0.5344696044921875, 0.601318359375, 0.6681671142578125, 0.735015869140625, 0.8018646240234375, 0.86871337890625, 0.9355621337890625, 1.002410888671875, 1.0692596435546875, 1.1361083984375, 1.2029571533203125, 1.269805908203125, 1.3366546630859375, 1.40350341796875, 1.4703521728515625, 1.537200927734375, 1.6040496826171875, 1.6708984375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 11.0, 11.0, 21.0, 21.0, 50.0, 76.0, 90.0, 155.0, 244.0, 374.0, 670.0, 1070.0, 1974.0, 3733.0, 7343.0, 15197.0, 32493.0, 69858.0, 144586.0, 246136.0, 245936.0, 144736.0, 70301.0, 32589.0, 15184.0, 7248.0, 3610.0, 1995.0, 1122.0, 620.0, 374.0, 240.0, 157.0, 92.0, 79.0, 55.0, 29.0, 23.0, 19.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1416015625, -1.105926513671875, -1.07025146484375, -1.034576416015625, -0.9989013671875, -0.963226318359375, -0.92755126953125, -0.891876220703125, -0.856201171875, -0.820526123046875, -0.78485107421875, -0.749176025390625, -0.7135009765625, -0.677825927734375, -0.64215087890625, -0.606475830078125, -0.57080078125, -0.535125732421875, -0.49945068359375, -0.463775634765625, -0.4281005859375, -0.392425537109375, -0.35675048828125, -0.321075439453125, -0.285400390625, -0.249725341796875, -0.21405029296875, -0.178375244140625, -0.1427001953125, -0.107025146484375, -0.07135009765625, -0.035675048828125, 0.0, 0.035675048828125, 0.07135009765625, 0.107025146484375, 0.1427001953125, 0.178375244140625, 0.21405029296875, 0.249725341796875, 0.285400390625, 0.321075439453125, 0.35675048828125, 0.392425537109375, 0.4281005859375, 0.463775634765625, 0.49945068359375, 0.535125732421875, 0.57080078125, 0.606475830078125, 0.64215087890625, 0.677825927734375, 0.7135009765625, 0.749176025390625, 0.78485107421875, 0.820526123046875, 0.856201171875, 0.891876220703125, 0.92755126953125, 0.963226318359375, 0.9989013671875, 1.034576416015625, 1.07025146484375, 1.105926513671875, 1.1416015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 1.0, 17.0, 5.0, 15.0, 12.0, 15.0, 11.0, 19.0, 16.0, 23.0, 30.0, 26.0, 43.0, 40.0, 42.0, 47.0, 46.0, 34.0, 1067.0, 54.0, 41.0, 32.0, 43.0, 28.0, 37.0, 43.0, 25.0, 26.0, 38.0, 26.0, 22.0, 21.0, 16.0, 10.0, 14.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.226226806640625, -1.18389892578125, -1.141571044921875, -1.0992431640625, -1.056915283203125, -1.01458740234375, -0.972259521484375, -0.929931640625, -0.887603759765625, -0.84527587890625, -0.802947998046875, -0.7606201171875, -0.718292236328125, -0.67596435546875, -0.633636474609375, -0.59130859375, -0.548980712890625, -0.50665283203125, -0.464324951171875, -0.4219970703125, -0.379669189453125, -0.33734130859375, -0.295013427734375, -0.252685546875, -0.210357666015625, -0.16802978515625, -0.125701904296875, -0.0833740234375, -0.041046142578125, 0.00128173828125, 0.043609619140625, 0.0859375, 0.128265380859375, 0.17059326171875, 0.212921142578125, 0.2552490234375, 0.297576904296875, 0.33990478515625, 0.382232666015625, 0.424560546875, 0.466888427734375, 0.50921630859375, 0.551544189453125, 0.5938720703125, 0.636199951171875, 0.67852783203125, 0.720855712890625, 0.76318359375, 0.805511474609375, 0.84783935546875, 0.890167236328125, 0.9324951171875, 0.974822998046875, 1.01715087890625, 1.059478759765625, 1.101806640625, 1.144134521484375, 1.18646240234375, 1.228790283203125, 1.2711181640625, 1.313446044921875, 1.35577392578125, 1.398101806640625, 1.4404296875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 14.0, 19.0, 22.0, 33.0, 37.0, 58.0, 92.0, 159.0, 196.0, 308.0, 419.0, 674.0, 956.0, 1361.0, 2142.0, 3104.0, 4850.0, 7674.0, 12469.0, 21644.0, 48651.0, 285415.0, 1514618.0, 113467.0, 32843.0, 17030.0, 10130.0, 6392.0, 4076.0, 2724.0, 1856.0, 1211.0, 809.0, 536.0, 360.0, 238.0, 156.0, 113.0, 99.0, 51.0, 33.0, 29.0, 19.0, 18.0, 4.0, 8.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.099609375, -1.0675430297851562, -1.0354766845703125, -1.0034103393554688, -0.971343994140625, -0.9392776489257812, -0.9072113037109375, -0.8751449584960938, -0.84307861328125, -0.8110122680664062, -0.7789459228515625, -0.7468795776367188, -0.714813232421875, -0.6827468872070312, -0.6506805419921875, -0.6186141967773438, -0.5865478515625, -0.5544815063476562, -0.5224151611328125, -0.49034881591796875, -0.458282470703125, -0.42621612548828125, -0.3941497802734375, -0.36208343505859375, -0.33001708984375, -0.29795074462890625, -0.2658843994140625, -0.23381805419921875, -0.201751708984375, -0.16968536376953125, -0.1376190185546875, -0.10555267333984375, -0.073486328125, -0.04141998291015625, -0.0093536376953125, 0.02271270751953125, 0.054779052734375, 0.08684539794921875, 0.1189117431640625, 0.15097808837890625, 0.18304443359375, 0.21511077880859375, 0.2471771240234375, 0.27924346923828125, 0.311309814453125, 0.34337615966796875, 0.3754425048828125, 0.40750885009765625, 0.4395751953125, 0.47164154052734375, 0.5037078857421875, 0.5357742309570312, 0.567840576171875, 0.5999069213867188, 0.6319732666015625, 0.6640396118164062, 0.69610595703125, 0.7281723022460938, 0.7602386474609375, 0.7923049926757812, 0.824371337890625, 0.8564376831054688, 0.8885040283203125, 0.9205703735351562, 0.95263671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 16.0, 32.0, 42.0, 48.0, 98.0, 110.0, 163.0, 146.0, 112.0, 75.0, 51.0, 25.0, 25.0, 17.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.258544921875, -0.25188255310058594, -0.24522018432617188, -0.2385578155517578, -0.23189544677734375, -0.2252330780029297, -0.21857070922851562, -0.21190834045410156, -0.2052459716796875, -0.19858360290527344, -0.19192123413085938, -0.1852588653564453, -0.17859649658203125, -0.1719341278076172, -0.16527175903320312, -0.15860939025878906, -0.151947021484375, -0.14528465270996094, -0.13862228393554688, -0.1319599151611328, -0.12529754638671875, -0.11863517761230469, -0.11197280883789062, -0.10531044006347656, -0.0986480712890625, -0.09198570251464844, -0.08532333374023438, -0.07866096496582031, -0.07199859619140625, -0.06533622741699219, -0.058673858642578125, -0.05201148986816406, -0.04534912109375, -0.03868675231933594, -0.032024383544921875, -0.025362014770507812, -0.01869964599609375, -0.012037277221679688, -0.005374908447265625, 0.0012874603271484375, 0.0079498291015625, 0.014612197875976562, 0.021274566650390625, 0.027936935424804688, 0.03459930419921875, 0.04126167297363281, 0.047924041748046875, 0.05458641052246094, 0.061248779296875, 0.06791114807128906, 0.07457351684570312, 0.08123588562011719, 0.08789825439453125, 0.09456062316894531, 0.10122299194335938, 0.10788536071777344, 0.1145477294921875, 0.12121009826660156, 0.12787246704101562, 0.1345348358154297, 0.14119720458984375, 0.1478595733642578, 0.15452194213867188, 0.16118431091308594, 0.1678466796875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 13.0, 21.0, 33.0, 43.0, 95.0, 200.0, 1350.0, 883465.0, 162181.0, 765.0, 159.0, 84.0, 47.0, 33.0, 20.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.6171875, -3.47760009765625, -3.3380126953125, -3.19842529296875, -3.058837890625, -2.91925048828125, -2.7796630859375, -2.64007568359375, -2.50048828125, -2.36090087890625, -2.2213134765625, -2.08172607421875, -1.942138671875, -1.80255126953125, -1.6629638671875, -1.52337646484375, -1.3837890625, -1.24420166015625, -1.1046142578125, -0.96502685546875, -0.825439453125, -0.68585205078125, -0.5462646484375, -0.40667724609375, -0.26708984375, -0.12750244140625, 0.0120849609375, 0.15167236328125, 0.291259765625, 0.43084716796875, 0.5704345703125, 0.71002197265625, 0.849609375, 0.98919677734375, 1.1287841796875, 1.26837158203125, 1.407958984375, 1.54754638671875, 1.6871337890625, 1.82672119140625, 1.96630859375, 2.10589599609375, 2.2454833984375, 2.38507080078125, 2.524658203125, 2.66424560546875, 2.8038330078125, 2.94342041015625, 3.0830078125, 3.22259521484375, 3.3621826171875, 3.50177001953125, 3.641357421875, 3.78094482421875, 3.9205322265625, 4.06011962890625, 4.19970703125, 4.33929443359375, 4.4788818359375, 4.61846923828125, 4.758056640625, 4.89764404296875, 5.0372314453125, 5.17681884765625, 5.31640625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 21.0, 76.0, 231.0, 431.0, 175.0, 46.0, 19.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8177696466445923, -1.763284683227539, -1.7087998390197754, -1.6543148756027222, -1.599829912185669, -1.5453450679779053, -1.490860104560852, -1.4363751411437988, -1.3818902969360352, -1.327405333518982, -1.2729204893112183, -1.218435525894165, -1.1639506816864014, -1.1094657182693481, -1.054980754852295, -1.0004959106445312, -0.946010947227478, -0.8915260434150696, -0.8370411396026611, -0.7825561761856079, -0.7280712723731995, -0.673586368560791, -0.6191014051437378, -0.5646165013313293, -0.5101315975189209, -0.45564669370651245, -0.4011617600917816, -0.3466768264770508, -0.29219192266464233, -0.2377070188522339, -0.18322208523750305, -0.12873715162277222, -0.07425224781036377, -0.01976732909679413, 0.03471758961677551, 0.08920250833034515, 0.1436874270439148, 0.19817233085632324, 0.2526572644710541, 0.3071421980857849, 0.36162710189819336, 0.4161120057106018, 0.47059693932533264, 0.5250818729400635, 0.5795667767524719, 0.6340516805648804, 0.6885366439819336, 0.743021547794342, 0.7975064516067505, 0.8519913554191589, 0.9064762592315674, 0.9609612226486206, 1.0154461860656738, 1.0699310302734375, 1.1244159936904907, 1.178900957107544, 1.2333858013153076, 1.2878707647323608, 1.3423556089401245, 1.3968405723571777, 1.4513254165649414, 1.5058103799819946, 1.5602953433990479, 1.6147801876068115, 1.6692651510238647]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 8.0, 6.0, 13.0, 9.0, 19.0, 31.0, 23.0, 36.0, 50.0, 40.0, 41.0, 58.0, 51.0, 54.0, 56.0, 41.0, 49.0, 47.0, 52.0, 48.0, 53.0, 37.0, 35.0, 24.0, 21.0, 24.0, 17.0, 11.0, 8.0, 9.0, 11.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4721947908401489, -0.4602656066417694, -0.4483364224433899, -0.43640726804733276, -0.42447808384895325, -0.41254889965057373, -0.4006197452545166, -0.3886905610561371, -0.37676137685775757, -0.36483219265937805, -0.35290300846099854, -0.3409738540649414, -0.3290446698665619, -0.3171154856681824, -0.30518633127212524, -0.2932571470737457, -0.2813279628753662, -0.2693987786769867, -0.2574695944786072, -0.24554044008255005, -0.23361125588417053, -0.22168207168579102, -0.2097529023885727, -0.19782373309135437, -0.18589454889297485, -0.17396536469459534, -0.16203619539737701, -0.1501070261001587, -0.13817784190177917, -0.12624865770339966, -0.11431948840618134, -0.10239031165838242, -0.0904611349105835, -0.07853195816278458, -0.06660278141498566, -0.05467360466718674, -0.04274442791938782, -0.030815251171588898, -0.018886074423789978, -0.006956897675991058, 0.004972279071807861, 0.01690145581960678, 0.0288306325674057, 0.04075980931520462, 0.05268898606300354, 0.06461816281080246, 0.07654733955860138, 0.0884765163064003, 0.10040569305419922, 0.11233486980199814, 0.12426404654979706, 0.13619321584701538, 0.1481224000453949, 0.16005158424377441, 0.17198075354099274, 0.18390992283821106, 0.19583910703659058, 0.2077682912349701, 0.21969746053218842, 0.23162662982940674, 0.24355581402778625, 0.25548499822616577, 0.2674141526222229, 0.2793433368206024, 0.29127252101898193]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 12.0, 11.0, 14.0, 11.0, 14.0, 22.0, 22.0, 34.0, 23.0, 40.0, 40.0, 45.0, 47.0, 50.0, 49.0, 37.0, 43.0, 41.0, 32.0, 47.0, 53.0, 34.0, 33.0, 36.0, 33.0, 31.0, 25.0, 19.0, 25.0, 11.0, 8.0, 11.0, 11.0, 11.0, 3.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.8046875, -1.752716064453125, -1.70074462890625, -1.648773193359375, -1.5968017578125, -1.544830322265625, -1.49285888671875, -1.440887451171875, -1.388916015625, -1.336944580078125, -1.28497314453125, -1.233001708984375, -1.1810302734375, -1.129058837890625, -1.07708740234375, -1.025115966796875, -0.97314453125, -0.921173095703125, -0.86920166015625, -0.817230224609375, -0.7652587890625, -0.713287353515625, -0.66131591796875, -0.609344482421875, -0.557373046875, -0.505401611328125, -0.45343017578125, -0.401458740234375, -0.3494873046875, -0.297515869140625, -0.24554443359375, -0.193572998046875, -0.1416015625, -0.089630126953125, -0.03765869140625, 0.014312744140625, 0.0662841796875, 0.118255615234375, 0.17022705078125, 0.222198486328125, 0.274169921875, 0.326141357421875, 0.37811279296875, 0.430084228515625, 0.4820556640625, 0.534027099609375, 0.58599853515625, 0.637969970703125, 0.68994140625, 0.741912841796875, 0.79388427734375, 0.845855712890625, 0.8978271484375, 0.949798583984375, 1.00177001953125, 1.053741455078125, 1.105712890625, 1.157684326171875, 1.20965576171875, 1.261627197265625, 1.3135986328125, 1.365570068359375, 1.41754150390625, 1.469512939453125, 1.521484375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 18.0, 21.0, 37.0, 54.0, 71.0, 126.0, 204.0, 304.0, 478.0, 794.0, 1293.0, 2252.0, 4269.0, 8160.0, 18303.0, 47086.0, 152110.0, 459404.0, 236343.0, 69653.0, 24676.0, 10687.0, 5278.0, 2790.0, 1626.0, 929.0, 572.0, 370.0, 232.0, 144.0, 89.0, 54.0, 33.0, 22.0, 22.0, 22.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.259765625, -2.175048828125, -2.09033203125, -2.005615234375, -1.9208984375, -1.836181640625, -1.75146484375, -1.666748046875, -1.58203125, -1.497314453125, -1.41259765625, -1.327880859375, -1.2431640625, -1.158447265625, -1.07373046875, -0.989013671875, -0.904296875, -0.819580078125, -0.73486328125, -0.650146484375, -0.5654296875, -0.480712890625, -0.39599609375, -0.311279296875, -0.2265625, -0.141845703125, -0.05712890625, 0.027587890625, 0.1123046875, 0.197021484375, 0.28173828125, 0.366455078125, 0.451171875, 0.535888671875, 0.62060546875, 0.705322265625, 0.7900390625, 0.874755859375, 0.95947265625, 1.044189453125, 1.12890625, 1.213623046875, 1.29833984375, 1.383056640625, 1.4677734375, 1.552490234375, 1.63720703125, 1.721923828125, 1.806640625, 1.891357421875, 1.97607421875, 2.060791015625, 2.1455078125, 2.230224609375, 2.31494140625, 2.399658203125, 2.484375, 2.569091796875, 2.65380859375, 2.738525390625, 2.8232421875, 2.907958984375, 2.99267578125, 3.077392578125, 3.162109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 13.0, 12.0, 11.0, 19.0, 17.0, 24.0, 21.0, 31.0, 37.0, 40.0, 28.0, 41.0, 71.0, 112.0, 145.0, 276.0, 1375.0, 217.0, 132.0, 61.0, 59.0, 42.0, 39.0, 33.0, 28.0, 27.0, 17.0, 27.0, 16.0, 14.0, 9.0, 4.0, 7.0, 7.0, 9.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.15234375, -5.9727783203125, -5.793212890625, -5.6136474609375, -5.43408203125, -5.2545166015625, -5.074951171875, -4.8953857421875, -4.7158203125, -4.5362548828125, -4.356689453125, -4.1771240234375, -3.99755859375, -3.8179931640625, -3.638427734375, -3.4588623046875, -3.279296875, -3.0997314453125, -2.920166015625, -2.7406005859375, -2.56103515625, -2.3814697265625, -2.201904296875, -2.0223388671875, -1.8427734375, -1.6632080078125, -1.483642578125, -1.3040771484375, -1.12451171875, -0.9449462890625, -0.765380859375, -0.5858154296875, -0.40625, -0.2266845703125, -0.047119140625, 0.1324462890625, 0.31201171875, 0.4915771484375, 0.671142578125, 0.8507080078125, 1.0302734375, 1.2098388671875, 1.389404296875, 1.5689697265625, 1.74853515625, 1.9281005859375, 2.107666015625, 2.2872314453125, 2.466796875, 2.6463623046875, 2.825927734375, 3.0054931640625, 3.18505859375, 3.3646240234375, 3.544189453125, 3.7237548828125, 3.9033203125, 4.0828857421875, 4.262451171875, 4.4420166015625, 4.62158203125, 4.8011474609375, 4.980712890625, 5.1602783203125, 5.33984375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 19.0, 16.0, 17.0, 30.0, 30.0, 56.0, 59.0, 61.0, 99.0, 174.0, 264.0, 493.0, 1300.0, 4972.0, 32624.0, 2197296.0, 880498.0, 21539.0, 3777.0, 1061.0, 457.0, 230.0, 164.0, 97.0, 82.0, 59.0, 46.0, 37.0, 26.0, 27.0, 22.0, 10.0, 9.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5625, -12.1920166015625, -11.821533203125, -11.4510498046875, -11.08056640625, -10.7100830078125, -10.339599609375, -9.9691162109375, -9.5986328125, -9.2281494140625, -8.857666015625, -8.4871826171875, -8.11669921875, -7.7462158203125, -7.375732421875, -7.0052490234375, -6.634765625, -6.2642822265625, -5.893798828125, -5.5233154296875, -5.15283203125, -4.7823486328125, -4.411865234375, -4.0413818359375, -3.6708984375, -3.3004150390625, -2.929931640625, -2.5594482421875, -2.18896484375, -1.8184814453125, -1.447998046875, -1.0775146484375, -0.70703125, -0.3365478515625, 0.033935546875, 0.4044189453125, 0.77490234375, 1.1453857421875, 1.515869140625, 1.8863525390625, 2.2568359375, 2.6273193359375, 2.997802734375, 3.3682861328125, 3.73876953125, 4.1092529296875, 4.479736328125, 4.8502197265625, 5.220703125, 5.5911865234375, 5.961669921875, 6.3321533203125, 6.70263671875, 7.0731201171875, 7.443603515625, 7.8140869140625, 8.1845703125, 8.5550537109375, 8.925537109375, 9.2960205078125, 9.66650390625, 10.0369873046875, 10.407470703125, 10.7779541015625, 11.1484375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 22.0, 719.0, 273.0, 4.0, 1.0, 1.0], "bins": [-201.0170440673828, -197.65365600585938, -194.29025268554688, -190.92686462402344, -187.5634765625, -184.2000732421875, -180.83668518066406, -177.47328186035156, -174.10989379882812, -170.7465057373047, -167.3831024169922, -164.01971435546875, -160.65631103515625, -157.2929229736328, -153.92953491210938, -150.56613159179688, -147.20274353027344, -143.83935546875, -140.4759521484375, -137.11256408691406, -133.74917602539062, -130.38577270507812, -127.02238464355469, -123.65898895263672, -120.29559326171875, -116.93219757080078, -113.56880187988281, -110.20541381835938, -106.8420181274414, -103.47862243652344, -100.115234375, -96.75183868408203, -93.3884506225586, -90.02505493164062, -86.66166687011719, -83.29827117919922, -79.93487548828125, -76.57147979736328, -73.20808410644531, -69.84469604492188, -66.4813003540039, -63.11790466308594, -59.754512786865234, -56.39112091064453, -53.02772521972656, -49.664329528808594, -46.30093765258789, -42.93754577636719, -39.57415008544922, -36.21075439453125, -32.84736251831055, -29.48396873474121, -26.120574951171875, -22.75718116760254, -19.393787384033203, -16.030393600463867, -12.666997909545898, -9.303604125976562, -5.940210342407227, -2.5768165588378906, 0.7865772247314453, 4.149971008300781, 7.513364791870117, 10.876758575439453, 14.240152359008789]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 10.0, 14.0, 13.0, 15.0, 22.0, 19.0, 33.0, 24.0, 42.0, 33.0, 37.0, 46.0, 53.0, 41.0, 54.0, 48.0, 46.0, 47.0, 44.0, 31.0, 31.0, 30.0, 32.0, 30.0, 39.0, 25.0, 22.0, 14.0, 11.0, 20.0, 9.0, 9.0, 9.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.38605499267578, -15.87166976928711, -15.357284545898438, -14.842899322509766, -14.328514099121094, -13.814128875732422, -13.29974365234375, -12.785358428955078, -12.270973205566406, -11.756587982177734, -11.242202758789062, -10.72781753540039, -10.213432312011719, -9.699047088623047, -9.184661865234375, -8.670276641845703, -8.155890464782715, -7.641505241394043, -7.127120018005371, -6.612734794616699, -6.098349571228027, -5.5839643478393555, -5.069578647613525, -4.5551934242248535, -4.040808200836182, -3.5264229774475098, -3.012037754058838, -2.497652292251587, -1.983267068862915, -1.4688818454742432, -0.9544963836669922, -0.4401111602783203, 0.07427406311035156, 0.5886593461036682, 1.1030446290969849, 1.6174299716949463, 2.131815195083618, 2.64620041847229, 3.160585880279541, 3.674971103668213, 4.189356327056885, 4.703741550445557, 5.2181267738342285, 5.732512474060059, 6.2468976974487305, 6.761282920837402, 7.275668144226074, 7.790053367614746, 8.304438591003418, 8.81882381439209, 9.333209037780762, 9.847594261169434, 10.361979484558105, 10.876364707946777, 11.390750885009766, 11.905136108398438, 12.41952133178711, 12.933906555175781, 13.448291778564453, 13.962677001953125, 14.477062225341797, 14.991447448730469, 15.50583267211914, 16.020217895507812, 16.534603118896484]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 0.0, 4.0, 6.0, 9.0, 11.0, 17.0, 13.0, 18.0, 24.0, 18.0, 22.0, 38.0, 38.0, 40.0, 48.0, 38.0, 48.0, 42.0, 38.0, 44.0, 45.0, 30.0, 37.0, 43.0, 38.0, 38.0, 35.0, 30.0, 30.0, 21.0, 24.0, 18.0, 17.0, 15.0, 13.0, 13.0, 6.0, 7.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.009765625, -1.9550933837890625, -1.900421142578125, -1.8457489013671875, -1.79107666015625, -1.7364044189453125, -1.681732177734375, -1.6270599365234375, -1.5723876953125, -1.5177154541015625, -1.463043212890625, -1.4083709716796875, -1.35369873046875, -1.2990264892578125, -1.244354248046875, -1.1896820068359375, -1.135009765625, -1.0803375244140625, -1.025665283203125, -0.9709930419921875, -0.91632080078125, -0.8616485595703125, -0.806976318359375, -0.7523040771484375, -0.6976318359375, -0.6429595947265625, -0.588287353515625, -0.5336151123046875, -0.47894287109375, -0.4242706298828125, -0.369598388671875, -0.3149261474609375, -0.26025390625, -0.2055816650390625, -0.150909423828125, -0.0962371826171875, -0.04156494140625, 0.0131072998046875, 0.067779541015625, 0.1224517822265625, 0.1771240234375, 0.2317962646484375, 0.286468505859375, 0.3411407470703125, 0.39581298828125, 0.4504852294921875, 0.505157470703125, 0.5598297119140625, 0.614501953125, 0.6691741943359375, 0.723846435546875, 0.7785186767578125, 0.83319091796875, 0.8878631591796875, 0.942535400390625, 0.9972076416015625, 1.0518798828125, 1.1065521240234375, 1.161224365234375, 1.2158966064453125, 1.27056884765625, 1.3252410888671875, 1.379913330078125, 1.4345855712890625, 1.4892578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 11.0, 7.0, 11.0, 20.0, 30.0, 32.0, 58.0, 99.0, 120.0, 220.0, 380.0, 652.0, 1329.0, 2607.0, 5914.0, 15521.0, 51388.0, 323646.0, 2481733.0, 1145833.0, 119203.0, 27867.0, 9509.0, 4128.0, 1888.0, 898.0, 473.0, 268.0, 168.0, 79.0, 46.0, 61.0, 22.0, 21.0, 18.0, 12.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0], "bins": [-5.0625, -4.931884765625, -4.80126953125, -4.670654296875, -4.5400390625, -4.409423828125, -4.27880859375, -4.148193359375, -4.017578125, -3.886962890625, -3.75634765625, -3.625732421875, -3.4951171875, -3.364501953125, -3.23388671875, -3.103271484375, -2.97265625, -2.842041015625, -2.71142578125, -2.580810546875, -2.4501953125, -2.319580078125, -2.18896484375, -2.058349609375, -1.927734375, -1.797119140625, -1.66650390625, -1.535888671875, -1.4052734375, -1.274658203125, -1.14404296875, -1.013427734375, -0.8828125, -0.752197265625, -0.62158203125, -0.490966796875, -0.3603515625, -0.229736328125, -0.09912109375, 0.031494140625, 0.162109375, 0.292724609375, 0.42333984375, 0.553955078125, 0.6845703125, 0.815185546875, 0.94580078125, 1.076416015625, 1.20703125, 1.337646484375, 1.46826171875, 1.598876953125, 1.7294921875, 1.860107421875, 1.99072265625, 2.121337890625, 2.251953125, 2.382568359375, 2.51318359375, 2.643798828125, 2.7744140625, 2.905029296875, 3.03564453125, 3.166259765625, 3.296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 24.0, 19.0, 40.0, 34.0, 68.0, 94.0, 117.0, 200.0, 296.0, 542.0, 782.0, 689.0, 448.0, 249.0, 160.0, 99.0, 58.0, 44.0, 40.0, 16.0, 20.0, 13.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.58050537109375, -4.4266357421875, -4.27276611328125, -4.118896484375, -3.96502685546875, -3.8111572265625, -3.65728759765625, -3.50341796875, -3.34954833984375, -3.1956787109375, -3.04180908203125, -2.887939453125, -2.73406982421875, -2.5802001953125, -2.42633056640625, -2.2724609375, -2.11859130859375, -1.9647216796875, -1.81085205078125, -1.656982421875, -1.50311279296875, -1.3492431640625, -1.19537353515625, -1.04150390625, -0.88763427734375, -0.7337646484375, -0.57989501953125, -0.426025390625, -0.27215576171875, -0.1182861328125, 0.03558349609375, 0.189453125, 0.34332275390625, 0.4971923828125, 0.65106201171875, 0.804931640625, 0.95880126953125, 1.1126708984375, 1.26654052734375, 1.42041015625, 1.57427978515625, 1.7281494140625, 1.88201904296875, 2.035888671875, 2.18975830078125, 2.3436279296875, 2.49749755859375, 2.6513671875, 2.80523681640625, 2.9591064453125, 3.11297607421875, 3.266845703125, 3.42071533203125, 3.5745849609375, 3.72845458984375, 3.88232421875, 4.03619384765625, 4.1900634765625, 4.34393310546875, 4.497802734375, 4.65167236328125, 4.8055419921875, 4.95941162109375, 5.11328125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 9.0, 19.0, 25.0, 38.0, 46.0, 96.0, 133.0, 243.0, 575.0, 2865.0, 151032.0, 3997331.0, 39347.0, 1494.0, 421.0, 217.0, 127.0, 75.0, 57.0, 41.0, 25.0, 22.0, 15.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.639404296875, -19.01318359375, -18.386962890625, -17.7607421875, -17.134521484375, -16.50830078125, -15.882080078125, -15.255859375, -14.629638671875, -14.00341796875, -13.377197265625, -12.7509765625, -12.124755859375, -11.49853515625, -10.872314453125, -10.24609375, -9.619873046875, -8.99365234375, -8.367431640625, -7.7412109375, -7.114990234375, -6.48876953125, -5.862548828125, -5.236328125, -4.610107421875, -3.98388671875, -3.357666015625, -2.7314453125, -2.105224609375, -1.47900390625, -0.852783203125, -0.2265625, 0.399658203125, 1.02587890625, 1.652099609375, 2.2783203125, 2.904541015625, 3.53076171875, 4.156982421875, 4.783203125, 5.409423828125, 6.03564453125, 6.661865234375, 7.2880859375, 7.914306640625, 8.54052734375, 9.166748046875, 9.79296875, 10.419189453125, 11.04541015625, 11.671630859375, 12.2978515625, 12.924072265625, 13.55029296875, 14.176513671875, 14.802734375, 15.428955078125, 16.05517578125, 16.681396484375, 17.3076171875, 17.933837890625, 18.56005859375, 19.186279296875, 19.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 15.0, 76.0, 250.0, 382.0, 214.0, 62.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.24877166748047, -69.34900665283203, -67.44923400878906, -65.54946899414062, -63.649696350097656, -61.74993133544922, -59.85015869140625, -57.95039367675781, -56.05062484741211, -54.150856018066406, -52.2510871887207, -50.351318359375, -48.4515495300293, -46.551780700683594, -44.652015686035156, -42.75224685668945, -40.85247802734375, -38.95270919799805, -37.052940368652344, -35.15317153930664, -33.25340270996094, -31.353635787963867, -29.453866958618164, -27.554100036621094, -25.654327392578125, -23.754558563232422, -21.85478973388672, -19.955020904541016, -18.055253982543945, -16.155485153198242, -14.255716323852539, -12.355948448181152, -10.456180572509766, -8.556411743164062, -6.656643867492676, -4.756875038146973, -2.8571066856384277, -0.9573383331298828, 0.9424304962158203, 2.842198371887207, 4.74196720123291, 6.641735553741455, 8.54150390625, 10.441272735595703, 12.341041564941406, 14.240809440612793, 16.140579223632812, 18.040346145629883, 19.940114974975586, 21.83988380432129, 23.739652633666992, 25.639419555664062, 27.539188385009766, 29.43895721435547, 31.338726043701172, 33.238494873046875, 35.13826370239258, 37.03803253173828, 38.937801361083984, 40.83757019042969, 42.73733901977539, 44.637107849121094, 46.53687286376953, 48.436641693115234, 50.33641052246094]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 19.0, 21.0, 29.0, 27.0, 35.0, 26.0, 37.0, 38.0, 50.0, 43.0, 45.0, 49.0, 52.0, 50.0, 35.0, 53.0, 34.0, 46.0, 38.0, 25.0, 22.0, 22.0, 29.0, 28.0, 11.0, 21.0, 11.0, 9.0, 10.0, 4.0, 12.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.414841651916504, -11.030830383300781, -10.646818161010742, -10.262805938720703, -9.87879467010498, -9.494783401489258, -9.110771179199219, -8.72675895690918, -8.342747688293457, -7.958735942840576, -7.574724197387695, -7.1907124519348145, -6.806700706481934, -6.422688961029053, -6.038677215576172, -5.654665470123291, -5.27065372467041, -4.886641979217529, -4.502630233764648, -4.118618488311768, -3.7346067428588867, -3.350594997406006, -2.966583251953125, -2.582571506500244, -2.1985597610473633, -1.8145480155944824, -1.4305362701416016, -1.0465245246887207, -0.6625127792358398, -0.278501033782959, 0.10551071166992188, 0.48952245712280273, 0.87353515625, 1.2575469017028809, 1.6415586471557617, 2.0255703926086426, 2.4095821380615234, 2.7935938835144043, 3.177605628967285, 3.561617374420166, 3.945629119873047, 4.329640865325928, 4.713652610778809, 5.0976643562316895, 5.48167610168457, 5.865687847137451, 6.249699592590332, 6.633711338043213, 7.017723083496094, 7.401734828948975, 7.7857465744018555, 8.169757843017578, 8.553770065307617, 8.937782287597656, 9.321793556213379, 9.705804824829102, 10.08981704711914, 10.47382926940918, 10.857840538024902, 11.241851806640625, 11.625864028930664, 12.009876251220703, 12.393887519836426, 12.777898788452148, 13.161911010742188]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 6.0, 11.0, 8.0, 12.0, 13.0, 21.0, 17.0, 24.0, 30.0, 44.0, 38.0, 35.0, 56.0, 52.0, 31.0, 48.0, 50.0, 55.0, 33.0, 46.0, 43.0, 36.0, 35.0, 38.0, 28.0, 33.0, 29.0, 14.0, 17.0, 26.0, 12.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.69378662109375, -1.6405029296875, -1.58721923828125, -1.533935546875, -1.48065185546875, -1.4273681640625, -1.37408447265625, -1.32080078125, -1.26751708984375, -1.2142333984375, -1.16094970703125, -1.107666015625, -1.05438232421875, -1.0010986328125, -0.94781494140625, -0.89453125, -0.84124755859375, -0.7879638671875, -0.73468017578125, -0.681396484375, -0.62811279296875, -0.5748291015625, -0.52154541015625, -0.46826171875, -0.41497802734375, -0.3616943359375, -0.30841064453125, -0.255126953125, -0.20184326171875, -0.1485595703125, -0.09527587890625, -0.0419921875, 0.01129150390625, 0.0645751953125, 0.11785888671875, 0.171142578125, 0.22442626953125, 0.2777099609375, 0.33099365234375, 0.38427734375, 0.43756103515625, 0.4908447265625, 0.54412841796875, 0.597412109375, 0.65069580078125, 0.7039794921875, 0.75726318359375, 0.810546875, 0.86383056640625, 0.9171142578125, 0.97039794921875, 1.023681640625, 1.07696533203125, 1.1302490234375, 1.18353271484375, 1.23681640625, 1.29010009765625, 1.3433837890625, 1.39666748046875, 1.449951171875, 1.50323486328125, 1.5565185546875, 1.60980224609375, 1.6630859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 8.0, 15.0, 22.0, 28.0, 42.0, 64.0, 83.0, 160.0, 241.0, 382.0, 570.0, 905.0, 1514.0, 2439.0, 3915.0, 6395.0, 10633.0, 17516.0, 28901.0, 48375.0, 78775.0, 122383.0, 169847.0, 179864.0, 139014.0, 92095.0, 56686.0, 34517.0, 20835.0, 12534.0, 7608.0, 4576.0, 2807.0, 1760.0, 1150.0, 671.0, 455.0, 264.0, 157.0, 106.0, 79.0, 45.0, 44.0, 27.0, 13.0, 9.0, 4.0, 7.0, 0.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.6572265625, -0.6367950439453125, -0.616363525390625, -0.5959320068359375, -0.57550048828125, -0.5550689697265625, -0.534637451171875, -0.5142059326171875, -0.4937744140625, -0.4733428955078125, -0.452911376953125, -0.4324798583984375, -0.41204833984375, -0.3916168212890625, -0.371185302734375, -0.3507537841796875, -0.330322265625, -0.3098907470703125, -0.289459228515625, -0.2690277099609375, -0.24859619140625, -0.2281646728515625, -0.207733154296875, -0.1873016357421875, -0.1668701171875, -0.1464385986328125, -0.126007080078125, -0.1055755615234375, -0.08514404296875, -0.0647125244140625, -0.044281005859375, -0.0238494873046875, -0.00341796875, 0.0170135498046875, 0.037445068359375, 0.0578765869140625, 0.07830810546875, 0.0987396240234375, 0.119171142578125, 0.1396026611328125, 0.1600341796875, 0.1804656982421875, 0.200897216796875, 0.2213287353515625, 0.24176025390625, 0.2621917724609375, 0.282623291015625, 0.3030548095703125, 0.323486328125, 0.3439178466796875, 0.364349365234375, 0.3847808837890625, 0.40521240234375, 0.4256439208984375, 0.446075439453125, 0.4665069580078125, 0.4869384765625, 0.5073699951171875, 0.527801513671875, 0.5482330322265625, 0.56866455078125, 0.5890960693359375, 0.609527587890625, 0.6299591064453125, 0.650390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 12.0, 11.0, 19.0, 24.0, 19.0, 25.0, 21.0, 40.0, 25.0, 36.0, 38.0, 42.0, 35.0, 32.0, 35.0, 47.0, 41.0, 1073.0, 44.0, 39.0, 40.0, 32.0, 29.0, 36.0, 32.0, 25.0, 24.0, 15.0, 19.0, 24.0, 10.0, 14.0, 9.0, 11.0, 8.0, 5.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.172576904296875, -1.13226318359375, -1.091949462890625, -1.0516357421875, -1.011322021484375, -0.97100830078125, -0.930694580078125, -0.890380859375, -0.850067138671875, -0.80975341796875, -0.769439697265625, -0.7291259765625, -0.688812255859375, -0.64849853515625, -0.608184814453125, -0.56787109375, -0.527557373046875, -0.48724365234375, -0.446929931640625, -0.4066162109375, -0.366302490234375, -0.32598876953125, -0.285675048828125, -0.245361328125, -0.205047607421875, -0.16473388671875, -0.124420166015625, -0.0841064453125, -0.043792724609375, -0.00347900390625, 0.036834716796875, 0.0771484375, 0.117462158203125, 0.15777587890625, 0.198089599609375, 0.2384033203125, 0.278717041015625, 0.31903076171875, 0.359344482421875, 0.399658203125, 0.439971923828125, 0.48028564453125, 0.520599365234375, 0.5609130859375, 0.601226806640625, 0.64154052734375, 0.681854248046875, 0.72216796875, 0.762481689453125, 0.80279541015625, 0.843109130859375, 0.8834228515625, 0.923736572265625, 0.96405029296875, 1.004364013671875, 1.044677734375, 1.084991455078125, 1.12530517578125, 1.165618896484375, 1.2059326171875, 1.246246337890625, 1.28656005859375, 1.326873779296875, 1.3671875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 14.0, 8.0, 14.0, 19.0, 27.0, 54.0, 76.0, 101.0, 195.0, 259.0, 380.0, 618.0, 1007.0, 1590.0, 2366.0, 3783.0, 6403.0, 10864.0, 19369.0, 42720.0, 233930.0, 1580125.0, 120505.0, 32323.0, 16314.0, 9248.0, 5610.0, 3359.0, 2130.0, 1308.0, 811.0, 579.0, 366.0, 247.0, 161.0, 87.0, 57.0, 42.0, 26.0, 19.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.962890625, -0.9311676025390625, -0.899444580078125, -0.8677215576171875, -0.83599853515625, -0.8042755126953125, -0.772552490234375, -0.7408294677734375, -0.7091064453125, -0.6773834228515625, -0.645660400390625, -0.6139373779296875, -0.58221435546875, -0.5504913330078125, -0.518768310546875, -0.4870452880859375, -0.455322265625, -0.4235992431640625, -0.391876220703125, -0.3601531982421875, -0.32843017578125, -0.2967071533203125, -0.264984130859375, -0.2332611083984375, -0.2015380859375, -0.1698150634765625, -0.138092041015625, -0.1063690185546875, -0.07464599609375, -0.0429229736328125, -0.011199951171875, 0.0205230712890625, 0.05224609375, 0.0839691162109375, 0.115692138671875, 0.1474151611328125, 0.17913818359375, 0.2108612060546875, 0.242584228515625, 0.2743072509765625, 0.3060302734375, 0.3377532958984375, 0.369476318359375, 0.4011993408203125, 0.43292236328125, 0.4646453857421875, 0.496368408203125, 0.5280914306640625, 0.559814453125, 0.5915374755859375, 0.623260498046875, 0.6549835205078125, 0.68670654296875, 0.7184295654296875, 0.750152587890625, 0.7818756103515625, 0.8135986328125, 0.8453216552734375, 0.877044677734375, 0.9087677001953125, 0.94049072265625, 0.9722137451171875, 1.003936767578125, 1.0356597900390625, 1.0673828125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 2.0, 4.0, 9.0, 18.0, 17.0, 19.0, 19.0, 19.0, 24.0, 27.0, 31.0, 28.0, 41.0, 49.0, 50.0, 57.0, 61.0, 83.0, 66.0, 52.0, 38.0, 38.0, 32.0, 35.0, 34.0, 27.0, 26.0, 26.0, 15.0, 11.0, 15.0, 8.0, 2.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11669921875, -0.11336708068847656, -0.11003494262695312, -0.10670280456542969, -0.10337066650390625, -0.10003852844238281, -0.09670639038085938, -0.09337425231933594, -0.0900421142578125, -0.08670997619628906, -0.08337783813476562, -0.08004570007324219, -0.07671356201171875, -0.07338142395019531, -0.07004928588867188, -0.06671714782714844, -0.063385009765625, -0.06005287170410156, -0.056720733642578125, -0.05338859558105469, -0.05005645751953125, -0.04672431945800781, -0.043392181396484375, -0.04006004333496094, -0.0367279052734375, -0.03339576721191406, -0.030063629150390625, -0.026731491088867188, -0.02339935302734375, -0.020067214965820312, -0.016735076904296875, -0.013402938842773438, -0.01007080078125, -0.0067386627197265625, -0.003406524658203125, -7.43865966796875e-05, 0.00325775146484375, 0.0065898895263671875, 0.009922027587890625, 0.013254165649414062, 0.0165863037109375, 0.019918441772460938, 0.023250579833984375, 0.026582717895507812, 0.02991485595703125, 0.03324699401855469, 0.036579132080078125, 0.03991127014160156, 0.043243408203125, 0.04657554626464844, 0.049907684326171875, 0.05323982238769531, 0.05657196044921875, 0.05990409851074219, 0.06323623657226562, 0.06656837463378906, 0.0699005126953125, 0.07323265075683594, 0.07656478881835938, 0.07989692687988281, 0.08322906494140625, 0.08656120300292969, 0.08989334106445312, 0.09322547912597656, 0.0965576171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 14.0, 18.0, 23.0, 44.0, 36.0, 53.0, 43.0, 98.0, 142.0, 265.0, 988.0, 48211.0, 986827.0, 10450.0, 655.0, 204.0, 128.0, 93.0, 45.0, 39.0, 25.0, 30.0, 21.0, 13.0, 22.0, 15.0, 4.0, 5.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.045074462890625, -1.97296142578125, -1.900848388671875, -1.8287353515625, -1.756622314453125, -1.68450927734375, -1.612396240234375, -1.540283203125, -1.468170166015625, -1.39605712890625, -1.323944091796875, -1.2518310546875, -1.179718017578125, -1.10760498046875, -1.035491943359375, -0.96337890625, -0.891265869140625, -0.81915283203125, -0.747039794921875, -0.6749267578125, -0.602813720703125, -0.53070068359375, -0.458587646484375, -0.386474609375, -0.314361572265625, -0.24224853515625, -0.170135498046875, -0.0980224609375, -0.025909423828125, 0.04620361328125, 0.118316650390625, 0.1904296875, 0.262542724609375, 0.33465576171875, 0.406768798828125, 0.4788818359375, 0.550994873046875, 0.62310791015625, 0.695220947265625, 0.767333984375, 0.839447021484375, 0.91156005859375, 0.983673095703125, 1.0557861328125, 1.127899169921875, 1.20001220703125, 1.272125244140625, 1.34423828125, 1.416351318359375, 1.48846435546875, 1.560577392578125, 1.6326904296875, 1.704803466796875, 1.77691650390625, 1.849029541015625, 1.921142578125, 1.993255615234375, 2.06536865234375, 2.137481689453125, 2.2095947265625, 2.281707763671875, 2.35382080078125, 2.425933837890625, 2.498046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 11.0, 59.0, 558.0, 350.0, 36.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73728346824646, -2.639051914215088, -2.540820598602295, -2.442589044570923, -2.34435772895813, -2.246126174926758, -2.147894859313965, -2.0496633052825928, -1.9514319896697998, -1.8532005548477173, -1.7549691200256348, -1.6567376852035522, -1.5585062503814697, -1.4602748155593872, -1.3620433807373047, -1.2638118267059326, -1.16558039188385, -1.0673489570617676, -0.9691175222396851, -0.8708860874176025, -0.77265465259552, -0.6744232177734375, -0.5761917233467102, -0.4779602885246277, -0.37972885370254517, -0.28149741888046265, -0.18326596915721893, -0.08503451943397522, 0.0131969153881073, 0.11142835021018982, 0.20965981483459473, 0.30789124965667725, 0.40612268447875977, 0.5043541193008423, 0.6025855541229248, 0.7008169889450073, 0.7990484237670898, 0.8972798585891724, 0.9955113530158997, 1.093742847442627, 1.19197416305542, 1.2902055978775024, 1.388437032699585, 1.4866684675216675, 1.58489990234375, 1.6831313371658325, 1.781362771987915, 1.879594326019287, 1.9778257608413696, 2.076057195663452, 2.174288749694824, 2.272520065307617, 2.3707516193389893, 2.4689829349517822, 2.5672144889831543, 2.6654458045959473, 2.7636773586273193, 2.8619089126586914, 2.9601402282714844, 3.0583717823028564, 3.1566030979156494, 3.2548346519470215, 3.3530659675598145, 3.4512975215911865, 3.5495288372039795]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 8.0, 6.0, 7.0, 9.0, 12.0, 20.0, 18.0, 25.0, 29.0, 31.0, 38.0, 59.0, 53.0, 35.0, 57.0, 51.0, 57.0, 55.0, 58.0, 47.0, 50.0, 49.0, 39.0, 29.0, 31.0, 27.0, 19.0, 25.0, 18.0, 10.0, 8.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6050333380699158, -0.5891799330711365, -0.5733264684677124, -0.5574730634689331, -0.541619598865509, -0.5257661938667297, -0.5099127292633057, -0.49405932426452637, -0.47820591926574707, -0.4623524844646454, -0.4464990496635437, -0.4306456446647644, -0.4147922098636627, -0.39893877506256104, -0.38308534026145935, -0.36723190546035767, -0.351378470659256, -0.3355250358581543, -0.3196716010570526, -0.3038181662559509, -0.28796476125717163, -0.27211132645606995, -0.25625789165496826, -0.24040445685386658, -0.2245510369539261, -0.2086976021528244, -0.1928441822528839, -0.17699074745178223, -0.16113731265068054, -0.14528389275074005, -0.12943045794963837, -0.11357703059911728, -0.09772360324859619, -0.0818701758980751, -0.06601674854755402, -0.05016331374645233, -0.034309886395931244, -0.018456459045410156, -0.0026030242443084717, 0.013250403106212616, 0.029103830456733704, 0.04495725780725479, 0.06081068888306618, 0.07666411995887756, 0.09251754730939865, 0.10837097465991974, 0.12422440946102142, 0.14007782936096191, 0.1559312641620636, 0.17178469896316528, 0.18763811886310577, 0.20349155366420746, 0.21934497356414795, 0.23519840836524963, 0.2510518431663513, 0.266905277967453, 0.2827587127685547, 0.29861214756965637, 0.31446558237075806, 0.33031898736953735, 0.34617242217063904, 0.3620258569717407, 0.3778792917728424, 0.3937327265739441, 0.4095861315727234]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 24.0, 18.0, 27.0, 30.0, 43.0, 39.0, 60.0, 49.0, 65.0, 75.0, 56.0, 70.0, 52.0, 67.0, 52.0, 50.0, 47.0, 30.0, 30.0, 28.0, 29.0, 17.0, 13.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.287506103515625, -2.21173095703125, -2.135955810546875, -2.0601806640625, -1.984405517578125, -1.90863037109375, -1.832855224609375, -1.757080078125, -1.681304931640625, -1.60552978515625, -1.529754638671875, -1.4539794921875, -1.378204345703125, -1.30242919921875, -1.226654052734375, -1.15087890625, -1.075103759765625, -0.99932861328125, -0.923553466796875, -0.8477783203125, -0.772003173828125, -0.69622802734375, -0.620452880859375, -0.544677734375, -0.468902587890625, -0.39312744140625, -0.317352294921875, -0.2415771484375, -0.165802001953125, -0.09002685546875, -0.014251708984375, 0.0615234375, 0.137298583984375, 0.21307373046875, 0.288848876953125, 0.3646240234375, 0.440399169921875, 0.51617431640625, 0.591949462890625, 0.667724609375, 0.743499755859375, 0.81927490234375, 0.895050048828125, 0.9708251953125, 1.046600341796875, 1.12237548828125, 1.198150634765625, 1.27392578125, 1.349700927734375, 1.42547607421875, 1.501251220703125, 1.5770263671875, 1.652801513671875, 1.72857666015625, 1.804351806640625, 1.880126953125, 1.955902099609375, 2.03167724609375, 2.107452392578125, 2.1832275390625, 2.259002685546875, 2.33477783203125, 2.410552978515625, 2.486328125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 10.0, 9.0, 13.0, 29.0, 54.0, 86.0, 175.0, 310.0, 619.0, 1397.0, 2983.0, 6853.0, 18012.0, 51120.0, 172640.0, 482953.0, 214090.0, 61633.0, 21241.0, 7928.0, 3341.0, 1495.0, 750.0, 348.0, 192.0, 110.0, 60.0, 36.0, 22.0, 12.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.25933837890625, -2.1710205078125, -2.08270263671875, -1.994384765625, -1.90606689453125, -1.8177490234375, -1.72943115234375, -1.64111328125, -1.55279541015625, -1.4644775390625, -1.37615966796875, -1.287841796875, -1.19952392578125, -1.1112060546875, -1.02288818359375, -0.9345703125, -0.84625244140625, -0.7579345703125, -0.66961669921875, -0.581298828125, -0.49298095703125, -0.4046630859375, -0.31634521484375, -0.22802734375, -0.13970947265625, -0.0513916015625, 0.03692626953125, 0.125244140625, 0.21356201171875, 0.3018798828125, 0.39019775390625, 0.478515625, 0.56683349609375, 0.6551513671875, 0.74346923828125, 0.831787109375, 0.92010498046875, 1.0084228515625, 1.09674072265625, 1.18505859375, 1.27337646484375, 1.3616943359375, 1.45001220703125, 1.538330078125, 1.62664794921875, 1.7149658203125, 1.80328369140625, 1.8916015625, 1.97991943359375, 2.0682373046875, 2.15655517578125, 2.244873046875, 2.33319091796875, 2.4215087890625, 2.50982666015625, 2.59814453125, 2.68646240234375, 2.7747802734375, 2.86309814453125, 2.951416015625, 3.03973388671875, 3.1280517578125, 3.21636962890625, 3.3046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 12.0, 7.0, 15.0, 12.0, 28.0, 24.0, 37.0, 39.0, 39.0, 53.0, 56.0, 68.0, 123.0, 221.0, 1519.0, 224.0, 124.0, 66.0, 56.0, 47.0, 46.0, 34.0, 34.0, 24.0, 24.0, 20.0, 15.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7176513671875, -6.517333984375, -6.3170166015625, -6.11669921875, -5.9163818359375, -5.716064453125, -5.5157470703125, -5.3154296875, -5.1151123046875, -4.914794921875, -4.7144775390625, -4.51416015625, -4.3138427734375, -4.113525390625, -3.9132080078125, -3.712890625, -3.5125732421875, -3.312255859375, -3.1119384765625, -2.91162109375, -2.7113037109375, -2.510986328125, -2.3106689453125, -2.1103515625, -1.9100341796875, -1.709716796875, -1.5093994140625, -1.30908203125, -1.1087646484375, -0.908447265625, -0.7081298828125, -0.5078125, -0.3074951171875, -0.107177734375, 0.0931396484375, 0.29345703125, 0.4937744140625, 0.694091796875, 0.8944091796875, 1.0947265625, 1.2950439453125, 1.495361328125, 1.6956787109375, 1.89599609375, 2.0963134765625, 2.296630859375, 2.4969482421875, 2.697265625, 2.8975830078125, 3.097900390625, 3.2982177734375, 3.49853515625, 3.6988525390625, 3.899169921875, 4.0994873046875, 4.2998046875, 4.5001220703125, 4.700439453125, 4.9007568359375, 5.10107421875, 5.3013916015625, 5.501708984375, 5.7020263671875, 5.90234375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 15.0, 14.0, 10.0, 21.0, 31.0, 39.0, 51.0, 61.0, 99.0, 166.0, 197.0, 398.0, 1222.0, 8865.0, 673348.0, 2441671.0, 16589.0, 1606.0, 473.0, 260.0, 144.0, 103.0, 96.0, 48.0, 38.0, 31.0, 22.0, 18.0, 16.0, 10.0, 5.0, 9.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.8668212890625, -11.444580078125, -11.0223388671875, -10.60009765625, -10.1778564453125, -9.755615234375, -9.3333740234375, -8.9111328125, -8.4888916015625, -8.066650390625, -7.6444091796875, -7.22216796875, -6.7999267578125, -6.377685546875, -5.9554443359375, -5.533203125, -5.1109619140625, -4.688720703125, -4.2664794921875, -3.84423828125, -3.4219970703125, -2.999755859375, -2.5775146484375, -2.1552734375, -1.7330322265625, -1.310791015625, -0.8885498046875, -0.46630859375, -0.0440673828125, 0.378173828125, 0.8004150390625, 1.22265625, 1.6448974609375, 2.067138671875, 2.4893798828125, 2.91162109375, 3.3338623046875, 3.756103515625, 4.1783447265625, 4.6005859375, 5.0228271484375, 5.445068359375, 5.8673095703125, 6.28955078125, 6.7117919921875, 7.134033203125, 7.5562744140625, 7.978515625, 8.4007568359375, 8.822998046875, 9.2452392578125, 9.66748046875, 10.0897216796875, 10.511962890625, 10.9342041015625, 11.3564453125, 11.7786865234375, 12.200927734375, 12.6231689453125, 13.04541015625, 13.4676513671875, 13.889892578125, 14.3121337890625, 14.734375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 528.0, 482.0, 4.0], "bins": [-254.04322814941406, -249.94281005859375, -245.84239196777344, -241.74197387695312, -237.6415557861328, -233.5411376953125, -229.4407196044922, -225.34030151367188, -221.2398681640625, -217.1394500732422, -213.03903198242188, -208.93861389160156, -204.83819580078125, -200.73777770996094, -196.63735961914062, -192.53692626953125, -188.4365234375, -184.3361053466797, -180.23568725585938, -176.13526916503906, -172.03485107421875, -167.93443298339844, -163.83401489257812, -159.73358154296875, -155.6331787109375, -151.5327606201172, -147.43234252929688, -143.33192443847656, -139.23150634765625, -135.13108825683594, -131.03067016601562, -126.93024444580078, -122.82980346679688, -118.72938537597656, -114.62896728515625, -110.52854919433594, -106.42813110351562, -102.32771301269531, -98.22728729248047, -94.12686920166016, -90.02645111083984, -85.92603302001953, -81.82561492919922, -77.7251968383789, -73.62477111816406, -69.52435302734375, -65.42393493652344, -61.323516845703125, -57.22309875488281, -53.1226806640625, -49.02226257324219, -44.92184066772461, -40.8214225769043, -36.721004486083984, -32.620582580566406, -28.520164489746094, -24.41974639892578, -20.31932830810547, -16.218908309936523, -12.118489265441895, -8.018070220947266, -3.917652130126953, 0.1827678680419922, 4.2831878662109375, 8.38360595703125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 10.0, 6.0, 14.0, 17.0, 12.0, 17.0, 22.0, 27.0, 31.0, 33.0, 39.0, 42.0, 39.0, 33.0, 52.0, 50.0, 42.0, 35.0, 31.0, 44.0, 38.0, 44.0, 30.0, 35.0, 35.0, 37.0, 24.0, 26.0, 25.0, 16.0, 22.0, 15.0, 12.0, 7.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.349242210388184, -14.865498542785645, -14.381753921508789, -13.89801025390625, -13.414265632629395, -12.930521965026855, -12.44677734375, -11.963033676147461, -11.479289054870605, -10.995545387268066, -10.511800765991211, -10.028057098388672, -9.544312477111816, -9.060568809509277, -8.576824188232422, -8.093080520629883, -7.6093363761901855, -7.125592231750488, -6.641848087310791, -6.158103942871094, -5.6743597984313965, -5.190615653991699, -4.70687198638916, -4.223127365112305, -3.7393834590911865, -3.2556393146514893, -2.771895170211792, -2.288151264190674, -1.804407000541687, -1.3206629753112793, -0.836918830871582, -0.35317468643188477, 0.1305694580078125, 0.6143136024475098, 1.098057746887207, 1.5818017721176147, 2.0655460357666016, 2.5492899417877197, 3.033034086227417, 3.5167782306671143, 4.000522613525391, 4.484266757965088, 4.968010902404785, 5.451755046844482, 5.93549919128418, 6.419242858886719, 6.902987480163574, 7.386731147766113, 7.8704752922058105, 8.354219436645508, 8.837963104248047, 9.321707725524902, 9.805451393127441, 10.289196014404297, 10.772939682006836, 11.256684303283691, 11.74042797088623, 12.22417163848877, 12.707916259765625, 13.191659927368164, 13.67540454864502, 14.159148216247559, 14.642892837524414, 15.126636505126953, 15.610381126403809]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 13.0, 12.0, 12.0, 10.0, 27.0, 19.0, 29.0, 35.0, 35.0, 39.0, 45.0, 44.0, 67.0, 53.0, 60.0, 41.0, 52.0, 51.0, 62.0, 42.0, 37.0, 38.0, 39.0, 28.0, 26.0, 14.0, 22.0, 7.0, 11.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.16497802734375, -2.0975341796875, -2.03009033203125, -1.962646484375, -1.89520263671875, -1.8277587890625, -1.76031494140625, -1.69287109375, -1.62542724609375, -1.5579833984375, -1.49053955078125, -1.423095703125, -1.35565185546875, -1.2882080078125, -1.22076416015625, -1.1533203125, -1.08587646484375, -1.0184326171875, -0.95098876953125, -0.883544921875, -0.81610107421875, -0.7486572265625, -0.68121337890625, -0.61376953125, -0.54632568359375, -0.4788818359375, -0.41143798828125, -0.343994140625, -0.27655029296875, -0.2091064453125, -0.14166259765625, -0.07421875, -0.00677490234375, 0.0606689453125, 0.12811279296875, 0.195556640625, 0.26300048828125, 0.3304443359375, 0.39788818359375, 0.46533203125, 0.53277587890625, 0.6002197265625, 0.66766357421875, 0.735107421875, 0.80255126953125, 0.8699951171875, 0.93743896484375, 1.0048828125, 1.07232666015625, 1.1397705078125, 1.20721435546875, 1.274658203125, 1.34210205078125, 1.4095458984375, 1.47698974609375, 1.54443359375, 1.61187744140625, 1.6793212890625, 1.74676513671875, 1.814208984375, 1.88165283203125, 1.9490966796875, 2.01654052734375, 2.083984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 11.0, 18.0, 10.0, 30.0, 37.0, 59.0, 86.0, 131.0, 196.0, 370.0, 614.0, 1140.0, 2390.0, 5033.0, 12120.0, 32575.0, 129362.0, 1099910.0, 2454789.0, 359602.0, 61196.0, 19613.0, 7805.0, 3534.0, 1657.0, 800.0, 468.0, 262.0, 166.0, 101.0, 70.0, 49.0, 22.0, 21.0, 13.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.70538330078125, -3.5787353515625, -3.45208740234375, -3.325439453125, -3.19879150390625, -3.0721435546875, -2.94549560546875, -2.81884765625, -2.69219970703125, -2.5655517578125, -2.43890380859375, -2.312255859375, -2.18560791015625, -2.0589599609375, -1.93231201171875, -1.8056640625, -1.67901611328125, -1.5523681640625, -1.42572021484375, -1.299072265625, -1.17242431640625, -1.0457763671875, -0.91912841796875, -0.79248046875, -0.66583251953125, -0.5391845703125, -0.41253662109375, -0.285888671875, -0.15924072265625, -0.0325927734375, 0.09405517578125, 0.220703125, 0.34735107421875, 0.4739990234375, 0.60064697265625, 0.727294921875, 0.85394287109375, 0.9805908203125, 1.10723876953125, 1.23388671875, 1.36053466796875, 1.4871826171875, 1.61383056640625, 1.740478515625, 1.86712646484375, 1.9937744140625, 2.12042236328125, 2.2470703125, 2.37371826171875, 2.5003662109375, 2.62701416015625, 2.753662109375, 2.88031005859375, 3.0069580078125, 3.13360595703125, 3.26025390625, 3.38690185546875, 3.5135498046875, 3.64019775390625, 3.766845703125, 3.89349365234375, 4.0201416015625, 4.14678955078125, 4.2734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 7.0, 6.0, 9.0, 18.0, 21.0, 37.0, 52.0, 80.0, 78.0, 119.0, 193.0, 294.0, 452.0, 685.0, 683.0, 465.0, 325.0, 200.0, 114.0, 69.0, 49.0, 38.0, 21.0, 16.0, 8.0, 9.0, 11.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.7578125, -5.620849609375, -5.48388671875, -5.346923828125, -5.2099609375, -5.072998046875, -4.93603515625, -4.799072265625, -4.662109375, -4.525146484375, -4.38818359375, -4.251220703125, -4.1142578125, -3.977294921875, -3.84033203125, -3.703369140625, -3.56640625, -3.429443359375, -3.29248046875, -3.155517578125, -3.0185546875, -2.881591796875, -2.74462890625, -2.607666015625, -2.470703125, -2.333740234375, -2.19677734375, -2.059814453125, -1.9228515625, -1.785888671875, -1.64892578125, -1.511962890625, -1.375, -1.238037109375, -1.10107421875, -0.964111328125, -0.8271484375, -0.690185546875, -0.55322265625, -0.416259765625, -0.279296875, -0.142333984375, -0.00537109375, 0.131591796875, 0.2685546875, 0.405517578125, 0.54248046875, 0.679443359375, 0.81640625, 0.953369140625, 1.09033203125, 1.227294921875, 1.3642578125, 1.501220703125, 1.63818359375, 1.775146484375, 1.912109375, 2.049072265625, 2.18603515625, 2.322998046875, 2.4599609375, 2.596923828125, 2.73388671875, 2.870849609375, 3.0078125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 12.0, 14.0, 12.0, 12.0, 37.0, 46.0, 69.0, 103.0, 225.0, 534.0, 2860.0, 66386.0, 3999605.0, 119169.0, 3887.0, 631.0, 250.0, 120.0, 89.0, 74.0, 43.0, 35.0, 15.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1640625, -12.5806884765625, -11.997314453125, -11.4139404296875, -10.83056640625, -10.2471923828125, -9.663818359375, -9.0804443359375, -8.4970703125, -7.9136962890625, -7.330322265625, -6.7469482421875, -6.16357421875, -5.5802001953125, -4.996826171875, -4.4134521484375, -3.830078125, -3.2467041015625, -2.663330078125, -2.0799560546875, -1.49658203125, -0.9132080078125, -0.329833984375, 0.2535400390625, 0.8369140625, 1.4202880859375, 2.003662109375, 2.5870361328125, 3.17041015625, 3.7537841796875, 4.337158203125, 4.9205322265625, 5.50390625, 6.0872802734375, 6.670654296875, 7.2540283203125, 7.83740234375, 8.4207763671875, 9.004150390625, 9.5875244140625, 10.1708984375, 10.7542724609375, 11.337646484375, 11.9210205078125, 12.50439453125, 13.0877685546875, 13.671142578125, 14.2545166015625, 14.837890625, 15.4212646484375, 16.004638671875, 16.5880126953125, 17.17138671875, 17.7547607421875, 18.338134765625, 18.9215087890625, 19.5048828125, 20.0882568359375, 20.671630859375, 21.2550048828125, 21.83837890625, 22.4217529296875, 23.005126953125, 23.5885009765625, 24.171875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 29.0, 54.0, 128.0, 248.0, 262.0, 144.0, 71.0, 38.0, 11.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.337215423583984, -15.11185073852539, -13.886486053466797, -12.661120414733887, -11.435755729675293, -10.2103910446167, -8.985025405883789, -7.759660720825195, -6.534296035766602, -5.308931350708008, -4.083566188812256, -2.858201265335083, -1.6328363418579102, -0.4074716567993164, 0.8178935050964355, 2.0432586669921875, 3.2686233520507812, 4.493988037109375, 5.719353199005127, 6.944718360900879, 8.170083045959473, 9.395447731018066, 10.620813369750977, 11.84617805480957, 13.071542739868164, 14.296907424926758, 15.522272109985352, 16.747636795043945, 17.973003387451172, 19.198368072509766, 20.42373275756836, 21.649097442626953, 22.874462127685547, 24.09982681274414, 25.325191497802734, 26.550556182861328, 27.775920867919922, 29.001285552978516, 30.226652145385742, 31.452016830444336, 32.67738342285156, 33.902748107910156, 35.12811279296875, 36.353477478027344, 37.57884216308594, 38.80420684814453, 40.029571533203125, 41.25493621826172, 42.48030090332031, 43.705665588378906, 44.9310302734375, 46.156394958496094, 47.38175964355469, 48.60712432861328, 49.832489013671875, 51.05785369873047, 52.28321838378906, 53.508583068847656, 54.73394775390625, 55.959312438964844, 57.18467712402344, 58.41004180908203, 59.635406494140625, 60.86077117919922, 62.08613967895508]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 6.0, 12.0, 5.0, 11.0, 15.0, 12.0, 15.0, 21.0, 22.0, 24.0, 29.0, 35.0, 36.0, 42.0, 36.0, 46.0, 32.0, 43.0, 59.0, 51.0, 34.0, 29.0, 32.0, 33.0, 44.0, 35.0, 27.0, 20.0, 25.0, 29.0, 23.0, 14.0, 13.0, 15.0, 20.0, 7.0, 6.0, 8.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-13.171545028686523, -12.812033653259277, -12.452521324157715, -12.093009948730469, -11.733498573303223, -11.373987197875977, -11.014474868774414, -10.654963493347168, -10.295452117919922, -9.935940742492676, -9.576428413391113, -9.216917037963867, -8.857405662536621, -8.497894287109375, -8.138381958007812, -7.778870582580566, -7.419358730316162, -7.059846878051758, -6.700335502624512, -6.340823650360107, -5.981312274932861, -5.621800422668457, -5.262289047241211, -4.902777194976807, -4.543265342712402, -4.183753490447998, -3.824242115020752, -3.4647302627563477, -3.1052188873291016, -2.7457070350646973, -2.386195421218872, -2.026683807373047, -1.6671724319458008, -1.3076608180999756, -0.9481491446495056, -0.5886374711990356, -0.22912585735321045, 0.13038575649261475, 0.4898974895477295, 0.8494091033935547, 1.2089207172393799, 1.568432331085205, 1.9279439449310303, 2.2874555587768555, 2.6469674110412598, 3.006478786468506, 3.36599063873291, 3.7255022525787354, 4.0850138664245605, 4.444525718688965, 4.804037094116211, 5.163548946380615, 5.523060321807861, 5.882572174072266, 6.242083549499512, 6.601595401763916, 6.96110725402832, 7.320619106292725, 7.680130481719971, 8.039642333984375, 8.399153709411621, 8.758665084838867, 9.11817741394043, 9.477688789367676, 9.837200164794922]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 8.0, 16.0, 8.0, 19.0, 33.0, 29.0, 37.0, 35.0, 55.0, 54.0, 59.0, 68.0, 62.0, 55.0, 68.0, 69.0, 53.0, 50.0, 38.0, 28.0, 33.0, 28.0, 22.0, 20.0, 12.0, 11.0, 10.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.873626708984375, -2.79803466796875, -2.722442626953125, -2.6468505859375, -2.571258544921875, -2.49566650390625, -2.420074462890625, -2.344482421875, -2.268890380859375, -2.19329833984375, -2.117706298828125, -2.0421142578125, -1.966522216796875, -1.89093017578125, -1.815338134765625, -1.73974609375, -1.664154052734375, -1.58856201171875, -1.512969970703125, -1.4373779296875, -1.361785888671875, -1.28619384765625, -1.210601806640625, -1.135009765625, -1.059417724609375, -0.98382568359375, -0.908233642578125, -0.8326416015625, -0.757049560546875, -0.68145751953125, -0.605865478515625, -0.5302734375, -0.454681396484375, -0.37908935546875, -0.303497314453125, -0.2279052734375, -0.152313232421875, -0.07672119140625, -0.001129150390625, 0.074462890625, 0.150054931640625, 0.22564697265625, 0.301239013671875, 0.3768310546875, 0.452423095703125, 0.52801513671875, 0.603607177734375, 0.67919921875, 0.754791259765625, 0.83038330078125, 0.905975341796875, 0.9815673828125, 1.057159423828125, 1.13275146484375, 1.208343505859375, 1.283935546875, 1.359527587890625, 1.43511962890625, 1.510711669921875, 1.5863037109375, 1.661895751953125, 1.73748779296875, 1.813079833984375, 1.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 12.0, 18.0, 22.0, 43.0, 43.0, 91.0, 175.0, 299.0, 618.0, 1163.0, 2252.0, 4801.0, 10004.0, 22454.0, 50934.0, 115490.0, 234311.0, 287268.0, 174021.0, 80062.0, 35054.0, 15427.0, 7091.0, 3458.0, 1629.0, 824.0, 421.0, 220.0, 132.0, 72.0, 57.0, 28.0, 15.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.0546875, -1.0229873657226562, -0.9912872314453125, -0.9595870971679688, -0.927886962890625, -0.8961868286132812, -0.8644866943359375, -0.8327865600585938, -0.80108642578125, -0.7693862915039062, -0.7376861572265625, -0.7059860229492188, -0.674285888671875, -0.6425857543945312, -0.6108856201171875, -0.5791854858398438, -0.5474853515625, -0.5157852172851562, -0.4840850830078125, -0.45238494873046875, -0.420684814453125, -0.38898468017578125, -0.3572845458984375, -0.32558441162109375, -0.29388427734375, -0.26218414306640625, -0.2304840087890625, -0.19878387451171875, -0.167083740234375, -0.13538360595703125, -0.1036834716796875, -0.07198333740234375, -0.040283203125, -0.00858306884765625, 0.0231170654296875, 0.05481719970703125, 0.086517333984375, 0.11821746826171875, 0.1499176025390625, 0.18161773681640625, 0.21331787109375, 0.24501800537109375, 0.2767181396484375, 0.30841827392578125, 0.340118408203125, 0.37181854248046875, 0.4035186767578125, 0.43521881103515625, 0.4669189453125, 0.49861907958984375, 0.5303192138671875, 0.5620193481445312, 0.593719482421875, 0.6254196166992188, 0.6571197509765625, 0.6888198852539062, 0.72052001953125, 0.7522201538085938, 0.7839202880859375, 0.8156204223632812, 0.847320556640625, 0.8790206909179688, 0.9107208251953125, 0.9424209594726562, 0.97412109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 13.0, 13.0, 9.0, 14.0, 13.0, 16.0, 28.0, 24.0, 31.0, 36.0, 43.0, 45.0, 38.0, 41.0, 38.0, 44.0, 1062.0, 47.0, 44.0, 45.0, 40.0, 36.0, 37.0, 31.0, 27.0, 22.0, 30.0, 20.0, 18.0, 15.0, 19.0, 14.0, 18.0, 11.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1650390625, -1.1261138916015625, -1.087188720703125, -1.0482635498046875, -1.00933837890625, -0.9704132080078125, -0.931488037109375, -0.8925628662109375, -0.8536376953125, -0.8147125244140625, -0.775787353515625, -0.7368621826171875, -0.69793701171875, -0.6590118408203125, -0.620086669921875, -0.5811614990234375, -0.542236328125, -0.5033111572265625, -0.464385986328125, -0.4254608154296875, -0.38653564453125, -0.3476104736328125, -0.308685302734375, -0.2697601318359375, -0.2308349609375, -0.1919097900390625, -0.152984619140625, -0.1140594482421875, -0.07513427734375, -0.0362091064453125, 0.002716064453125, 0.0416412353515625, 0.08056640625, 0.1194915771484375, 0.158416748046875, 0.1973419189453125, 0.23626708984375, 0.2751922607421875, 0.314117431640625, 0.3530426025390625, 0.3919677734375, 0.4308929443359375, 0.469818115234375, 0.5087432861328125, 0.54766845703125, 0.5865936279296875, 0.625518798828125, 0.6644439697265625, 0.703369140625, 0.7422943115234375, 0.781219482421875, 0.8201446533203125, 0.85906982421875, 0.8979949951171875, 0.936920166015625, 0.9758453369140625, 1.0147705078125, 1.0536956787109375, 1.092620849609375, 1.1315460205078125, 1.17047119140625, 1.2093963623046875, 1.248321533203125, 1.2872467041015625, 1.326171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 8.0, 9.0, 15.0, 31.0, 49.0, 97.0, 149.0, 224.0, 314.0, 577.0, 838.0, 1389.0, 2334.0, 3769.0, 6003.0, 10328.0, 18782.0, 41056.0, 255919.0, 1597340.0, 94406.0, 27646.0, 14431.0, 8284.0, 5124.0, 3082.0, 1882.0, 1186.0, 731.0, 407.0, 257.0, 176.0, 89.0, 71.0, 47.0, 32.0, 11.0, 16.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.957672119140625, -0.92706298828125, -0.896453857421875, -0.8658447265625, -0.835235595703125, -0.80462646484375, -0.774017333984375, -0.743408203125, -0.712799072265625, -0.68218994140625, -0.651580810546875, -0.6209716796875, -0.590362548828125, -0.55975341796875, -0.529144287109375, -0.49853515625, -0.467926025390625, -0.43731689453125, -0.406707763671875, -0.3760986328125, -0.345489501953125, -0.31488037109375, -0.284271240234375, -0.253662109375, -0.223052978515625, -0.19244384765625, -0.161834716796875, -0.1312255859375, -0.100616455078125, -0.07000732421875, -0.039398193359375, -0.0087890625, 0.021820068359375, 0.05242919921875, 0.083038330078125, 0.1136474609375, 0.144256591796875, 0.17486572265625, 0.205474853515625, 0.236083984375, 0.266693115234375, 0.29730224609375, 0.327911376953125, 0.3585205078125, 0.389129638671875, 0.41973876953125, 0.450347900390625, 0.48095703125, 0.511566162109375, 0.54217529296875, 0.572784423828125, 0.6033935546875, 0.634002685546875, 0.66461181640625, 0.695220947265625, 0.725830078125, 0.756439208984375, 0.78704833984375, 0.817657470703125, 0.8482666015625, 0.878875732421875, 0.90948486328125, 0.940093994140625, 0.970703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 11.0, 11.0, 13.0, 24.0, 32.0, 34.0, 37.0, 48.0, 51.0, 67.0, 87.0, 72.0, 77.0, 73.0, 60.0, 63.0, 41.0, 37.0, 30.0, 22.0, 22.0, 15.0, 11.0, 6.0, 9.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.0738062858581543, -0.0716848373413086, -0.06956338882446289, -0.06744194030761719, -0.06532049179077148, -0.06319904327392578, -0.06107759475708008, -0.058956146240234375, -0.05683469772338867, -0.05471324920654297, -0.052591800689697266, -0.05047035217285156, -0.04834890365600586, -0.046227455139160156, -0.04410600662231445, -0.04198455810546875, -0.03986310958862305, -0.037741661071777344, -0.03562021255493164, -0.03349876403808594, -0.031377315521240234, -0.02925586700439453, -0.027134418487548828, -0.025012969970703125, -0.022891521453857422, -0.02077007293701172, -0.018648624420166016, -0.016527175903320312, -0.01440572738647461, -0.012284278869628906, -0.010162830352783203, -0.0080413818359375, -0.005919933319091797, -0.0037984848022460938, -0.0016770362854003906, 0.0004444122314453125, 0.0025658607482910156, 0.004687309265136719, 0.006808757781982422, 0.008930206298828125, 0.011051654815673828, 0.013173103332519531, 0.015294551849365234, 0.017416000366210938, 0.01953744888305664, 0.021658897399902344, 0.023780345916748047, 0.02590179443359375, 0.028023242950439453, 0.030144691467285156, 0.03226613998413086, 0.03438758850097656, 0.036509037017822266, 0.03863048553466797, 0.04075193405151367, 0.042873382568359375, 0.04499483108520508, 0.04711627960205078, 0.049237728118896484, 0.05135917663574219, 0.05348062515258789, 0.055602073669433594, 0.0577235221862793, 0.059844970703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 9.0, 10.0, 14.0, 22.0, 21.0, 29.0, 45.0, 93.0, 121.0, 268.0, 810.0, 3876.0, 349814.0, 686482.0, 5339.0, 908.0, 282.0, 129.0, 77.0, 51.0, 38.0, 23.0, 18.0, 13.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.144561767578125, -1.10064697265625, -1.056732177734375, -1.0128173828125, -0.968902587890625, -0.92498779296875, -0.881072998046875, -0.837158203125, -0.793243408203125, -0.74932861328125, -0.705413818359375, -0.6614990234375, -0.617584228515625, -0.57366943359375, -0.529754638671875, -0.48583984375, -0.441925048828125, -0.39801025390625, -0.354095458984375, -0.3101806640625, -0.266265869140625, -0.22235107421875, -0.178436279296875, -0.134521484375, -0.090606689453125, -0.04669189453125, -0.002777099609375, 0.0411376953125, 0.085052490234375, 0.12896728515625, 0.172882080078125, 0.216796875, 0.260711669921875, 0.30462646484375, 0.348541259765625, 0.3924560546875, 0.436370849609375, 0.48028564453125, 0.524200439453125, 0.568115234375, 0.612030029296875, 0.65594482421875, 0.699859619140625, 0.7437744140625, 0.787689208984375, 0.83160400390625, 0.875518798828125, 0.91943359375, 0.963348388671875, 1.00726318359375, 1.051177978515625, 1.0950927734375, 1.139007568359375, 1.18292236328125, 1.226837158203125, 1.270751953125, 1.314666748046875, 1.35858154296875, 1.402496337890625, 1.4464111328125, 1.490325927734375, 1.53424072265625, 1.578155517578125, 1.6220703125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 26.0, 91.0, 381.0, 386.0, 83.0, 25.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7072547674179077, -0.6764556169509888, -0.6456565260887146, -0.6148573756217957, -0.5840582251548767, -0.5532591342926025, -0.5224599838256836, -0.49166086316108704, -0.4608617424964905, -0.4300626218318939, -0.399263471364975, -0.3684643507003784, -0.33766523003578186, -0.3068661093711853, -0.27606695890426636, -0.2452678382396698, -0.21446868777275085, -0.1836695522069931, -0.15287043154239655, -0.1220712959766388, -0.09127216786146164, -0.060473039746284485, -0.029673904180526733, 0.0011252164840698242, 0.031924352049827576, 0.06272348016500473, 0.09352260828018188, 0.12432174384593964, 0.1551208794116974, 0.18592000007629395, 0.2167191356420517, 0.24751825630664825, 0.278317391872406, 0.30911651253700256, 0.3399156630039215, 0.37071478366851807, 0.4015139043331146, 0.4323130249977112, 0.4631121754646301, 0.4939112961292267, 0.5247104167938232, 0.5555095672607422, 0.5863086581230164, 0.6171078085899353, 0.6479069590568542, 0.6787060499191284, 0.7095052003860474, 0.7403043508529663, 0.7711035013198853, 0.8019026517868042, 0.8327017426490784, 0.8635008931159973, 0.8943000435829163, 0.9250991344451904, 0.9558982849121094, 0.9866974353790283, 1.0174964666366577, 1.0482956171035767, 1.0790947675704956, 1.109893798828125, 1.140692949295044, 1.171492099761963, 1.2022912502288818, 1.2330904006958008, 1.2638895511627197]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 19.0, 26.0, 23.0, 38.0, 35.0, 48.0, 48.0, 56.0, 67.0, 84.0, 81.0, 72.0, 62.0, 62.0, 57.0, 40.0, 33.0, 30.0, 35.0, 16.0, 20.0, 12.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2954719662666321, -0.2875341475009918, -0.2795962989330292, -0.2716584801673889, -0.26372063159942627, -0.255782812833786, -0.24784497916698456, -0.2399071455001831, -0.23196931183338165, -0.2240314781665802, -0.21609364449977875, -0.2081558108329773, -0.20021799206733704, -0.1922801434993744, -0.18434232473373413, -0.17640449106693268, -0.16846665740013123, -0.16052882373332977, -0.15259099006652832, -0.14465315639972687, -0.13671532273292542, -0.12877750396728516, -0.1208396703004837, -0.11290183663368225, -0.1049640029668808, -0.09702616930007935, -0.0890883356332779, -0.08115050941705704, -0.07321267575025558, -0.06527484208345413, -0.05733701214194298, -0.049399182200431824, -0.04146134853363037, -0.03352351486682892, -0.025585684925317764, -0.01764785312116146, -0.009710021317005157, -0.0017721876502037048, 0.006165642291307449, 0.014103472232818604, 0.022041305899620056, 0.02997913770377636, 0.03791696950793266, 0.04585479944944382, 0.05379263311624527, 0.06173046678304672, 0.06966829299926758, 0.07760612666606903, 0.08554396033287048, 0.09348179399967194, 0.10141962766647339, 0.10935745388269424, 0.1172952875494957, 0.12523311376571655, 0.133170947432518, 0.14110878109931946, 0.1490466147661209, 0.15698444843292236, 0.16492228209972382, 0.17286011576652527, 0.18079793453216553, 0.18873578310012817, 0.19667360186576843, 0.20461143553256989, 0.21254926919937134]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 10.0, 3.0, 9.0, 9.0, 9.0, 12.0, 21.0, 21.0, 32.0, 35.0, 43.0, 51.0, 71.0, 72.0, 63.0, 67.0, 53.0, 65.0, 61.0, 55.0, 54.0, 41.0, 33.0, 31.0, 19.0, 27.0, 16.0, 12.0, 2.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.2890625, -3.2107391357421875, -3.132415771484375, -3.0540924072265625, -2.97576904296875, -2.8974456787109375, -2.819122314453125, -2.7407989501953125, -2.6624755859375, -2.5841522216796875, -2.505828857421875, -2.4275054931640625, -2.34918212890625, -2.2708587646484375, -2.192535400390625, -2.1142120361328125, -2.035888671875, -1.9575653076171875, -1.879241943359375, -1.8009185791015625, -1.72259521484375, -1.6442718505859375, -1.565948486328125, -1.4876251220703125, -1.4093017578125, -1.3309783935546875, -1.252655029296875, -1.1743316650390625, -1.09600830078125, -1.0176849365234375, -0.939361572265625, -0.8610382080078125, -0.78271484375, -0.7043914794921875, -0.626068115234375, -0.5477447509765625, -0.46942138671875, -0.3910980224609375, -0.312774658203125, -0.2344512939453125, -0.1561279296875, -0.0778045654296875, 0.000518798828125, 0.0788421630859375, 0.15716552734375, 0.2354888916015625, 0.313812255859375, 0.3921356201171875, 0.470458984375, 0.5487823486328125, 0.627105712890625, 0.7054290771484375, 0.78375244140625, 0.8620758056640625, 0.940399169921875, 1.0187225341796875, 1.0970458984375, 1.1753692626953125, 1.253692626953125, 1.3320159912109375, 1.41033935546875, 1.4886627197265625, 1.566986083984375, 1.6453094482421875, 1.7236328125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 20.0, 31.0, 35.0, 78.0, 139.0, 181.0, 298.0, 484.0, 829.0, 1380.0, 2692.0, 5606.0, 12208.0, 29577.0, 83819.0, 326402.0, 418860.0, 103477.0, 35188.0, 14056.0, 6204.0, 3064.0, 1639.0, 889.0, 528.0, 300.0, 201.0, 132.0, 95.0, 51.0, 35.0, 26.0, 11.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28515625, -3.18878173828125, -3.0924072265625, -2.99603271484375, -2.899658203125, -2.80328369140625, -2.7069091796875, -2.61053466796875, -2.51416015625, -2.41778564453125, -2.3214111328125, -2.22503662109375, -2.128662109375, -2.03228759765625, -1.9359130859375, -1.83953857421875, -1.7431640625, -1.64678955078125, -1.5504150390625, -1.45404052734375, -1.357666015625, -1.26129150390625, -1.1649169921875, -1.06854248046875, -0.97216796875, -0.87579345703125, -0.7794189453125, -0.68304443359375, -0.586669921875, -0.49029541015625, -0.3939208984375, -0.29754638671875, -0.201171875, -0.10479736328125, -0.0084228515625, 0.08795166015625, 0.184326171875, 0.28070068359375, 0.3770751953125, 0.47344970703125, 0.56982421875, 0.66619873046875, 0.7625732421875, 0.85894775390625, 0.955322265625, 1.05169677734375, 1.1480712890625, 1.24444580078125, 1.3408203125, 1.43719482421875, 1.5335693359375, 1.62994384765625, 1.726318359375, 1.82269287109375, 1.9190673828125, 2.01544189453125, 2.11181640625, 2.20819091796875, 2.3045654296875, 2.40093994140625, 2.497314453125, 2.59368896484375, 2.6900634765625, 2.78643798828125, 2.8828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 15.0, 12.0, 16.0, 26.0, 26.0, 31.0, 35.0, 39.0, 46.0, 57.0, 61.0, 78.0, 150.0, 904.0, 852.0, 160.0, 88.0, 73.0, 74.0, 45.0, 33.0, 27.0, 39.0, 23.0, 22.0, 12.0, 14.0, 15.0, 16.0, 12.0, 6.0, 5.0, 0.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.7216796875, -5.537109375, -5.3525390625, -5.16796875, -4.9833984375, -4.798828125, -4.6142578125, -4.4296875, -4.2451171875, -4.060546875, -3.8759765625, -3.69140625, -3.5068359375, -3.322265625, -3.1376953125, -2.953125, -2.7685546875, -2.583984375, -2.3994140625, -2.21484375, -2.0302734375, -1.845703125, -1.6611328125, -1.4765625, -1.2919921875, -1.107421875, -0.9228515625, -0.73828125, -0.5537109375, -0.369140625, -0.1845703125, 0.0, 0.1845703125, 0.369140625, 0.5537109375, 0.73828125, 0.9228515625, 1.107421875, 1.2919921875, 1.4765625, 1.6611328125, 1.845703125, 2.0302734375, 2.21484375, 2.3994140625, 2.583984375, 2.7685546875, 2.953125, 3.1376953125, 3.322265625, 3.5068359375, 3.69140625, 3.8759765625, 4.060546875, 4.2451171875, 4.4296875, 4.6142578125, 4.798828125, 4.9833984375, 5.16796875, 5.3525390625, 5.537109375, 5.7216796875, 5.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 5.0, 13.0, 26.0, 25.0, 36.0, 58.0, 88.0, 93.0, 156.0, 246.0, 492.0, 1474.0, 10531.0, 434833.0, 2670489.0, 23226.0, 2484.0, 588.0, 246.0, 174.0, 112.0, 90.0, 54.0, 34.0, 30.0, 22.0, 22.0, 15.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.681396484375, -15.22216796875, -14.762939453125, -14.3037109375, -13.844482421875, -13.38525390625, -12.926025390625, -12.466796875, -12.007568359375, -11.54833984375, -11.089111328125, -10.6298828125, -10.170654296875, -9.71142578125, -9.252197265625, -8.79296875, -8.333740234375, -7.87451171875, -7.415283203125, -6.9560546875, -6.496826171875, -6.03759765625, -5.578369140625, -5.119140625, -4.659912109375, -4.20068359375, -3.741455078125, -3.2822265625, -2.822998046875, -2.36376953125, -1.904541015625, -1.4453125, -0.986083984375, -0.52685546875, -0.067626953125, 0.3916015625, 0.850830078125, 1.31005859375, 1.769287109375, 2.228515625, 2.687744140625, 3.14697265625, 3.606201171875, 4.0654296875, 4.524658203125, 4.98388671875, 5.443115234375, 5.90234375, 6.361572265625, 6.82080078125, 7.280029296875, 7.7392578125, 8.198486328125, 8.65771484375, 9.116943359375, 9.576171875, 10.035400390625, 10.49462890625, 10.953857421875, 11.4130859375, 11.872314453125, 12.33154296875, 12.790771484375, 13.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 63.0, 809.0, 141.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.6790008544922, -189.33090209960938, -185.98280334472656, -182.63470458984375, -179.28662109375, -175.9385223388672, -172.59042358398438, -169.24232482910156, -165.89422607421875, -162.54612731933594, -159.19802856445312, -155.8499298095703, -152.5018310546875, -149.15374755859375, -145.80564880371094, -142.45755004882812, -139.1094512939453, -135.7613525390625, -132.4132537841797, -129.06515502929688, -125.7170639038086, -122.36896514892578, -119.0208740234375, -115.67277526855469, -112.32467651367188, -108.97657775878906, -105.62847900390625, -102.28038787841797, -98.93228912353516, -95.58419036865234, -92.23609924316406, -88.88800048828125, -85.53990173339844, -82.19180297851562, -78.84370422363281, -75.49561309814453, -72.14751434326172, -68.7994155883789, -65.45132446289062, -62.10322570800781, -58.755126953125, -55.40702819824219, -52.05893325805664, -48.710838317871094, -45.36273956298828, -42.01464080810547, -38.66654586791992, -35.318450927734375, -31.970354080200195, -28.622257232666016, -25.274160385131836, -21.926063537597656, -18.577966690063477, -15.229869842529297, -11.881772994995117, -8.533676147460938, -5.185579299926758, -1.8374824523925781, 1.5106143951416016, 4.858711242675781, 8.206808090209961, 11.55490493774414, 14.90300178527832, 18.2510986328125, 21.59919548034668]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 8.0, 13.0, 16.0, 14.0, 22.0, 18.0, 25.0, 21.0, 37.0, 29.0, 35.0, 35.0, 29.0, 44.0, 31.0, 31.0, 44.0, 50.0, 46.0, 48.0, 44.0, 40.0, 35.0, 36.0, 39.0, 24.0, 29.0, 16.0, 27.0, 22.0, 18.0, 14.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.94007396697998, -15.442998886108398, -14.945924758911133, -14.44884967803955, -13.951775550842285, -13.454700469970703, -12.957626342773438, -12.460551261901855, -11.963476181030273, -11.466401100158691, -10.969326972961426, -10.472251892089844, -9.975177764892578, -9.478102684020996, -8.981027603149414, -8.483953475952148, -7.986879348754883, -7.489804744720459, -6.992730140686035, -6.495655059814453, -5.9985809326171875, -5.5015058517456055, -5.004431247711182, -4.507356643676758, -4.010282039642334, -3.51320743560791, -3.0161328315734863, -2.5190579891204834, -2.0219833850860596, -1.5249087810516357, -1.0278339385986328, -0.530759334564209, -0.03368568420410156, 0.46338897943496704, 0.9604636430740356, 1.457538366317749, 1.9546129703521729, 2.4516875743865967, 2.9487624168395996, 3.4458370208740234, 3.9429116249084473, 4.439986228942871, 4.937060832977295, 5.434135437011719, 5.931210517883301, 6.428284645080566, 6.925359725952148, 7.422434329986572, 7.919508934020996, 8.416584014892578, 8.913658142089844, 9.410733222961426, 9.907807350158691, 10.404882431030273, 10.901956558227539, 11.399031639099121, 11.896106719970703, 12.393181800842285, 12.89025592803955, 13.387331008911133, 13.884405136108398, 14.38148021697998, 14.878555297851562, 15.375629425048828, 15.872703552246094]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 9.0, 6.0, 15.0, 9.0, 16.0, 16.0, 26.0, 33.0, 43.0, 55.0, 43.0, 68.0, 52.0, 42.0, 64.0, 60.0, 66.0, 53.0, 41.0, 51.0, 48.0, 35.0, 41.0, 17.0, 16.0, 16.0, 16.0, 12.0, 13.0, 8.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0], "bins": [-3.373046875, -3.2945098876953125, -3.215972900390625, -3.1374359130859375, -3.05889892578125, -2.9803619384765625, -2.901824951171875, -2.8232879638671875, -2.7447509765625, -2.6662139892578125, -2.587677001953125, -2.5091400146484375, -2.43060302734375, -2.3520660400390625, -2.273529052734375, -2.1949920654296875, -2.116455078125, -2.0379180908203125, -1.959381103515625, -1.8808441162109375, -1.80230712890625, -1.7237701416015625, -1.645233154296875, -1.5666961669921875, -1.4881591796875, -1.4096221923828125, -1.331085205078125, -1.2525482177734375, -1.17401123046875, -1.0954742431640625, -1.016937255859375, -0.9384002685546875, -0.85986328125, -0.7813262939453125, -0.702789306640625, -0.6242523193359375, -0.54571533203125, -0.4671783447265625, -0.388641357421875, -0.3101043701171875, -0.2315673828125, -0.1530303955078125, -0.074493408203125, 0.0040435791015625, 0.08258056640625, 0.1611175537109375, 0.239654541015625, 0.3181915283203125, 0.396728515625, 0.4752655029296875, 0.553802490234375, 0.6323394775390625, 0.71087646484375, 0.7894134521484375, 0.867950439453125, 0.9464874267578125, 1.0250244140625, 1.1035614013671875, 1.182098388671875, 1.2606353759765625, 1.33917236328125, 1.4177093505859375, 1.496246337890625, 1.5747833251953125, 1.6533203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 10.0, 16.0, 25.0, 26.0, 52.0, 66.0, 123.0, 188.0, 416.0, 836.0, 1990.0, 5851.0, 20786.0, 130452.0, 2395873.0, 1526432.0, 87050.0, 16502.0, 4590.0, 1630.0, 626.0, 311.0, 159.0, 85.0, 61.0, 40.0, 25.0, 23.0, 10.0, 8.0, 1.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0], "bins": [-7.67578125, -7.49261474609375, -7.3094482421875, -7.12628173828125, -6.943115234375, -6.75994873046875, -6.5767822265625, -6.39361572265625, -6.21044921875, -6.02728271484375, -5.8441162109375, -5.66094970703125, -5.477783203125, -5.29461669921875, -5.1114501953125, -4.92828369140625, -4.7451171875, -4.56195068359375, -4.3787841796875, -4.19561767578125, -4.012451171875, -3.82928466796875, -3.6461181640625, -3.46295166015625, -3.27978515625, -3.09661865234375, -2.9134521484375, -2.73028564453125, -2.547119140625, -2.36395263671875, -2.1807861328125, -1.99761962890625, -1.814453125, -1.63128662109375, -1.4481201171875, -1.26495361328125, -1.081787109375, -0.89862060546875, -0.7154541015625, -0.53228759765625, -0.34912109375, -0.16595458984375, 0.0172119140625, 0.20037841796875, 0.383544921875, 0.56671142578125, 0.7498779296875, 0.93304443359375, 1.1162109375, 1.29937744140625, 1.4825439453125, 1.66571044921875, 1.848876953125, 2.03204345703125, 2.2152099609375, 2.39837646484375, 2.58154296875, 2.76470947265625, 2.9478759765625, 3.13104248046875, 3.314208984375, 3.49737548828125, 3.6805419921875, 3.86370849609375, 4.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 17.0, 16.0, 35.0, 51.0, 75.0, 83.0, 140.0, 197.0, 337.0, 554.0, 730.0, 646.0, 437.0, 247.0, 163.0, 96.0, 73.0, 47.0, 31.0, 27.0, 17.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27496337890625, -4.1358642578125, -3.99676513671875, -3.857666015625, -3.71856689453125, -3.5794677734375, -3.44036865234375, -3.30126953125, -3.16217041015625, -3.0230712890625, -2.88397216796875, -2.744873046875, -2.60577392578125, -2.4666748046875, -2.32757568359375, -2.1884765625, -2.04937744140625, -1.9102783203125, -1.77117919921875, -1.632080078125, -1.49298095703125, -1.3538818359375, -1.21478271484375, -1.07568359375, -0.93658447265625, -0.7974853515625, -0.65838623046875, -0.519287109375, -0.38018798828125, -0.2410888671875, -0.10198974609375, 0.037109375, 0.17620849609375, 0.3153076171875, 0.45440673828125, 0.593505859375, 0.73260498046875, 0.8717041015625, 1.01080322265625, 1.14990234375, 1.28900146484375, 1.4281005859375, 1.56719970703125, 1.706298828125, 1.84539794921875, 1.9844970703125, 2.12359619140625, 2.2626953125, 2.40179443359375, 2.5408935546875, 2.67999267578125, 2.819091796875, 2.95819091796875, 3.0972900390625, 3.23638916015625, 3.37548828125, 3.51458740234375, 3.6536865234375, 3.79278564453125, 3.931884765625, 4.07098388671875, 4.2100830078125, 4.34918212890625, 4.48828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 10.0, 12.0, 19.0, 26.0, 43.0, 51.0, 77.0, 117.0, 227.0, 595.0, 2928.0, 149001.0, 4012036.0, 26701.0, 1438.0, 436.0, 187.0, 112.0, 85.0, 46.0, 44.0, 29.0, 15.0, 9.0, 14.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.561767578125, -20.87353515625, -20.185302734375, -19.4970703125, -18.808837890625, -18.12060546875, -17.432373046875, -16.744140625, -16.055908203125, -15.36767578125, -14.679443359375, -13.9912109375, -13.302978515625, -12.61474609375, -11.926513671875, -11.23828125, -10.550048828125, -9.86181640625, -9.173583984375, -8.4853515625, -7.797119140625, -7.10888671875, -6.420654296875, -5.732421875, -5.044189453125, -4.35595703125, -3.667724609375, -2.9794921875, -2.291259765625, -1.60302734375, -0.914794921875, -0.2265625, 0.461669921875, 1.14990234375, 1.838134765625, 2.5263671875, 3.214599609375, 3.90283203125, 4.591064453125, 5.279296875, 5.967529296875, 6.65576171875, 7.343994140625, 8.0322265625, 8.720458984375, 9.40869140625, 10.096923828125, 10.78515625, 11.473388671875, 12.16162109375, 12.849853515625, 13.5380859375, 14.226318359375, 14.91455078125, 15.602783203125, 16.291015625, 16.979248046875, 17.66748046875, 18.355712890625, 19.0439453125, 19.732177734375, 20.42041015625, 21.108642578125, 21.796875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 39.0, 101.0, 211.0, 280.0, 210.0, 109.0, 35.0, 10.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.667701721191406, -13.407197952270508, -12.14669418334961, -10.886191368103027, -9.625687599182129, -8.36518383026123, -7.10468053817749, -5.84417724609375, -4.583673477172852, -3.3231699466705322, -2.062666416168213, -0.8021628856658936, 0.4583406448364258, 1.7188444137573242, 2.9793477058410645, 4.239850997924805, 5.500354766845703, 6.760858535766602, 8.0213623046875, 9.281865119934082, 10.54236888885498, 11.802872657775879, 13.063375473022461, 14.32387924194336, 15.584383010864258, 16.844886779785156, 18.105390548706055, 19.365894317626953, 20.62639617919922, 21.88690185546875, 23.147403717041016, 24.407907485961914, 25.668411254882812, 26.92891502380371, 28.18941879272461, 29.449922561645508, 30.710426330566406, 31.970928192138672, 33.2314338684082, 34.49193572998047, 35.75244140625, 37.012943267822266, 38.2734489440918, 39.53395080566406, 40.794456481933594, 42.05495834350586, 43.31546401977539, 44.575965881347656, 45.83646774291992, 47.09696960449219, 48.35747528076172, 49.617977142333984, 50.878482818603516, 52.13898468017578, 53.39949035644531, 54.65999221801758, 55.920494079589844, 57.18099594116211, 58.44150161743164, 59.702003479003906, 60.96250915527344, 62.2230110168457, 63.483516693115234, 64.7440185546875, 66.00452423095703]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 9.0, 13.0, 22.0, 14.0, 15.0, 22.0, 26.0, 22.0, 29.0, 28.0, 34.0, 41.0, 24.0, 48.0, 39.0, 43.0, 41.0, 43.0, 41.0, 61.0, 37.0, 42.0, 45.0, 30.0, 35.0, 35.0, 28.0, 22.0, 27.0, 16.0, 10.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-13.631193161010742, -13.263228416442871, -12.895262718200684, -12.527297973632812, -12.159332275390625, -11.791367530822754, -11.423402786254883, -11.055437088012695, -10.687472343444824, -10.319507598876953, -9.951541900634766, -9.583577156066895, -9.215612411499023, -8.847646713256836, -8.479681968688965, -8.111717224121094, -7.743751525878906, -7.375786304473877, -7.007821083068848, -6.639856338500977, -6.271891117095947, -5.903925895690918, -5.535961151123047, -5.167995929718018, -4.800030708312988, -4.432065486907959, -4.06410026550293, -3.6961355209350586, -3.3281702995300293, -2.960205078125, -2.59224009513855, -2.2242751121520996, -1.856308937072754, -1.4883438348770142, -1.1203787326812744, -0.7524136304855347, -0.3844485282897949, -0.016483426094055176, 0.35148167610168457, 0.7194466590881348, 1.087411880493164, 1.4553769826889038, 1.8233420848846436, 2.1913070678710938, 2.559272289276123, 2.9272375106811523, 3.2952024936676025, 3.6631674766540527, 4.031132698059082, 4.399097919464111, 4.767063140869141, 5.135027885437012, 5.502993106842041, 5.87095832824707, 6.238923072814941, 6.606888294219971, 6.974853515625, 7.342818737030029, 7.710783958435059, 8.07874870300293, 8.446714401245117, 8.814679145812988, 9.18264389038086, 9.550609588623047, 9.918574333190918]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 11.0, 11.0, 12.0, 19.0, 21.0, 24.0, 20.0, 35.0, 47.0, 49.0, 50.0, 65.0, 53.0, 57.0, 67.0, 59.0, 46.0, 50.0, 53.0, 43.0, 31.0, 34.0, 34.0, 16.0, 20.0, 21.0, 13.0, 5.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.36773681640625, -2.2960205078125, -2.22430419921875, -2.152587890625, -2.08087158203125, -2.0091552734375, -1.93743896484375, -1.86572265625, -1.79400634765625, -1.7222900390625, -1.65057373046875, -1.578857421875, -1.50714111328125, -1.4354248046875, -1.36370849609375, -1.2919921875, -1.22027587890625, -1.1485595703125, -1.07684326171875, -1.005126953125, -0.93341064453125, -0.8616943359375, -0.78997802734375, -0.71826171875, -0.64654541015625, -0.5748291015625, -0.50311279296875, -0.431396484375, -0.35968017578125, -0.2879638671875, -0.21624755859375, -0.14453125, -0.07281494140625, -0.0010986328125, 0.07061767578125, 0.142333984375, 0.21405029296875, 0.2857666015625, 0.35748291015625, 0.42919921875, 0.50091552734375, 0.5726318359375, 0.64434814453125, 0.716064453125, 0.78778076171875, 0.8594970703125, 0.93121337890625, 1.0029296875, 1.07464599609375, 1.1463623046875, 1.21807861328125, 1.289794921875, 1.36151123046875, 1.4332275390625, 1.50494384765625, 1.57666015625, 1.64837646484375, 1.7200927734375, 1.79180908203125, 1.863525390625, 1.93524169921875, 2.0069580078125, 2.07867431640625, 2.150390625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 6.0, 23.0, 26.0, 25.0, 58.0, 111.0, 164.0, 349.0, 649.0, 1232.0, 2483.0, 5419.0, 12222.0, 28389.0, 68945.0, 164093.0, 300547.0, 255405.0, 120534.0, 49821.0, 21021.0, 8951.0, 4099.0, 1945.0, 937.0, 465.0, 252.0, 136.0, 82.0, 69.0, 37.0, 17.0, 15.0, 10.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9326858520507812, -0.9058990478515625, -0.8791122436523438, -0.852325439453125, -0.8255386352539062, -0.7987518310546875, -0.7719650268554688, -0.74517822265625, -0.7183914184570312, -0.6916046142578125, -0.6648178100585938, -0.638031005859375, -0.6112442016601562, -0.5844573974609375, -0.5576705932617188, -0.5308837890625, -0.5040969848632812, -0.4773101806640625, -0.45052337646484375, -0.423736572265625, -0.39694976806640625, -0.3701629638671875, -0.34337615966796875, -0.31658935546875, -0.28980255126953125, -0.2630157470703125, -0.23622894287109375, -0.209442138671875, -0.18265533447265625, -0.1558685302734375, -0.12908172607421875, -0.102294921875, -0.07550811767578125, -0.0487213134765625, -0.02193450927734375, 0.004852294921875, 0.03163909912109375, 0.0584259033203125, 0.08521270751953125, 0.11199951171875, 0.13878631591796875, 0.1655731201171875, 0.19235992431640625, 0.219146728515625, 0.24593353271484375, 0.2727203369140625, 0.29950714111328125, 0.3262939453125, 0.35308074951171875, 0.3798675537109375, 0.40665435791015625, 0.433441162109375, 0.46022796630859375, 0.4870147705078125, 0.5138015747070312, 0.54058837890625, 0.5673751831054688, 0.5941619873046875, 0.6209487915039062, 0.647735595703125, 0.6745223999023438, 0.7013092041015625, 0.7280960083007812, 0.7548828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 14.0, 9.0, 26.0, 7.0, 18.0, 27.0, 32.0, 16.0, 31.0, 37.0, 29.0, 38.0, 56.0, 49.0, 42.0, 39.0, 1064.0, 30.0, 59.0, 41.0, 48.0, 35.0, 30.0, 24.0, 32.0, 24.0, 29.0, 15.0, 23.0, 15.0, 20.0, 8.0, 13.0, 7.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.482421875, -1.4412689208984375, -1.400115966796875, -1.3589630126953125, -1.31781005859375, -1.2766571044921875, -1.235504150390625, -1.1943511962890625, -1.1531982421875, -1.1120452880859375, -1.070892333984375, -1.0297393798828125, -0.98858642578125, -0.9474334716796875, -0.906280517578125, -0.8651275634765625, -0.823974609375, -0.7828216552734375, -0.741668701171875, -0.7005157470703125, -0.65936279296875, -0.6182098388671875, -0.577056884765625, -0.5359039306640625, -0.4947509765625, -0.4535980224609375, -0.412445068359375, -0.3712921142578125, -0.33013916015625, -0.2889862060546875, -0.247833251953125, -0.2066802978515625, -0.16552734375, -0.1243743896484375, -0.083221435546875, -0.0420684814453125, -0.00091552734375, 0.0402374267578125, 0.081390380859375, 0.1225433349609375, 0.1636962890625, 0.2048492431640625, 0.246002197265625, 0.2871551513671875, 0.32830810546875, 0.3694610595703125, 0.410614013671875, 0.4517669677734375, 0.492919921875, 0.5340728759765625, 0.575225830078125, 0.6163787841796875, 0.65753173828125, 0.6986846923828125, 0.739837646484375, 0.7809906005859375, 0.8221435546875, 0.8632965087890625, 0.904449462890625, 0.9456024169921875, 0.98675537109375, 1.0279083251953125, 1.069061279296875, 1.1102142333984375, 1.1513671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 18.0, 23.0, 36.0, 43.0, 100.0, 166.0, 264.0, 433.0, 678.0, 1120.0, 1904.0, 3414.0, 6090.0, 11368.0, 21745.0, 61803.0, 1515956.0, 388402.0, 43175.0, 18367.0, 9453.0, 5318.0, 2954.0, 1758.0, 988.0, 620.0, 399.0, 208.0, 129.0, 64.0, 58.0, 28.0, 16.0, 14.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7846145629882812, -0.7542877197265625, -0.7239608764648438, -0.693634033203125, -0.6633071899414062, -0.6329803466796875, -0.6026535034179688, -0.57232666015625, -0.5419998168945312, -0.5116729736328125, -0.48134613037109375, -0.451019287109375, -0.42069244384765625, -0.3903656005859375, -0.36003875732421875, -0.3297119140625, -0.29938507080078125, -0.2690582275390625, -0.23873138427734375, -0.208404541015625, -0.17807769775390625, -0.1477508544921875, -0.11742401123046875, -0.08709716796875, -0.05677032470703125, -0.0264434814453125, 0.00388336181640625, 0.034210205078125, 0.06453704833984375, 0.0948638916015625, 0.12519073486328125, 0.155517578125, 0.18584442138671875, 0.2161712646484375, 0.24649810791015625, 0.276824951171875, 0.30715179443359375, 0.3374786376953125, 0.36780548095703125, 0.39813232421875, 0.42845916748046875, 0.4587860107421875, 0.48911285400390625, 0.519439697265625, 0.5497665405273438, 0.5800933837890625, 0.6104202270507812, 0.6407470703125, 0.6710739135742188, 0.7014007568359375, 0.7317276000976562, 0.762054443359375, 0.7923812866210938, 0.8227081298828125, 0.8530349731445312, 0.88336181640625, 0.9136886596679688, 0.9440155029296875, 0.9743423461914062, 1.004669189453125, 1.0349960327148438, 1.0653228759765625, 1.0956497192382812, 1.1259765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 4.0, 16.0, 23.0, 30.0, 25.0, 39.0, 38.0, 43.0, 53.0, 74.0, 82.0, 84.0, 50.0, 56.0, 70.0, 49.0, 62.0, 36.0, 35.0, 30.0, 23.0, 16.0, 10.0, 7.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034423828125, -0.03293609619140625, -0.0314483642578125, -0.02996063232421875, -0.028472900390625, -0.02698516845703125, -0.0254974365234375, -0.02400970458984375, -0.02252197265625, -0.02103424072265625, -0.0195465087890625, -0.01805877685546875, -0.016571044921875, -0.01508331298828125, -0.0135955810546875, -0.01210784912109375, -0.0106201171875, -0.00913238525390625, -0.0076446533203125, -0.00615692138671875, -0.004669189453125, -0.00318145751953125, -0.0016937255859375, -0.00020599365234375, 0.00128173828125, 0.00276947021484375, 0.0042572021484375, 0.00574493408203125, 0.007232666015625, 0.00872039794921875, 0.0102081298828125, 0.01169586181640625, 0.01318359375, 0.01467132568359375, 0.0161590576171875, 0.01764678955078125, 0.019134521484375, 0.02062225341796875, 0.0221099853515625, 0.02359771728515625, 0.02508544921875, 0.02657318115234375, 0.0280609130859375, 0.02954864501953125, 0.031036376953125, 0.03252410888671875, 0.0340118408203125, 0.03549957275390625, 0.0369873046875, 0.03847503662109375, 0.0399627685546875, 0.04145050048828125, 0.042938232421875, 0.04442596435546875, 0.0459136962890625, 0.04740142822265625, 0.04888916015625, 0.05037689208984375, 0.0518646240234375, 0.05335235595703125, 0.054840087890625, 0.05632781982421875, 0.0578155517578125, 0.05930328369140625, 0.060791015625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 7.0, 5.0, 9.0, 6.0, 18.0, 20.0, 28.0, 34.0, 62.0, 79.0, 132.0, 261.0, 852.0, 34930.0, 999366.0, 11476.0, 636.0, 232.0, 119.0, 82.0, 46.0, 41.0, 27.0, 26.0, 17.0, 13.0, 9.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2457275390625, -1.214111328125, -1.1824951171875, -1.15087890625, -1.1192626953125, -1.087646484375, -1.0560302734375, -1.0244140625, -0.9927978515625, -0.961181640625, -0.9295654296875, -0.89794921875, -0.8663330078125, -0.834716796875, -0.8031005859375, -0.771484375, -0.7398681640625, -0.708251953125, -0.6766357421875, -0.64501953125, -0.6134033203125, -0.581787109375, -0.5501708984375, -0.5185546875, -0.4869384765625, -0.455322265625, -0.4237060546875, -0.39208984375, -0.3604736328125, -0.328857421875, -0.2972412109375, -0.265625, -0.2340087890625, -0.202392578125, -0.1707763671875, -0.13916015625, -0.1075439453125, -0.075927734375, -0.0443115234375, -0.0126953125, 0.0189208984375, 0.050537109375, 0.0821533203125, 0.11376953125, 0.1453857421875, 0.177001953125, 0.2086181640625, 0.240234375, 0.2718505859375, 0.303466796875, 0.3350830078125, 0.36669921875, 0.3983154296875, 0.429931640625, 0.4615478515625, 0.4931640625, 0.5247802734375, 0.556396484375, 0.5880126953125, 0.61962890625, 0.6512451171875, 0.682861328125, 0.7144775390625, 0.74609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 43.0, 125.0, 267.0, 310.0, 160.0, 61.0, 23.0, 6.0, 1.0, 0.0, 2.0], "bins": [-0.5731314420700073, -0.5629009008407593, -0.5526703000068665, -0.5424397587776184, -0.5322091579437256, -0.5219786167144775, -0.5117480754852295, -0.5015174746513367, -0.49128690361976624, -0.4810563325881958, -0.47082576155662537, -0.46059519052505493, -0.4503646492958069, -0.44013407826423645, -0.429903507232666, -0.4196729362010956, -0.40944236516952515, -0.3992117941379547, -0.3889812231063843, -0.37875068187713623, -0.3685201108455658, -0.35828953981399536, -0.3480589687824249, -0.3378283977508545, -0.32759785652160645, -0.317367285490036, -0.3071367144584656, -0.29690617322921753, -0.2866756021976471, -0.27644503116607666, -0.2662144601345062, -0.2559838891029358, -0.24575331807136536, -0.23552274703979492, -0.22529219090938568, -0.21506161987781525, -0.2048310488462448, -0.19460049271583557, -0.18436992168426514, -0.1741393506526947, -0.16390877962112427, -0.15367820858955383, -0.1434476524591446, -0.13321708142757416, -0.12298651039600372, -0.11275594681501389, -0.10252538323402405, -0.09229481220245361, -0.08206425607204437, -0.07183369249105453, -0.0616031214594841, -0.05137255787849426, -0.04114199057221413, -0.03091142326593399, -0.020680859684944153, -0.010450288653373718, -0.00021972507238388062, 0.010010841302573681, 0.020241407677531242, 0.03047197312116623, 0.040702540427446365, 0.0509331077337265, 0.06116367131471634, 0.07139424234628677, 0.08162480592727661]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 8.0, 8.0, 6.0, 8.0, 26.0, 20.0, 37.0, 45.0, 40.0, 45.0, 52.0, 59.0, 60.0, 61.0, 66.0, 86.0, 57.0, 55.0, 47.0, 46.0, 49.0, 34.0, 17.0, 24.0, 20.0, 6.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07222437858581543, -0.0683198943734169, -0.06441541016101837, -0.060510922223329544, -0.056606438010931015, -0.052701953798532486, -0.04879746586084366, -0.04489298164844513, -0.0409884974360466, -0.03708401322364807, -0.03317952901124954, -0.029275041073560715, -0.025370556861162186, -0.021466072648763657, -0.01756158657371998, -0.0136571004986763, -0.009752616286277771, -0.005848131142556667, -0.0019436459988355637, 0.00196083914488554, 0.005865324288606644, 0.009769808501005173, 0.013674294576048851, 0.01757878065109253, 0.02148326486349106, 0.025387749075889587, 0.029292235150933266, 0.033196721225976944, 0.03710120543837547, 0.041005689650774, 0.04491017758846283, 0.04881466180086136, 0.05271914601325989, 0.05662363022565842, 0.060528114438056946, 0.06443259865045547, 0.068337082862854, 0.07224157452583313, 0.07614605873823166, 0.08005054295063019, 0.08395502716302872, 0.08785951137542725, 0.09176399558782578, 0.0956684798002243, 0.09957297146320343, 0.10347744822502136, 0.10738193988800049, 0.11128642410039902, 0.11519090831279755, 0.11909539252519608, 0.1229998767375946, 0.12690436840057373, 0.13080884516239166, 0.1347133368253708, 0.13861781358718872, 0.14252230525016785, 0.14642679691314697, 0.1503312885761261, 0.15423576533794403, 0.15814025700092316, 0.1620447337627411, 0.16594922542572021, 0.16985370218753815, 0.17375819385051727, 0.1776626706123352]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 17.0, 15.0, 15.0, 26.0, 31.0, 32.0, 42.0, 51.0, 55.0, 49.0, 45.0, 68.0, 55.0, 63.0, 67.0, 42.0, 56.0, 39.0, 38.0, 39.0, 21.0, 29.0, 22.0, 23.0, 15.0, 12.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.591400146484375, -2.51678466796875, -2.442169189453125, -2.3675537109375, -2.292938232421875, -2.21832275390625, -2.143707275390625, -2.069091796875, -1.994476318359375, -1.91986083984375, -1.845245361328125, -1.7706298828125, -1.696014404296875, -1.62139892578125, -1.546783447265625, -1.47216796875, -1.397552490234375, -1.32293701171875, -1.248321533203125, -1.1737060546875, -1.099090576171875, -1.02447509765625, -0.949859619140625, -0.875244140625, -0.800628662109375, -0.72601318359375, -0.651397705078125, -0.5767822265625, -0.502166748046875, -0.42755126953125, -0.352935791015625, -0.2783203125, -0.203704833984375, -0.12908935546875, -0.054473876953125, 0.0201416015625, 0.094757080078125, 0.16937255859375, 0.243988037109375, 0.318603515625, 0.393218994140625, 0.46783447265625, 0.542449951171875, 0.6170654296875, 0.691680908203125, 0.76629638671875, 0.840911865234375, 0.91552734375, 0.990142822265625, 1.06475830078125, 1.139373779296875, 1.2139892578125, 1.288604736328125, 1.36322021484375, 1.437835693359375, 1.512451171875, 1.587066650390625, 1.66168212890625, 1.736297607421875, 1.8109130859375, 1.885528564453125, 1.96014404296875, 2.034759521484375, 2.109375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 12.0, 11.0, 23.0, 37.0, 28.0, 38.0, 60.0, 61.0, 107.0, 148.0, 221.0, 359.0, 484.0, 847.0, 1361.0, 2833.0, 6194.0, 16249.0, 54168.0, 288776.0, 537241.0, 96861.0, 24988.0, 8922.0, 3728.0, 1890.0, 1015.0, 585.0, 376.0, 266.0, 180.0, 128.0, 85.0, 72.0, 45.0, 29.0, 37.0, 14.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.525390625, -3.412384033203125, -3.29937744140625, -3.186370849609375, -3.0733642578125, -2.960357666015625, -2.84735107421875, -2.734344482421875, -2.621337890625, -2.508331298828125, -2.39532470703125, -2.282318115234375, -2.1693115234375, -2.056304931640625, -1.94329833984375, -1.830291748046875, -1.71728515625, -1.604278564453125, -1.49127197265625, -1.378265380859375, -1.2652587890625, -1.152252197265625, -1.03924560546875, -0.926239013671875, -0.813232421875, -0.700225830078125, -0.58721923828125, -0.474212646484375, -0.3612060546875, -0.248199462890625, -0.13519287109375, -0.022186279296875, 0.0908203125, 0.203826904296875, 0.31683349609375, 0.429840087890625, 0.5428466796875, 0.655853271484375, 0.76885986328125, 0.881866455078125, 0.994873046875, 1.107879638671875, 1.22088623046875, 1.333892822265625, 1.4468994140625, 1.559906005859375, 1.67291259765625, 1.785919189453125, 1.89892578125, 2.011932373046875, 2.12493896484375, 2.237945556640625, 2.3509521484375, 2.463958740234375, 2.57696533203125, 2.689971923828125, 2.802978515625, 2.915985107421875, 3.02899169921875, 3.141998291015625, 3.2550048828125, 3.368011474609375, 3.48101806640625, 3.594024658203125, 3.70703125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 6.0, 13.0, 12.0, 18.0, 17.0, 20.0, 21.0, 28.0, 29.0, 35.0, 53.0, 45.0, 48.0, 62.0, 84.0, 178.0, 1419.0, 339.0, 136.0, 98.0, 51.0, 54.0, 33.0, 43.0, 38.0, 24.0, 21.0, 23.0, 14.0, 14.0, 6.0, 12.0, 6.0, 7.0, 5.0, 10.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.90765380859375, -5.7098388671875, -5.51202392578125, -5.314208984375, -5.11639404296875, -4.9185791015625, -4.72076416015625, -4.52294921875, -4.32513427734375, -4.1273193359375, -3.92950439453125, -3.731689453125, -3.53387451171875, -3.3360595703125, -3.13824462890625, -2.9404296875, -2.74261474609375, -2.5447998046875, -2.34698486328125, -2.149169921875, -1.95135498046875, -1.7535400390625, -1.55572509765625, -1.35791015625, -1.16009521484375, -0.9622802734375, -0.76446533203125, -0.566650390625, -0.36883544921875, -0.1710205078125, 0.02679443359375, 0.224609375, 0.42242431640625, 0.6202392578125, 0.81805419921875, 1.015869140625, 1.21368408203125, 1.4114990234375, 1.60931396484375, 1.80712890625, 2.00494384765625, 2.2027587890625, 2.40057373046875, 2.598388671875, 2.79620361328125, 2.9940185546875, 3.19183349609375, 3.3896484375, 3.58746337890625, 3.7852783203125, 3.98309326171875, 4.180908203125, 4.37872314453125, 4.5765380859375, 4.77435302734375, 4.97216796875, 5.16998291015625, 5.3677978515625, 5.56561279296875, 5.763427734375, 5.96124267578125, 6.1590576171875, 6.35687255859375, 6.5546875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 8.0, 8.0, 10.0, 10.0, 6.0, 23.0, 19.0, 22.0, 30.0, 52.0, 57.0, 76.0, 140.0, 205.0, 445.0, 1194.0, 4870.0, 48421.0, 2905449.0, 172375.0, 9018.0, 1824.0, 616.0, 273.0, 162.0, 100.0, 62.0, 51.0, 34.0, 27.0, 30.0, 20.0, 19.0, 9.0, 8.0, 8.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.4453125, -14.999755859375, -14.55419921875, -14.108642578125, -13.6630859375, -13.217529296875, -12.77197265625, -12.326416015625, -11.880859375, -11.435302734375, -10.98974609375, -10.544189453125, -10.0986328125, -9.653076171875, -9.20751953125, -8.761962890625, -8.31640625, -7.870849609375, -7.42529296875, -6.979736328125, -6.5341796875, -6.088623046875, -5.64306640625, -5.197509765625, -4.751953125, -4.306396484375, -3.86083984375, -3.415283203125, -2.9697265625, -2.524169921875, -2.07861328125, -1.633056640625, -1.1875, -0.741943359375, -0.29638671875, 0.149169921875, 0.5947265625, 1.040283203125, 1.48583984375, 1.931396484375, 2.376953125, 2.822509765625, 3.26806640625, 3.713623046875, 4.1591796875, 4.604736328125, 5.05029296875, 5.495849609375, 5.94140625, 6.386962890625, 6.83251953125, 7.278076171875, 7.7236328125, 8.169189453125, 8.61474609375, 9.060302734375, 9.505859375, 9.951416015625, 10.39697265625, 10.842529296875, 11.2880859375, 11.733642578125, 12.17919921875, 12.624755859375, 13.0703125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 20.0, 588.0, 399.0, 14.0], "bins": [-184.0859832763672, -181.1138916015625, -178.1417999267578, -175.16970825195312, -172.19761657714844, -169.22552490234375, -166.25343322753906, -163.28134155273438, -160.3092498779297, -157.337158203125, -154.3650665283203, -151.39297485351562, -148.42088317871094, -145.44879150390625, -142.47669982910156, -139.50460815429688, -136.53250122070312, -133.56040954589844, -130.58831787109375, -127.61622619628906, -124.64413452148438, -121.67204284667969, -118.699951171875, -115.72785186767578, -112.75576782226562, -109.78367614746094, -106.81158447265625, -103.83949279785156, -100.86740112304688, -97.89530944824219, -94.9232177734375, -91.95111846923828, -88.9790267944336, -86.0069351196289, -83.03484344482422, -80.06275177001953, -77.09066009521484, -74.11856079101562, -71.14646911621094, -68.17437744140625, -65.20228576660156, -62.230194091796875, -59.25810241699219, -56.2860107421875, -53.31391525268555, -50.34182357788086, -47.36973190307617, -44.39763641357422, -41.4255485534668, -38.45345687866211, -35.48136520385742, -32.50926971435547, -29.53717803955078, -26.565086364746094, -23.592994689941406, -20.620901107788086, -17.6488094329834, -14.676716804504395, -11.70462417602539, -8.732532501220703, -5.760439872741699, -2.7883472442626953, 0.1837444305419922, 3.1558380126953125, 6.127929210662842]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 12.0, 2.0, 14.0, 12.0, 11.0, 12.0, 14.0, 17.0, 25.0, 34.0, 35.0, 41.0, 32.0, 23.0, 35.0, 48.0, 39.0, 44.0, 34.0, 44.0, 41.0, 38.0, 43.0, 33.0, 35.0, 34.0, 30.0, 33.0, 27.0, 19.0, 20.0, 19.0, 11.0, 14.0, 12.0, 8.0, 8.0, 8.0, 10.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.396547317504883, -17.863195419311523, -17.329843521118164, -16.796491622924805, -16.263139724731445, -15.729787826538086, -15.196435928344727, -14.663084030151367, -14.129732131958008, -13.596380233764648, -13.063028335571289, -12.52967643737793, -11.99632453918457, -11.462972640991211, -10.929620742797852, -10.396268844604492, -9.86291790008545, -9.32956600189209, -8.79621410369873, -8.262862205505371, -7.729510307312012, -7.196158409118652, -6.662806987762451, -6.129455089569092, -5.596103191375732, -5.062751293182373, -4.529399394989014, -3.9960477352142334, -3.462695837020874, -2.9293439388275146, -2.3959922790527344, -1.862640380859375, -1.3292875289916992, -0.7959356904029846, -0.26258385181427, 0.2707679271697998, 0.8041198253631592, 1.3374717235565186, 1.8708233833312988, 2.404175281524658, 2.9375271797180176, 3.470879077911377, 4.004230976104736, 4.5375823974609375, 5.070934295654297, 5.604286193847656, 6.137638092041016, 6.670989990234375, 7.204341888427734, 7.737693786621094, 8.271045684814453, 8.804397583007812, 9.337749481201172, 9.871101379394531, 10.40445327758789, 10.93780517578125, 11.47115707397461, 12.004508972167969, 12.537860870361328, 13.071212768554688, 13.604564666748047, 14.137916564941406, 14.671268463134766, 15.204620361328125, 15.737971305847168]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 4.0, 11.0, 11.0, 9.0, 14.0, 15.0, 23.0, 28.0, 28.0, 35.0, 48.0, 43.0, 43.0, 48.0, 51.0, 46.0, 39.0, 64.0, 59.0, 48.0, 47.0, 35.0, 50.0, 25.0, 38.0, 23.0, 23.0, 17.0, 18.0, 10.0, 7.0, 13.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.580078125, -2.50921630859375, -2.4383544921875, -2.36749267578125, -2.296630859375, -2.22576904296875, -2.1549072265625, -2.08404541015625, -2.01318359375, -1.94232177734375, -1.8714599609375, -1.80059814453125, -1.729736328125, -1.65887451171875, -1.5880126953125, -1.51715087890625, -1.4462890625, -1.37542724609375, -1.3045654296875, -1.23370361328125, -1.162841796875, -1.09197998046875, -1.0211181640625, -0.95025634765625, -0.87939453125, -0.80853271484375, -0.7376708984375, -0.66680908203125, -0.595947265625, -0.52508544921875, -0.4542236328125, -0.38336181640625, -0.3125, -0.24163818359375, -0.1707763671875, -0.09991455078125, -0.029052734375, 0.04180908203125, 0.1126708984375, 0.18353271484375, 0.25439453125, 0.32525634765625, 0.3961181640625, 0.46697998046875, 0.537841796875, 0.60870361328125, 0.6795654296875, 0.75042724609375, 0.8212890625, 0.89215087890625, 0.9630126953125, 1.03387451171875, 1.104736328125, 1.17559814453125, 1.2464599609375, 1.31732177734375, 1.38818359375, 1.45904541015625, 1.5299072265625, 1.60076904296875, 1.671630859375, 1.74249267578125, 1.8133544921875, 1.88421630859375, 1.955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 7.0, 24.0, 21.0, 30.0, 45.0, 60.0, 79.0, 136.0, 194.0, 392.0, 575.0, 1015.0, 1901.0, 3472.0, 6757.0, 15029.0, 38874.0, 147989.0, 880100.0, 2235993.0, 678775.0, 119492.0, 35011.0, 13941.0, 6583.0, 3398.0, 1777.0, 1027.0, 579.0, 372.0, 224.0, 117.0, 93.0, 49.0, 35.0, 32.0, 17.0, 8.0, 10.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.65625, -3.54351806640625, -3.4307861328125, -3.31805419921875, -3.205322265625, -3.09259033203125, -2.9798583984375, -2.86712646484375, -2.75439453125, -2.64166259765625, -2.5289306640625, -2.41619873046875, -2.303466796875, -2.19073486328125, -2.0780029296875, -1.96527099609375, -1.8525390625, -1.73980712890625, -1.6270751953125, -1.51434326171875, -1.401611328125, -1.28887939453125, -1.1761474609375, -1.06341552734375, -0.95068359375, -0.83795166015625, -0.7252197265625, -0.61248779296875, -0.499755859375, -0.38702392578125, -0.2742919921875, -0.16156005859375, -0.048828125, 0.06390380859375, 0.1766357421875, 0.28936767578125, 0.402099609375, 0.51483154296875, 0.6275634765625, 0.74029541015625, 0.85302734375, 0.96575927734375, 1.0784912109375, 1.19122314453125, 1.303955078125, 1.41668701171875, 1.5294189453125, 1.64215087890625, 1.7548828125, 1.86761474609375, 1.9803466796875, 2.09307861328125, 2.205810546875, 2.31854248046875, 2.4312744140625, 2.54400634765625, 2.65673828125, 2.76947021484375, 2.8822021484375, 2.99493408203125, 3.107666015625, 3.22039794921875, 3.3331298828125, 3.44586181640625, 3.55859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 6.0, 11.0, 9.0, 10.0, 20.0, 28.0, 25.0, 43.0, 52.0, 69.0, 115.0, 188.0, 280.0, 477.0, 547.0, 671.0, 466.0, 345.0, 228.0, 145.0, 110.0, 67.0, 51.0, 37.0, 18.0, 19.0, 9.0, 6.0, 8.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.09002685546875, -4.9495849609375, -4.80914306640625, -4.668701171875, -4.52825927734375, -4.3878173828125, -4.24737548828125, -4.10693359375, -3.96649169921875, -3.8260498046875, -3.68560791015625, -3.545166015625, -3.40472412109375, -3.2642822265625, -3.12384033203125, -2.9833984375, -2.84295654296875, -2.7025146484375, -2.56207275390625, -2.421630859375, -2.28118896484375, -2.1407470703125, -2.00030517578125, -1.85986328125, -1.71942138671875, -1.5789794921875, -1.43853759765625, -1.298095703125, -1.15765380859375, -1.0172119140625, -0.87677001953125, -0.736328125, -0.59588623046875, -0.4554443359375, -0.31500244140625, -0.174560546875, -0.03411865234375, 0.1063232421875, 0.24676513671875, 0.38720703125, 0.52764892578125, 0.6680908203125, 0.80853271484375, 0.948974609375, 1.08941650390625, 1.2298583984375, 1.37030029296875, 1.5107421875, 1.65118408203125, 1.7916259765625, 1.93206787109375, 2.072509765625, 2.21295166015625, 2.3533935546875, 2.49383544921875, 2.63427734375, 2.77471923828125, 2.9151611328125, 3.05560302734375, 3.196044921875, 3.33648681640625, 3.4769287109375, 3.61737060546875, 3.7578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 3.0, 7.0, 9.0, 14.0, 18.0, 35.0, 52.0, 85.0, 131.0, 243.0, 410.0, 985.0, 3506.0, 39736.0, 3447626.0, 682043.0, 15607.0, 2217.0, 713.0, 358.0, 184.0, 79.0, 62.0, 43.0, 27.0, 26.0, 15.0, 10.0, 17.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.0345458984375, -12.530029296875, -12.0255126953125, -11.52099609375, -11.0164794921875, -10.511962890625, -10.0074462890625, -9.5029296875, -8.9984130859375, -8.493896484375, -7.9893798828125, -7.48486328125, -6.9803466796875, -6.475830078125, -5.9713134765625, -5.466796875, -4.9622802734375, -4.457763671875, -3.9532470703125, -3.44873046875, -2.9442138671875, -2.439697265625, -1.9351806640625, -1.4306640625, -0.9261474609375, -0.421630859375, 0.0828857421875, 0.58740234375, 1.0919189453125, 1.596435546875, 2.1009521484375, 2.60546875, 3.1099853515625, 3.614501953125, 4.1190185546875, 4.62353515625, 5.1280517578125, 5.632568359375, 6.1370849609375, 6.6416015625, 7.1461181640625, 7.650634765625, 8.1551513671875, 8.65966796875, 9.1641845703125, 9.668701171875, 10.1732177734375, 10.677734375, 11.1822509765625, 11.686767578125, 12.1912841796875, 12.69580078125, 13.2003173828125, 13.704833984375, 14.2093505859375, 14.7138671875, 15.2183837890625, 15.722900390625, 16.2274169921875, 16.73193359375, 17.2364501953125, 17.740966796875, 18.2454833984375, 18.75]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 134.0, 505.0, 309.0, 49.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.03105926513672, -70.08778381347656, -67.1445083618164, -64.20122528076172, -61.25794982910156, -58.314674377441406, -55.37139892578125, -52.42811965942383, -49.484840393066406, -46.54156494140625, -43.59828567504883, -40.65501022338867, -37.71173095703125, -34.768455505371094, -31.825178146362305, -28.881900787353516, -25.93862533569336, -22.99534797668457, -20.05207061767578, -17.108795166015625, -14.16551685333252, -11.22223949432373, -8.278963088989258, -5.335685729980469, -2.3924083709716797, 0.5508687496185303, 3.4941458702087402, 6.437422752380371, 9.38070011138916, 12.32397747039795, 15.267253875732422, 18.21053123474121, 21.15380859375, 24.09708595275879, 27.040363311767578, 29.983638763427734, 32.926918029785156, 35.87019348144531, 38.81346893310547, 41.75674819946289, 44.70002746582031, 47.64330291748047, 50.58658218383789, 53.52985763549805, 56.47313690185547, 59.416412353515625, 62.35968780517578, 65.30296325683594, 68.24624633789062, 71.18952178955078, 74.13279724121094, 77.07608032226562, 80.01935577392578, 82.96263122558594, 85.9059066772461, 88.84918212890625, 91.7924575805664, 94.73573303222656, 97.67900848388672, 100.6222915649414, 103.56556701660156, 106.50884246826172, 109.45211791992188, 112.39540100097656, 115.33867645263672]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 11.0, 15.0, 20.0, 28.0, 24.0, 24.0, 31.0, 36.0, 36.0, 48.0, 40.0, 44.0, 56.0, 54.0, 45.0, 44.0, 50.0, 47.0, 35.0, 39.0, 28.0, 33.0, 25.0, 21.0, 22.0, 20.0, 25.0, 19.0, 14.0, 7.0, 5.0, 6.0, 9.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.346147537231445, -13.881064414978027, -13.415982246398926, -12.950899124145508, -12.485816955566406, -12.020733833312988, -11.55565071105957, -11.090568542480469, -10.62548542022705, -10.160402297973633, -9.695320129394531, -9.230237007141113, -8.765154838562012, -8.300071716308594, -7.834989070892334, -7.369906425476074, -6.9048237800598145, -6.439741134643555, -5.974658489227295, -5.509575843811035, -5.044492721557617, -4.579410076141357, -4.114327430725098, -3.649244546890259, -3.184161901473999, -2.7190792560577393, -2.2539963722229004, -1.7889137268066406, -1.3238309621810913, -0.858748197555542, -0.3936655521392822, 0.07141733169555664, 0.5364999771118164, 1.0015827417373657, 1.466665506362915, 1.9317481517791748, 2.3968310356140137, 2.8619136810302734, 3.326996326446533, 3.792079210281372, 4.257162094116211, 4.722244739532471, 5.1873273849487305, 5.652410507202148, 6.117493152618408, 6.582575798034668, 7.047658443450928, 7.5127410888671875, 7.977823734283447, 8.442906379699707, 8.907989501953125, 9.373071670532227, 9.838154792785645, 10.303237915039062, 10.768320083618164, 11.233403205871582, 11.698485374450684, 12.163568496704102, 12.628650665283203, 13.093733787536621, 13.558815956115723, 14.02389907836914, 14.488981246948242, 14.95406436920166, 15.419147491455078]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 3.0, 11.0, 10.0, 19.0, 23.0, 24.0, 28.0, 32.0, 43.0, 34.0, 31.0, 55.0, 57.0, 45.0, 45.0, 48.0, 45.0, 53.0, 52.0, 42.0, 45.0, 44.0, 38.0, 32.0, 18.0, 21.0, 20.0, 19.0, 15.0, 12.0, 3.0, 9.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.283203125, -2.2167510986328125, -2.150299072265625, -2.0838470458984375, -2.01739501953125, -1.9509429931640625, -1.884490966796875, -1.8180389404296875, -1.7515869140625, -1.6851348876953125, -1.618682861328125, -1.5522308349609375, -1.48577880859375, -1.4193267822265625, -1.352874755859375, -1.2864227294921875, -1.219970703125, -1.1535186767578125, -1.087066650390625, -1.0206146240234375, -0.95416259765625, -0.8877105712890625, -0.821258544921875, -0.7548065185546875, -0.6883544921875, -0.6219024658203125, -0.555450439453125, -0.4889984130859375, -0.42254638671875, -0.3560943603515625, -0.289642333984375, -0.2231903076171875, -0.15673828125, -0.0902862548828125, -0.023834228515625, 0.0426177978515625, 0.10906982421875, 0.1755218505859375, 0.241973876953125, 0.3084259033203125, 0.3748779296875, 0.4413299560546875, 0.507781982421875, 0.5742340087890625, 0.64068603515625, 0.7071380615234375, 0.773590087890625, 0.8400421142578125, 0.906494140625, 0.9729461669921875, 1.039398193359375, 1.1058502197265625, 1.17230224609375, 1.2387542724609375, 1.305206298828125, 1.3716583251953125, 1.4381103515625, 1.5045623779296875, 1.571014404296875, 1.6374664306640625, 1.70391845703125, 1.7703704833984375, 1.836822509765625, 1.9032745361328125, 1.9697265625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 14.0, 24.0, 20.0, 48.0, 68.0, 95.0, 164.0, 252.0, 341.0, 566.0, 1047.0, 1789.0, 3448.0, 7591.0, 18301.0, 49854.0, 140064.0, 307045.0, 300560.0, 135612.0, 48695.0, 17853.0, 7414.0, 3364.0, 1691.0, 989.0, 614.0, 362.0, 233.0, 139.0, 101.0, 74.0, 42.0, 20.0, 14.0, 14.0, 11.0, 9.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330078125, -0.806121826171875, -0.77923583984375, -0.752349853515625, -0.7254638671875, -0.698577880859375, -0.67169189453125, -0.644805908203125, -0.617919921875, -0.591033935546875, -0.56414794921875, -0.537261962890625, -0.5103759765625, -0.483489990234375, -0.45660400390625, -0.429718017578125, -0.40283203125, -0.375946044921875, -0.34906005859375, -0.322174072265625, -0.2952880859375, -0.268402099609375, -0.24151611328125, -0.214630126953125, -0.187744140625, -0.160858154296875, -0.13397216796875, -0.107086181640625, -0.0802001953125, -0.053314208984375, -0.02642822265625, 0.000457763671875, 0.02734375, 0.054229736328125, 0.08111572265625, 0.108001708984375, 0.1348876953125, 0.161773681640625, 0.18865966796875, 0.215545654296875, 0.242431640625, 0.269317626953125, 0.29620361328125, 0.323089599609375, 0.3499755859375, 0.376861572265625, 0.40374755859375, 0.430633544921875, 0.45751953125, 0.484405517578125, 0.51129150390625, 0.538177490234375, 0.5650634765625, 0.591949462890625, 0.61883544921875, 0.645721435546875, 0.672607421875, 0.699493408203125, 0.72637939453125, 0.753265380859375, 0.7801513671875, 0.807037353515625, 0.83392333984375, 0.860809326171875, 0.8876953125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 6.0, 14.0, 9.0, 12.0, 16.0, 24.0, 11.0, 22.0, 25.0, 24.0, 24.0, 35.0, 34.0, 25.0, 25.0, 35.0, 36.0, 36.0, 17.0, 1068.0, 30.0, 42.0, 32.0, 25.0, 30.0, 29.0, 32.0, 36.0, 34.0, 27.0, 24.0, 13.0, 20.0, 22.0, 11.0, 12.0, 9.0, 7.0, 14.0, 10.0, 12.0, 9.0, 9.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.1884765625, -1.15313720703125, -1.1177978515625, -1.08245849609375, -1.047119140625, -1.01177978515625, -0.9764404296875, -0.94110107421875, -0.90576171875, -0.87042236328125, -0.8350830078125, -0.79974365234375, -0.764404296875, -0.72906494140625, -0.6937255859375, -0.65838623046875, -0.623046875, -0.58770751953125, -0.5523681640625, -0.51702880859375, -0.481689453125, -0.44635009765625, -0.4110107421875, -0.37567138671875, -0.34033203125, -0.30499267578125, -0.2696533203125, -0.23431396484375, -0.198974609375, -0.16363525390625, -0.1282958984375, -0.09295654296875, -0.0576171875, -0.02227783203125, 0.0130615234375, 0.04840087890625, 0.083740234375, 0.11907958984375, 0.1544189453125, 0.18975830078125, 0.22509765625, 0.26043701171875, 0.2957763671875, 0.33111572265625, 0.366455078125, 0.40179443359375, 0.4371337890625, 0.47247314453125, 0.5078125, 0.54315185546875, 0.5784912109375, 0.61383056640625, 0.649169921875, 0.68450927734375, 0.7198486328125, 0.75518798828125, 0.79052734375, 0.82586669921875, 0.8612060546875, 0.89654541015625, 0.931884765625, 0.96722412109375, 1.0025634765625, 1.03790283203125, 1.0732421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 16.0, 23.0, 38.0, 63.0, 95.0, 161.0, 203.0, 404.0, 678.0, 1194.0, 2089.0, 3746.0, 7316.0, 14046.0, 29670.0, 134407.0, 1742614.0, 105161.0, 27167.0, 12794.0, 6796.0, 3613.0, 2006.0, 1138.0, 666.0, 375.0, 241.0, 157.0, 75.0, 59.0, 39.0, 17.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.99658203125, -0.9684677124023438, -0.9403533935546875, -0.9122390747070312, -0.884124755859375, -0.8560104370117188, -0.8278961181640625, -0.7997817993164062, -0.77166748046875, -0.7435531616210938, -0.7154388427734375, -0.6873245239257812, -0.659210205078125, -0.6310958862304688, -0.6029815673828125, -0.5748672485351562, -0.5467529296875, -0.5186386108398438, -0.4905242919921875, -0.46240997314453125, -0.434295654296875, -0.40618133544921875, -0.3780670166015625, -0.34995269775390625, -0.32183837890625, -0.29372406005859375, -0.2656097412109375, -0.23749542236328125, -0.209381103515625, -0.18126678466796875, -0.1531524658203125, -0.12503814697265625, -0.096923828125, -0.06880950927734375, -0.0406951904296875, -0.01258087158203125, 0.015533447265625, 0.04364776611328125, 0.0717620849609375, 0.09987640380859375, 0.12799072265625, 0.15610504150390625, 0.1842193603515625, 0.21233367919921875, 0.240447998046875, 0.26856231689453125, 0.2966766357421875, 0.32479095458984375, 0.3529052734375, 0.38101959228515625, 0.4091339111328125, 0.43724822998046875, 0.465362548828125, 0.49347686767578125, 0.5215911865234375, 0.5497055053710938, 0.57781982421875, 0.6059341430664062, 0.6340484619140625, 0.6621627807617188, 0.690277099609375, 0.7183914184570312, 0.7465057373046875, 0.7746200561523438, 0.802734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 7.0, 16.0, 13.0, 22.0, 19.0, 35.0, 37.0, 54.0, 70.0, 87.0, 108.0, 105.0, 73.0, 69.0, 53.0, 47.0, 38.0, 26.0, 12.0, 18.0, 21.0, 8.0, 14.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06060791015625, -0.058670997619628906, -0.05673408508300781, -0.05479717254638672, -0.052860260009765625, -0.05092334747314453, -0.04898643493652344, -0.047049522399902344, -0.04511260986328125, -0.043175697326660156, -0.04123878479003906, -0.03930187225341797, -0.037364959716796875, -0.03542804718017578, -0.03349113464355469, -0.031554222106933594, -0.0296173095703125, -0.027680397033691406, -0.025743484497070312, -0.02380657196044922, -0.021869659423828125, -0.01993274688720703, -0.017995834350585938, -0.016058921813964844, -0.01412200927734375, -0.012185096740722656, -0.010248184204101562, -0.008311271667480469, -0.006374359130859375, -0.004437446594238281, -0.0025005340576171875, -0.0005636215209960938, 0.001373291015625, 0.0033102035522460938, 0.0052471160888671875, 0.007184028625488281, 0.009120941162109375, 0.011057853698730469, 0.012994766235351562, 0.014931678771972656, 0.01686859130859375, 0.018805503845214844, 0.020742416381835938, 0.02267932891845703, 0.024616241455078125, 0.02655315399169922, 0.028490066528320312, 0.030426979064941406, 0.0323638916015625, 0.034300804138183594, 0.03623771667480469, 0.03817462921142578, 0.040111541748046875, 0.04204845428466797, 0.04398536682128906, 0.045922279357910156, 0.04785919189453125, 0.049796104431152344, 0.05173301696777344, 0.05366992950439453, 0.055606842041015625, 0.05754375457763672, 0.05948066711425781, 0.061417579650878906, 0.0633544921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 16.0, 10.0, 19.0, 23.0, 33.0, 35.0, 63.0, 106.0, 163.0, 329.0, 2081.0, 966864.0, 77434.0, 701.0, 247.0, 141.0, 85.0, 46.0, 36.0, 23.0, 21.0, 20.0, 17.0, 5.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3475799560546875, -1.306488037109375, -1.2653961181640625, -1.22430419921875, -1.1832122802734375, -1.142120361328125, -1.1010284423828125, -1.0599365234375, -1.0188446044921875, -0.977752685546875, -0.9366607666015625, -0.89556884765625, -0.8544769287109375, -0.813385009765625, -0.7722930908203125, -0.731201171875, -0.6901092529296875, -0.649017333984375, -0.6079254150390625, -0.56683349609375, -0.5257415771484375, -0.484649658203125, -0.4435577392578125, -0.4024658203125, -0.3613739013671875, -0.320281982421875, -0.2791900634765625, -0.23809814453125, -0.1970062255859375, -0.155914306640625, -0.1148223876953125, -0.07373046875, -0.0326385498046875, 0.008453369140625, 0.0495452880859375, 0.09063720703125, 0.1317291259765625, 0.172821044921875, 0.2139129638671875, 0.2550048828125, 0.2960968017578125, 0.337188720703125, 0.3782806396484375, 0.41937255859375, 0.4604644775390625, 0.501556396484375, 0.5426483154296875, 0.583740234375, 0.6248321533203125, 0.665924072265625, 0.7070159912109375, 0.74810791015625, 0.7891998291015625, 0.830291748046875, 0.8713836669921875, 0.9124755859375, 0.9535675048828125, 0.994659423828125, 1.0357513427734375, 1.07684326171875, 1.1179351806640625, 1.159027099609375, 1.2001190185546875, 1.2412109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 15.0, 37.0, 90.0, 247.0, 337.0, 162.0, 77.0, 25.0, 12.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5141112804412842, -0.5040780901908875, -0.49404487013816833, -0.4840116798877716, -0.4739784598350525, -0.46394526958465576, -0.45391207933425903, -0.4438788592815399, -0.4338456690311432, -0.42381247878074646, -0.41377925872802734, -0.4037460684776306, -0.3937128484249115, -0.38367965817451477, -0.37364643812179565, -0.3636132478713989, -0.3535800576210022, -0.34354686737060547, -0.33351364731788635, -0.3234804570674896, -0.3134472370147705, -0.3034140467643738, -0.29338085651397705, -0.28334763646125793, -0.2733144164085388, -0.2632812261581421, -0.253248006105423, -0.24321481585502625, -0.23318161070346832, -0.2231484055519104, -0.21311520040035248, -0.20308199524879456, -0.19304880499839783, -0.1830155998468399, -0.17298239469528198, -0.16294920444488525, -0.15291599929332733, -0.1428827941417694, -0.1328495889902115, -0.12281639128923416, -0.11278318613767624, -0.10274998098611832, -0.09271678328514099, -0.08268357813358307, -0.07265037298202515, -0.06261717528104782, -0.0525839701294899, -0.04255077242851257, -0.03251756727695465, -0.022484365850687027, -0.012451162561774254, -0.0024179592728614807, 0.007615242153406143, 0.017648443579673767, 0.02768164873123169, 0.037714846432209015, 0.04774805158376694, 0.05778125301003456, 0.06781445443630219, 0.07784765958786011, 0.08788086473941803, 0.09791406244039536, 0.10794726759195328, 0.1179804652929306, 0.12801367044448853]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 8.0, 19.0, 13.0, 20.0, 25.0, 23.0, 26.0, 27.0, 23.0, 37.0, 41.0, 40.0, 26.0, 35.0, 39.0, 39.0, 44.0, 43.0, 39.0, 32.0, 33.0, 54.0, 39.0, 35.0, 25.0, 29.0, 25.0, 19.0, 16.0, 14.0, 18.0, 15.0, 9.0, 10.0, 16.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08822470903396606, -0.08505868911743164, -0.08189266920089722, -0.0787266418337822, -0.07556062191724777, -0.07239460200071335, -0.06922857463359833, -0.0660625547170639, -0.06289653480052948, -0.059730514883995056, -0.056564491242170334, -0.05339846760034561, -0.05023244768381119, -0.047066427767276764, -0.04390040412545204, -0.04073438048362732, -0.037568360567092896, -0.03440234065055847, -0.03123631700873375, -0.028070295229554176, -0.024904273450374603, -0.02173825167119503, -0.018572229892015457, -0.015406208112835884, -0.012240186333656311, -0.009074164554476738, -0.005908142775297165, -0.002742120996117592, 0.0004239007830619812, 0.0035899225622415543, 0.006755944341421127, 0.0099219661206007, 0.013087987899780273, 0.016254009678959846, 0.01942003145813942, 0.022586053237318993, 0.025752075016498566, 0.02891809679567814, 0.03208411857485771, 0.035250142216682434, 0.03841616213321686, 0.04158218204975128, 0.044748205691576004, 0.047914229333400726, 0.05108024924993515, 0.054246269166469574, 0.057412292808294296, 0.06057831645011902, 0.06374433636665344, 0.06691035628318787, 0.07007637619972229, 0.07324240356683731, 0.07640842348337173, 0.07957444339990616, 0.08274047076702118, 0.0859064906835556, 0.08907251060009003, 0.09223853051662445, 0.09540455043315887, 0.0985705778002739, 0.10173659771680832, 0.10490261763334274, 0.10806864500045776, 0.11123466491699219, 0.11440068483352661]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 9.0, 17.0, 10.0, 21.0, 31.0, 35.0, 35.0, 34.0, 42.0, 47.0, 54.0, 44.0, 44.0, 57.0, 38.0, 34.0, 49.0, 39.0, 55.0, 49.0, 50.0, 38.0, 25.0, 20.0, 19.0, 19.0, 16.0, 11.0, 12.0, 8.0, 4.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.189453125, -2.125579833984375, -2.06170654296875, -1.997833251953125, -1.9339599609375, -1.870086669921875, -1.80621337890625, -1.742340087890625, -1.678466796875, -1.614593505859375, -1.55072021484375, -1.486846923828125, -1.4229736328125, -1.359100341796875, -1.29522705078125, -1.231353759765625, -1.16748046875, -1.103607177734375, -1.03973388671875, -0.975860595703125, -0.9119873046875, -0.848114013671875, -0.78424072265625, -0.720367431640625, -0.656494140625, -0.592620849609375, -0.52874755859375, -0.464874267578125, -0.4010009765625, -0.337127685546875, -0.27325439453125, -0.209381103515625, -0.1455078125, -0.081634521484375, -0.01776123046875, 0.046112060546875, 0.1099853515625, 0.173858642578125, 0.23773193359375, 0.301605224609375, 0.365478515625, 0.429351806640625, 0.49322509765625, 0.557098388671875, 0.6209716796875, 0.684844970703125, 0.74871826171875, 0.812591552734375, 0.87646484375, 0.940338134765625, 1.00421142578125, 1.068084716796875, 1.1319580078125, 1.195831298828125, 1.25970458984375, 1.323577880859375, 1.387451171875, 1.451324462890625, 1.51519775390625, 1.579071044921875, 1.6429443359375, 1.706817626953125, 1.77069091796875, 1.834564208984375, 1.8984375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 13.0, 16.0, 20.0, 38.0, 57.0, 68.0, 124.0, 158.0, 240.0, 370.0, 619.0, 971.0, 1536.0, 2674.0, 4809.0, 9218.0, 20206.0, 51054.0, 154082.0, 401034.0, 259309.0, 83534.0, 30287.0, 12912.0, 6345.0, 3508.0, 1998.0, 1174.0, 790.0, 467.0, 299.0, 204.0, 125.0, 91.0, 61.0, 43.0, 23.0, 15.0, 15.0, 9.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6328125, -2.549835205078125, -2.46685791015625, -2.383880615234375, -2.3009033203125, -2.217926025390625, -2.13494873046875, -2.051971435546875, -1.968994140625, -1.886016845703125, -1.80303955078125, -1.720062255859375, -1.6370849609375, -1.554107666015625, -1.47113037109375, -1.388153076171875, -1.30517578125, -1.222198486328125, -1.13922119140625, -1.056243896484375, -0.9732666015625, -0.890289306640625, -0.80731201171875, -0.724334716796875, -0.641357421875, -0.558380126953125, -0.47540283203125, -0.392425537109375, -0.3094482421875, -0.226470947265625, -0.14349365234375, -0.060516357421875, 0.0224609375, 0.105438232421875, 0.18841552734375, 0.271392822265625, 0.3543701171875, 0.437347412109375, 0.52032470703125, 0.603302001953125, 0.686279296875, 0.769256591796875, 0.85223388671875, 0.935211181640625, 1.0181884765625, 1.101165771484375, 1.18414306640625, 1.267120361328125, 1.35009765625, 1.433074951171875, 1.51605224609375, 1.599029541015625, 1.6820068359375, 1.764984130859375, 1.84796142578125, 1.930938720703125, 2.013916015625, 2.096893310546875, 2.17987060546875, 2.262847900390625, 2.3458251953125, 2.428802490234375, 2.51177978515625, 2.594757080078125, 2.677734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 10.0, 9.0, 7.0, 17.0, 16.0, 15.0, 20.0, 24.0, 12.0, 24.0, 21.0, 32.0, 39.0, 42.0, 42.0, 56.0, 91.0, 178.0, 875.0, 840.0, 152.0, 87.0, 47.0, 47.0, 34.0, 36.0, 35.0, 40.0, 17.0, 34.0, 26.0, 19.0, 20.0, 14.0, 17.0, 12.0, 4.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.927734375, -4.7578125, -4.587890625, -4.41796875, -4.248046875, -4.078125, -3.908203125, -3.73828125, -3.568359375, -3.3984375, -3.228515625, -3.05859375, -2.888671875, -2.71875, -2.548828125, -2.37890625, -2.208984375, -2.0390625, -1.869140625, -1.69921875, -1.529296875, -1.359375, -1.189453125, -1.01953125, -0.849609375, -0.6796875, -0.509765625, -0.33984375, -0.169921875, 0.0, 0.169921875, 0.33984375, 0.509765625, 0.6796875, 0.849609375, 1.01953125, 1.189453125, 1.359375, 1.529296875, 1.69921875, 1.869140625, 2.0390625, 2.208984375, 2.37890625, 2.548828125, 2.71875, 2.888671875, 3.05859375, 3.228515625, 3.3984375, 3.568359375, 3.73828125, 3.908203125, 4.078125, 4.248046875, 4.41796875, 4.587890625, 4.7578125, 4.927734375, 5.09765625, 5.267578125, 5.4375, 5.607421875, 5.77734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 5.0, 11.0, 15.0, 14.0, 26.0, 38.0, 32.0, 50.0, 67.0, 94.0, 125.0, 264.0, 567.0, 1641.0, 5423.0, 25714.0, 535481.0, 2501181.0, 61390.0, 9334.0, 2476.0, 842.0, 369.0, 164.0, 92.0, 67.0, 39.0, 40.0, 28.0, 20.0, 16.0, 19.0, 18.0, 13.0, 3.0, 8.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3560791015625, -8.079345703125, -7.8026123046875, -7.52587890625, -7.2491455078125, -6.972412109375, -6.6956787109375, -6.4189453125, -6.1422119140625, -5.865478515625, -5.5887451171875, -5.31201171875, -5.0352783203125, -4.758544921875, -4.4818115234375, -4.205078125, -3.9283447265625, -3.651611328125, -3.3748779296875, -3.09814453125, -2.8214111328125, -2.544677734375, -2.2679443359375, -1.9912109375, -1.7144775390625, -1.437744140625, -1.1610107421875, -0.88427734375, -0.6075439453125, -0.330810546875, -0.0540771484375, 0.22265625, 0.4993896484375, 0.776123046875, 1.0528564453125, 1.32958984375, 1.6063232421875, 1.883056640625, 2.1597900390625, 2.4365234375, 2.7132568359375, 2.989990234375, 3.2667236328125, 3.54345703125, 3.8201904296875, 4.096923828125, 4.3736572265625, 4.650390625, 4.9271240234375, 5.203857421875, 5.4805908203125, 5.75732421875, 6.0340576171875, 6.310791015625, 6.5875244140625, 6.8642578125, 7.1409912109375, 7.417724609375, 7.6944580078125, 7.97119140625, 8.2479248046875, 8.524658203125, 8.8013916015625, 9.078125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 43.0, 935.0, 38.0, 2.0], "bins": [-259.7878112792969, -255.5616455078125, -251.33547973632812, -247.10931396484375, -242.88314819335938, -238.65699768066406, -234.4308319091797, -230.2046661376953, -225.97850036621094, -221.75233459472656, -217.5261688232422, -213.3000030517578, -209.0738525390625, -204.84768676757812, -200.62152099609375, -196.39535522460938, -192.169189453125, -187.94302368164062, -183.71685791015625, -179.49069213867188, -175.2645263671875, -171.0383758544922, -166.8122100830078, -162.58604431152344, -158.35987854003906, -154.1337127685547, -149.9075469970703, -145.68138122558594, -141.45523071289062, -137.22906494140625, -133.00289916992188, -128.7767333984375, -124.55058288574219, -120.32441711425781, -116.09825134277344, -111.8720932006836, -107.64592742919922, -103.41976165771484, -99.193603515625, -94.96743774414062, -90.74127197265625, -86.51510620117188, -82.2889404296875, -78.06278228759766, -73.83661651611328, -69.6104507446289, -65.38429260253906, -61.15812683105469, -56.93195724487305, -52.70579528808594, -48.47962951660156, -44.25346374511719, -40.02730178833008, -35.80113983154297, -31.574974060058594, -27.34881019592285, -23.12264633178711, -18.896482467651367, -14.670318603515625, -10.444154739379883, -6.217990875244141, -1.9918270111083984, 2.2343368530273438, 6.460500717163086, 10.686663627624512]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 10.0, 10.0, 13.0, 9.0, 15.0, 19.0, 16.0, 25.0, 19.0, 36.0, 28.0, 34.0, 28.0, 39.0, 37.0, 35.0, 40.0, 30.0, 29.0, 31.0, 43.0, 38.0, 35.0, 39.0, 26.0, 27.0, 30.0, 26.0, 25.0, 27.0, 24.0, 13.0, 23.0, 19.0, 15.0, 11.0, 9.0, 3.0, 15.0, 6.0, 8.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.471179962158203, -13.046581268310547, -12.621981620788574, -12.197382926940918, -11.772784233093262, -11.348184585571289, -10.923585891723633, -10.498987197875977, -10.07438850402832, -9.649789810180664, -9.225190162658691, -8.800591468811035, -8.375992774963379, -7.9513936042785645, -7.52679443359375, -7.102195739746094, -6.677596092224121, -6.252996921539307, -5.82839822769165, -5.403799057006836, -4.97920036315918, -4.554601192474365, -4.130002021789551, -3.7054030895233154, -3.28080415725708, -2.8562052249908447, -2.4316062927246094, -2.007007122039795, -1.5824081897735596, -1.1578092575073242, -0.7332100868225098, -0.3086111545562744, 0.11598682403564453, 0.5405858159065247, 0.9651848077774048, 1.3897838592529297, 1.814382791519165, 2.2389817237854004, 2.663580894470215, 3.08817982673645, 3.5127787590026855, 3.937377691268921, 4.361976623535156, 4.786575794219971, 5.211174964904785, 5.635773658752441, 6.060372829437256, 6.48497200012207, 6.909570693969727, 7.334169864654541, 7.758768558502197, 8.183367729187012, 8.607966423034668, 9.03256607055664, 9.457164764404297, 9.881763458251953, 10.30636215209961, 10.730960845947266, 11.155560493469238, 11.580159187316895, 12.00475788116455, 12.429357528686523, 12.85395622253418, 13.278554916381836, 13.703154563903809]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 8.0, 4.0, 18.0, 18.0, 18.0, 29.0, 40.0, 38.0, 40.0, 44.0, 49.0, 51.0, 50.0, 46.0, 44.0, 50.0, 52.0, 48.0, 40.0, 39.0, 38.0, 47.0, 35.0, 33.0, 26.0, 13.0, 16.0, 10.0, 13.0, 5.0, 5.0, 5.0, 8.0, 3.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.5384674072265625, -2.467559814453125, -2.3966522216796875, -2.32574462890625, -2.2548370361328125, -2.183929443359375, -2.1130218505859375, -2.0421142578125, -1.9712066650390625, -1.900299072265625, -1.8293914794921875, -1.75848388671875, -1.6875762939453125, -1.616668701171875, -1.5457611083984375, -1.474853515625, -1.4039459228515625, -1.333038330078125, -1.2621307373046875, -1.19122314453125, -1.1203155517578125, -1.049407958984375, -0.9785003662109375, -0.9075927734375, -0.8366851806640625, -0.765777587890625, -0.6948699951171875, -0.62396240234375, -0.5530548095703125, -0.482147216796875, -0.4112396240234375, -0.34033203125, -0.2694244384765625, -0.198516845703125, -0.1276092529296875, -0.05670166015625, 0.0142059326171875, 0.085113525390625, 0.1560211181640625, 0.2269287109375, 0.2978363037109375, 0.368743896484375, 0.4396514892578125, 0.51055908203125, 0.5814666748046875, 0.652374267578125, 0.7232818603515625, 0.794189453125, 0.8650970458984375, 0.936004638671875, 1.0069122314453125, 1.07781982421875, 1.1487274169921875, 1.219635009765625, 1.2905426025390625, 1.3614501953125, 1.4323577880859375, 1.503265380859375, 1.5741729736328125, 1.64508056640625, 1.7159881591796875, 1.786895751953125, 1.8578033447265625, 1.9287109375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 12.0, 24.0, 33.0, 39.0, 54.0, 111.0, 177.0, 303.0, 481.0, 947.0, 1885.0, 4012.0, 9456.0, 26780.0, 122000.0, 1294368.0, 2421550.0, 247331.0, 41499.0, 13088.0, 5182.0, 2339.0, 1156.0, 594.0, 331.0, 198.0, 104.0, 63.0, 45.0, 32.0, 22.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.9415283203125, -4.801025390625, -4.6605224609375, -4.52001953125, -4.3795166015625, -4.239013671875, -4.0985107421875, -3.9580078125, -3.8175048828125, -3.677001953125, -3.5364990234375, -3.39599609375, -3.2554931640625, -3.114990234375, -2.9744873046875, -2.833984375, -2.6934814453125, -2.552978515625, -2.4124755859375, -2.27197265625, -2.1314697265625, -1.990966796875, -1.8504638671875, -1.7099609375, -1.5694580078125, -1.428955078125, -1.2884521484375, -1.14794921875, -1.0074462890625, -0.866943359375, -0.7264404296875, -0.5859375, -0.4454345703125, -0.304931640625, -0.1644287109375, -0.02392578125, 0.1165771484375, 0.257080078125, 0.3975830078125, 0.5380859375, 0.6785888671875, 0.819091796875, 0.9595947265625, 1.10009765625, 1.2406005859375, 1.381103515625, 1.5216064453125, 1.662109375, 1.8026123046875, 1.943115234375, 2.0836181640625, 2.22412109375, 2.3646240234375, 2.505126953125, 2.6456298828125, 2.7861328125, 2.9266357421875, 3.067138671875, 3.2076416015625, 3.34814453125, 3.4886474609375, 3.629150390625, 3.7696533203125, 3.91015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 20.0, 22.0, 25.0, 30.0, 35.0, 46.0, 64.0, 82.0, 105.0, 150.0, 215.0, 311.0, 373.0, 505.0, 463.0, 390.0, 318.0, 212.0, 164.0, 114.0, 95.0, 49.0, 46.0, 29.0, 32.0, 32.0, 18.0, 19.0, 13.0, 11.0, 8.0, 10.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.307342529296875, -2.21820068359375, -2.129058837890625, -2.0399169921875, -1.950775146484375, -1.86163330078125, -1.772491455078125, -1.683349609375, -1.594207763671875, -1.50506591796875, -1.415924072265625, -1.3267822265625, -1.237640380859375, -1.14849853515625, -1.059356689453125, -0.97021484375, -0.881072998046875, -0.79193115234375, -0.702789306640625, -0.6136474609375, -0.524505615234375, -0.43536376953125, -0.346221923828125, -0.257080078125, -0.167938232421875, -0.07879638671875, 0.010345458984375, 0.0994873046875, 0.188629150390625, 0.27777099609375, 0.366912841796875, 0.4560546875, 0.545196533203125, 0.63433837890625, 0.723480224609375, 0.8126220703125, 0.901763916015625, 0.99090576171875, 1.080047607421875, 1.169189453125, 1.258331298828125, 1.34747314453125, 1.436614990234375, 1.5257568359375, 1.614898681640625, 1.70404052734375, 1.793182373046875, 1.88232421875, 1.971466064453125, 2.06060791015625, 2.149749755859375, 2.2388916015625, 2.328033447265625, 2.41717529296875, 2.506317138671875, 2.595458984375, 2.684600830078125, 2.77374267578125, 2.862884521484375, 2.9520263671875, 3.041168212890625, 3.13031005859375, 3.219451904296875, 3.30859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 11.0, 9.0, 14.0, 10.0, 17.0, 22.0, 27.0, 37.0, 49.0, 56.0, 97.0, 145.0, 214.0, 413.0, 1068.0, 3922.0, 21481.0, 261723.0, 3660902.0, 219109.0, 19495.0, 3491.0, 933.0, 391.0, 196.0, 117.0, 83.0, 71.0, 31.0, 39.0, 28.0, 18.0, 11.0, 6.0, 7.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0], "bins": [-12.3046875, -11.976318359375, -11.64794921875, -11.319580078125, -10.9912109375, -10.662841796875, -10.33447265625, -10.006103515625, -9.677734375, -9.349365234375, -9.02099609375, -8.692626953125, -8.3642578125, -8.035888671875, -7.70751953125, -7.379150390625, -7.05078125, -6.722412109375, -6.39404296875, -6.065673828125, -5.7373046875, -5.408935546875, -5.08056640625, -4.752197265625, -4.423828125, -4.095458984375, -3.76708984375, -3.438720703125, -3.1103515625, -2.781982421875, -2.45361328125, -2.125244140625, -1.796875, -1.468505859375, -1.14013671875, -0.811767578125, -0.4833984375, -0.155029296875, 0.17333984375, 0.501708984375, 0.830078125, 1.158447265625, 1.48681640625, 1.815185546875, 2.1435546875, 2.471923828125, 2.80029296875, 3.128662109375, 3.45703125, 3.785400390625, 4.11376953125, 4.442138671875, 4.7705078125, 5.098876953125, 5.42724609375, 5.755615234375, 6.083984375, 6.412353515625, 6.74072265625, 7.069091796875, 7.3974609375, 7.725830078125, 8.05419921875, 8.382568359375, 8.7109375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 39.0, 230.0, 435.0, 257.0, 40.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.31867218017578, -74.43461608886719, -72.5505599975586, -70.66650390625, -68.78244018554688, -66.89838409423828, -65.01432800292969, -63.130271911621094, -61.2462158203125, -59.362159729003906, -57.47809982299805, -55.59404373168945, -53.70998764038086, -51.825927734375, -49.941871643066406, -48.05781555175781, -46.17375946044922, -44.289703369140625, -42.405643463134766, -40.52158737182617, -38.63753128051758, -36.75347137451172, -34.869415283203125, -32.98535919189453, -31.101299285888672, -29.217241287231445, -27.33318519592285, -25.449127197265625, -23.56507110595703, -21.681013107299805, -19.796955108642578, -17.912899017333984, -16.02884292602539, -14.14478588104248, -12.26072883605957, -10.376670837402344, -8.49261474609375, -6.608556747436523, -4.724499702453613, -2.840442657470703, -0.956385612487793, 0.9276715517044067, 2.8117287158966064, 4.695785999298096, 6.579843044281006, 8.463900566101074, 10.347957611083984, 12.232014656066895, 14.116071701049805, 16.00012969970703, 17.884185791015625, 19.76824378967285, 21.652299880981445, 23.536357879638672, 25.420413970947266, 27.304471969604492, 29.18852996826172, 31.072587966918945, 32.95664596557617, 34.840702056884766, 36.72475814819336, 38.60881805419922, 40.49287414550781, 42.376930236816406, 44.260986328125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 14.0, 21.0, 14.0, 12.0, 20.0, 22.0, 27.0, 26.0, 26.0, 27.0, 40.0, 36.0, 27.0, 38.0, 38.0, 38.0, 43.0, 29.0, 36.0, 28.0, 33.0, 42.0, 37.0, 26.0, 30.0, 24.0, 29.0, 21.0, 26.0, 13.0, 26.0, 12.0, 15.0, 12.0, 13.0, 5.0, 12.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.702871322631836, -9.389101028442383, -9.07533073425293, -8.76155948638916, -8.447789192199707, -8.134018898010254, -7.820248603820801, -7.5064778327941895, -7.192707061767578, -6.878936767578125, -6.565165996551514, -6.2513957023620605, -5.937624931335449, -5.623854637145996, -5.310084342956543, -4.996313571929932, -4.6825432777404785, -4.368772983551025, -4.055002212524414, -3.741231918334961, -3.4274611473083496, -3.1136908531188965, -2.7999203205108643, -2.486149787902832, -2.1723792552948, -1.8586087226867676, -1.5448381900787354, -1.2310677766799927, -0.9172972440719604, -0.6035267114639282, -0.28975629806518555, 0.02401423454284668, 0.3377847671508789, 0.6515552997589111, 0.9653257727622986, 1.279096245765686, 1.5928667783737183, 1.9066373109817505, 2.220407724380493, 2.5341782569885254, 2.8479487895965576, 3.16171932220459, 3.475489854812622, 3.7892603874206543, 4.103030681610107, 4.416801452636719, 4.730571746826172, 5.044342041015625, 5.358112812042236, 5.6718831062316895, 5.985653877258301, 6.299424171447754, 6.613194942474365, 6.926965236663818, 7.24073600769043, 7.554506301879883, 7.868276596069336, 8.182046890258789, 8.495817184448242, 8.809588432312012, 9.123358726501465, 9.437129020690918, 9.750899314880371, 10.06467056274414, 10.378440856933594]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 14.0, 19.0, 13.0, 18.0, 25.0, 17.0, 31.0, 30.0, 38.0, 30.0, 34.0, 52.0, 50.0, 45.0, 44.0, 35.0, 43.0, 55.0, 46.0, 35.0, 47.0, 39.0, 35.0, 34.0, 31.0, 23.0, 17.0, 11.0, 15.0, 10.0, 13.0, 11.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.9836273193359375, -1.922332763671875, -1.8610382080078125, -1.79974365234375, -1.7384490966796875, -1.677154541015625, -1.6158599853515625, -1.5545654296875, -1.4932708740234375, -1.431976318359375, -1.3706817626953125, -1.30938720703125, -1.2480926513671875, -1.186798095703125, -1.1255035400390625, -1.064208984375, -1.0029144287109375, -0.941619873046875, -0.8803253173828125, -0.81903076171875, -0.7577362060546875, -0.696441650390625, -0.6351470947265625, -0.5738525390625, -0.5125579833984375, -0.451263427734375, -0.3899688720703125, -0.32867431640625, -0.2673797607421875, -0.206085205078125, -0.1447906494140625, -0.08349609375, -0.0222015380859375, 0.039093017578125, 0.1003875732421875, 0.16168212890625, 0.2229766845703125, 0.284271240234375, 0.3455657958984375, 0.4068603515625, 0.4681549072265625, 0.529449462890625, 0.5907440185546875, 0.65203857421875, 0.7133331298828125, 0.774627685546875, 0.8359222412109375, 0.897216796875, 0.9585113525390625, 1.019805908203125, 1.0811004638671875, 1.14239501953125, 1.2036895751953125, 1.264984130859375, 1.3262786865234375, 1.3875732421875, 1.4488677978515625, 1.510162353515625, 1.5714569091796875, 1.63275146484375, 1.6940460205078125, 1.755340576171875, 1.8166351318359375, 1.8779296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 13.0, 16.0, 32.0, 37.0, 63.0, 78.0, 133.0, 195.0, 301.0, 501.0, 780.0, 1288.0, 2031.0, 3287.0, 5304.0, 8825.0, 14365.0, 23304.0, 36963.0, 57630.0, 87477.0, 122450.0, 150784.0, 151746.0, 126280.0, 91144.0, 60698.0, 38935.0, 24491.0, 15214.0, 9322.0, 5675.0, 3462.0, 2200.0, 1324.0, 785.0, 516.0, 319.0, 197.0, 131.0, 87.0, 66.0, 36.0, 24.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.293212890625, -0.28406524658203125, -0.2749176025390625, -0.26576995849609375, -0.256622314453125, -0.24747467041015625, -0.2383270263671875, -0.22917938232421875, -0.22003173828125, -0.21088409423828125, -0.2017364501953125, -0.19258880615234375, -0.183441162109375, -0.17429351806640625, -0.1651458740234375, -0.15599822998046875, -0.1468505859375, -0.13770294189453125, -0.1285552978515625, -0.11940765380859375, -0.110260009765625, -0.10111236572265625, -0.0919647216796875, -0.08281707763671875, -0.07366943359375, -0.06452178955078125, -0.0553741455078125, -0.04622650146484375, -0.037078857421875, -0.02793121337890625, -0.0187835693359375, -0.00963592529296875, -0.00048828125, 0.00865936279296875, 0.0178070068359375, 0.02695465087890625, 0.036102294921875, 0.04524993896484375, 0.0543975830078125, 0.06354522705078125, 0.07269287109375, 0.08184051513671875, 0.0909881591796875, 0.10013580322265625, 0.109283447265625, 0.11843109130859375, 0.1275787353515625, 0.13672637939453125, 0.1458740234375, 0.15502166748046875, 0.1641693115234375, 0.17331695556640625, 0.182464599609375, 0.19161224365234375, 0.2007598876953125, 0.20990753173828125, 0.21905517578125, 0.22820281982421875, 0.2373504638671875, 0.24649810791015625, 0.255645751953125, 0.26479339599609375, 0.2739410400390625, 0.28308868408203125, 0.292236328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 8.0, 5.0, 9.0, 11.0, 19.0, 8.0, 20.0, 25.0, 22.0, 29.0, 25.0, 32.0, 28.0, 38.0, 43.0, 48.0, 46.0, 42.0, 1066.0, 30.0, 40.0, 38.0, 46.0, 40.0, 28.0, 41.0, 33.0, 28.0, 29.0, 15.0, 26.0, 9.0, 11.0, 9.0, 13.0, 11.0, 8.0, 5.0, 5.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2763671875, -1.2359466552734375, -1.195526123046875, -1.1551055908203125, -1.11468505859375, -1.0742645263671875, -1.033843994140625, -0.9934234619140625, -0.9530029296875, -0.9125823974609375, -0.872161865234375, -0.8317413330078125, -0.79132080078125, -0.7509002685546875, -0.710479736328125, -0.6700592041015625, -0.629638671875, -0.5892181396484375, -0.548797607421875, -0.5083770751953125, -0.46795654296875, -0.4275360107421875, -0.387115478515625, -0.3466949462890625, -0.3062744140625, -0.2658538818359375, -0.225433349609375, -0.1850128173828125, -0.14459228515625, -0.1041717529296875, -0.063751220703125, -0.0233306884765625, 0.01708984375, 0.0575103759765625, 0.097930908203125, 0.1383514404296875, 0.17877197265625, 0.2191925048828125, 0.259613037109375, 0.3000335693359375, 0.3404541015625, 0.3808746337890625, 0.421295166015625, 0.4617156982421875, 0.50213623046875, 0.5425567626953125, 0.582977294921875, 0.6233978271484375, 0.663818359375, 0.7042388916015625, 0.744659423828125, 0.7850799560546875, 0.82550048828125, 0.8659210205078125, 0.906341552734375, 0.9467620849609375, 0.9871826171875, 1.0276031494140625, 1.068023681640625, 1.1084442138671875, 1.14886474609375, 1.1892852783203125, 1.229705810546875, 1.2701263427734375, 1.310546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 17.0, 8.0, 13.0, 26.0, 43.0, 63.0, 121.0, 189.0, 291.0, 541.0, 914.0, 1548.0, 2754.0, 4841.0, 8723.0, 15564.0, 32896.0, 207312.0, 1693730.0, 75538.0, 23621.0, 12585.0, 6692.0, 3908.0, 2218.0, 1249.0, 680.0, 431.0, 249.0, 134.0, 91.0, 50.0, 35.0, 26.0, 12.0, 13.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.77978515625, -0.7599449157714844, -0.7401046752929688, -0.7202644348144531, -0.7004241943359375, -0.6805839538574219, -0.6607437133789062, -0.6409034729003906, -0.621063232421875, -0.6012229919433594, -0.5813827514648438, -0.5615425109863281, -0.5417022705078125, -0.5218620300292969, -0.5020217895507812, -0.4821815490722656, -0.46234130859375, -0.4425010681152344, -0.42266082763671875, -0.4028205871582031, -0.3829803466796875, -0.3631401062011719, -0.34329986572265625, -0.3234596252441406, -0.303619384765625, -0.2837791442871094, -0.26393890380859375, -0.24409866333007812, -0.2242584228515625, -0.20441818237304688, -0.18457794189453125, -0.16473770141601562, -0.1448974609375, -0.12505722045898438, -0.10521697998046875, -0.08537673950195312, -0.0655364990234375, -0.045696258544921875, -0.02585601806640625, -0.006015777587890625, 0.013824462890625, 0.033664703369140625, 0.05350494384765625, 0.07334518432617188, 0.0931854248046875, 0.11302566528320312, 0.13286590576171875, 0.15270614624023438, 0.17254638671875, 0.19238662719726562, 0.21222686767578125, 0.23206710815429688, 0.2519073486328125, 0.2717475891113281, 0.29158782958984375, 0.3114280700683594, 0.331268310546875, 0.3511085510253906, 0.37094879150390625, 0.3907890319824219, 0.4106292724609375, 0.4304695129394531, 0.45030975341796875, 0.4701499938964844, 0.489990234375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 15.0, 15.0, 18.0, 18.0, 26.0, 36.0, 38.0, 53.0, 72.0, 62.0, 89.0, 74.0, 78.0, 82.0, 61.0, 40.0, 55.0, 29.0, 24.0, 19.0, 20.0, 16.0, 9.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050048828125, -0.04844999313354492, -0.046851158142089844, -0.045252323150634766, -0.04365348815917969, -0.04205465316772461, -0.04045581817626953, -0.03885698318481445, -0.037258148193359375, -0.0356593132019043, -0.03406047821044922, -0.03246164321899414, -0.030862808227539062, -0.029263973236083984, -0.027665138244628906, -0.026066303253173828, -0.02446746826171875, -0.022868633270263672, -0.021269798278808594, -0.019670963287353516, -0.018072128295898438, -0.01647329330444336, -0.014874458312988281, -0.013275623321533203, -0.011676788330078125, -0.010077953338623047, -0.008479118347167969, -0.006880283355712891, -0.0052814483642578125, -0.0036826133728027344, -0.0020837783813476562, -0.0004849433898925781, 0.0011138916015625, 0.002712726593017578, 0.004311561584472656, 0.005910396575927734, 0.0075092315673828125, 0.00910806655883789, 0.010706901550292969, 0.012305736541748047, 0.013904571533203125, 0.015503406524658203, 0.01710224151611328, 0.01870107650756836, 0.020299911499023438, 0.021898746490478516, 0.023497581481933594, 0.025096416473388672, 0.02669525146484375, 0.028294086456298828, 0.029892921447753906, 0.031491756439208984, 0.03309059143066406, 0.03468942642211914, 0.03628826141357422, 0.0378870964050293, 0.039485931396484375, 0.04108476638793945, 0.04268360137939453, 0.04428243637084961, 0.04588127136230469, 0.047480106353759766, 0.049078941345214844, 0.05067777633666992, 0.052276611328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 3.0, 7.0, 12.0, 11.0, 21.0, 28.0, 38.0, 41.0, 64.0, 110.0, 159.0, 317.0, 1799.0, 585239.0, 458295.0, 1549.0, 325.0, 183.0, 91.0, 65.0, 34.0, 36.0, 22.0, 29.0, 14.0, 14.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.1123046875, -1.078582763671875, -1.04486083984375, -1.011138916015625, -0.9774169921875, -0.943695068359375, -0.90997314453125, -0.876251220703125, -0.842529296875, -0.808807373046875, -0.77508544921875, -0.741363525390625, -0.7076416015625, -0.673919677734375, -0.64019775390625, -0.606475830078125, -0.57275390625, -0.539031982421875, -0.50531005859375, -0.471588134765625, -0.4378662109375, -0.404144287109375, -0.37042236328125, -0.336700439453125, -0.302978515625, -0.269256591796875, -0.23553466796875, -0.201812744140625, -0.1680908203125, -0.134368896484375, -0.10064697265625, -0.066925048828125, -0.033203125, 0.000518798828125, 0.03424072265625, 0.067962646484375, 0.1016845703125, 0.135406494140625, 0.16912841796875, 0.202850341796875, 0.236572265625, 0.270294189453125, 0.30401611328125, 0.337738037109375, 0.3714599609375, 0.405181884765625, 0.43890380859375, 0.472625732421875, 0.50634765625, 0.540069580078125, 0.57379150390625, 0.607513427734375, 0.6412353515625, 0.674957275390625, 0.70867919921875, 0.742401123046875, 0.776123046875, 0.809844970703125, 0.84356689453125, 0.877288818359375, 0.9110107421875, 0.944732666015625, 0.97845458984375, 1.012176513671875, 1.0458984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 28.0, 172.0, 457.0, 269.0, 62.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820741593837738, -0.17327998578548431, -0.16448581218719482, -0.15569162368774414, -0.14689745008945465, -0.13810327649116516, -0.12930908799171448, -0.12051491439342499, -0.1117207407951355, -0.10292656719684601, -0.09413238614797592, -0.08533820509910583, -0.07654403150081635, -0.06774985790252686, -0.05895567685365677, -0.05016149953007698, -0.04136732220649719, -0.032573144882917404, -0.023778967559337616, -0.014984790235757828, -0.0061906129121780396, 0.0026035644114017487, 0.011397741734981537, 0.020191919058561325, 0.028986096382141113, 0.0377802737057209, 0.04657445102930069, 0.05536862835288048, 0.06416280567646027, 0.07295697927474976, 0.08175116032361984, 0.09054534137248993, 0.09933948516845703, 0.10813365876674652, 0.11692783981561661, 0.1257220208644867, 0.13451619446277618, 0.14331036806106567, 0.15210455656051636, 0.16089873015880585, 0.16969290375709534, 0.17848707735538483, 0.18728125095367432, 0.196075439453125, 0.2048696130514145, 0.21366378664970398, 0.22245797514915466, 0.23125214874744415, 0.24004632234573364, 0.24884049594402313, 0.2576346695423126, 0.2664288580417633, 0.2752230167388916, 0.2840172052383423, 0.29281139373779297, 0.30160555243492126, 0.31039974093437195, 0.31919392943382263, 0.3279880881309509, 0.3367822766304016, 0.3455764651298523, 0.3543706238269806, 0.3631648123264313, 0.37195897102355957, 0.38075315952301025]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 8.0, 10.0, 14.0, 12.0, 18.0, 38.0, 35.0, 36.0, 32.0, 35.0, 54.0, 50.0, 47.0, 54.0, 62.0, 55.0, 52.0, 52.0, 44.0, 41.0, 44.0, 38.0, 29.0, 36.0, 16.0, 20.0, 12.0, 15.0, 6.0, 8.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06160688400268555, -0.059279914945364, -0.05695294588804245, -0.0546259768307209, -0.05229900777339935, -0.049972038716077805, -0.047645069658756256, -0.04531810060143471, -0.04299113154411316, -0.04066416248679161, -0.03833719342947006, -0.036010224372148514, -0.033683255314826965, -0.03135628625750542, -0.02902931720018387, -0.02670234814286232, -0.02437537908554077, -0.022048410028219223, -0.019721440970897675, -0.017394471913576126, -0.015067502856254578, -0.01274053379893303, -0.01041356474161148, -0.008086595684289932, -0.005759626626968384, -0.0034326575696468353, -0.0011056885123252869, 0.0012212805449962616, 0.00354824960231781, 0.0058752186596393585, 0.008202187716960907, 0.010529156774282455, 0.012856125831604004, 0.015183094888925552, 0.0175100639462471, 0.01983703300356865, 0.022164002060890198, 0.024490971118211746, 0.026817940175533295, 0.029144909232854843, 0.03147187829017639, 0.03379884734749794, 0.03612581640481949, 0.03845278546214104, 0.040779754519462585, 0.043106723576784134, 0.04543369263410568, 0.04776066169142723, 0.05008763074874878, 0.05241459980607033, 0.054741568863391876, 0.057068537920713425, 0.05939550697803497, 0.06172247603535652, 0.06404944509267807, 0.06637641787528992, 0.06870338320732117, 0.07103034853935242, 0.07335732132196426, 0.07568429410457611, 0.07801125943660736, 0.08033822476863861, 0.08266519755125046, 0.0849921703338623, 0.08731913566589355]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 9.0, 6.0, 13.0, 22.0, 21.0, 17.0, 28.0, 29.0, 37.0, 37.0, 42.0, 46.0, 42.0, 43.0, 43.0, 47.0, 52.0, 45.0, 56.0, 43.0, 38.0, 32.0, 31.0, 40.0, 22.0, 26.0, 30.0, 15.0, 21.0, 14.0, 10.0, 11.0, 12.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.20703125, -2.144195556640625, -2.08135986328125, -2.018524169921875, -1.9556884765625, -1.892852783203125, -1.83001708984375, -1.767181396484375, -1.704345703125, -1.641510009765625, -1.57867431640625, -1.515838623046875, -1.4530029296875, -1.390167236328125, -1.32733154296875, -1.264495849609375, -1.20166015625, -1.138824462890625, -1.07598876953125, -1.013153076171875, -0.9503173828125, -0.887481689453125, -0.82464599609375, -0.761810302734375, -0.698974609375, -0.636138916015625, -0.57330322265625, -0.510467529296875, -0.4476318359375, -0.384796142578125, -0.32196044921875, -0.259124755859375, -0.1962890625, -0.133453369140625, -0.07061767578125, -0.007781982421875, 0.0550537109375, 0.117889404296875, 0.18072509765625, 0.243560791015625, 0.306396484375, 0.369232177734375, 0.43206787109375, 0.494903564453125, 0.5577392578125, 0.620574951171875, 0.68341064453125, 0.746246337890625, 0.80908203125, 0.871917724609375, 0.93475341796875, 0.997589111328125, 1.0604248046875, 1.123260498046875, 1.18609619140625, 1.248931884765625, 1.311767578125, 1.374603271484375, 1.43743896484375, 1.500274658203125, 1.5631103515625, 1.625946044921875, 1.68878173828125, 1.751617431640625, 1.814453125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 13.0, 9.0, 12.0, 13.0, 23.0, 41.0, 59.0, 67.0, 111.0, 134.0, 203.0, 321.0, 458.0, 736.0, 1074.0, 1819.0, 2986.0, 5339.0, 10248.0, 21837.0, 55800.0, 178040.0, 470221.0, 192442.0, 59033.0, 23084.0, 10633.0, 5455.0, 3035.0, 1865.0, 1172.0, 775.0, 486.0, 317.0, 215.0, 115.0, 107.0, 77.0, 61.0, 37.0, 27.0, 19.0, 9.0, 14.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.55078125, -2.46722412109375, -2.3836669921875, -2.30010986328125, -2.216552734375, -2.13299560546875, -2.0494384765625, -1.96588134765625, -1.88232421875, -1.79876708984375, -1.7152099609375, -1.63165283203125, -1.548095703125, -1.46453857421875, -1.3809814453125, -1.29742431640625, -1.2138671875, -1.13031005859375, -1.0467529296875, -0.96319580078125, -0.879638671875, -0.79608154296875, -0.7125244140625, -0.62896728515625, -0.54541015625, -0.46185302734375, -0.3782958984375, -0.29473876953125, -0.211181640625, -0.12762451171875, -0.0440673828125, 0.03948974609375, 0.123046875, 0.20660400390625, 0.2901611328125, 0.37371826171875, 0.457275390625, 0.54083251953125, 0.6243896484375, 0.70794677734375, 0.79150390625, 0.87506103515625, 0.9586181640625, 1.04217529296875, 1.125732421875, 1.20928955078125, 1.2928466796875, 1.37640380859375, 1.4599609375, 1.54351806640625, 1.6270751953125, 1.71063232421875, 1.794189453125, 1.87774658203125, 1.9613037109375, 2.04486083984375, 2.12841796875, 2.21197509765625, 2.2955322265625, 2.37908935546875, 2.462646484375, 2.54620361328125, 2.6297607421875, 2.71331787109375, 2.796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 11.0, 7.0, 4.0, 9.0, 13.0, 11.0, 18.0, 28.0, 30.0, 28.0, 30.0, 27.0, 34.0, 48.0, 44.0, 59.0, 110.0, 290.0, 1456.0, 257.0, 106.0, 53.0, 42.0, 50.0, 29.0, 42.0, 37.0, 28.0, 21.0, 17.0, 18.0, 14.0, 12.0, 14.0, 11.0, 9.0, 6.0, 4.0, 7.0, 1.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.1014404296875, -5.913818359375, -5.7261962890625, -5.53857421875, -5.3509521484375, -5.163330078125, -4.9757080078125, -4.7880859375, -4.6004638671875, -4.412841796875, -4.2252197265625, -4.03759765625, -3.8499755859375, -3.662353515625, -3.4747314453125, -3.287109375, -3.0994873046875, -2.911865234375, -2.7242431640625, -2.53662109375, -2.3489990234375, -2.161376953125, -1.9737548828125, -1.7861328125, -1.5985107421875, -1.410888671875, -1.2232666015625, -1.03564453125, -0.8480224609375, -0.660400390625, -0.4727783203125, -0.28515625, -0.0975341796875, 0.090087890625, 0.2777099609375, 0.46533203125, 0.6529541015625, 0.840576171875, 1.0281982421875, 1.2158203125, 1.4034423828125, 1.591064453125, 1.7786865234375, 1.96630859375, 2.1539306640625, 2.341552734375, 2.5291748046875, 2.716796875, 2.9044189453125, 3.092041015625, 3.2796630859375, 3.46728515625, 3.6549072265625, 3.842529296875, 4.0301513671875, 4.2177734375, 4.4053955078125, 4.593017578125, 4.7806396484375, 4.96826171875, 5.1558837890625, 5.343505859375, 5.5311279296875, 5.71875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 9.0, 9.0, 6.0, 5.0, 19.0, 10.0, 16.0, 18.0, 20.0, 34.0, 48.0, 37.0, 55.0, 96.0, 118.0, 178.0, 361.0, 759.0, 2081.0, 6754.0, 30124.0, 536881.0, 2478528.0, 71945.0, 11887.0, 3251.0, 1142.0, 499.0, 250.0, 125.0, 79.0, 81.0, 70.0, 42.0, 34.0, 20.0, 15.0, 15.0, 12.0, 17.0, 10.0, 11.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.15728759765625, -6.9122314453125, -6.66717529296875, -6.422119140625, -6.17706298828125, -5.9320068359375, -5.68695068359375, -5.44189453125, -5.19683837890625, -4.9517822265625, -4.70672607421875, -4.461669921875, -4.21661376953125, -3.9715576171875, -3.72650146484375, -3.4814453125, -3.23638916015625, -2.9913330078125, -2.74627685546875, -2.501220703125, -2.25616455078125, -2.0111083984375, -1.76605224609375, -1.52099609375, -1.27593994140625, -1.0308837890625, -0.78582763671875, -0.540771484375, -0.29571533203125, -0.0506591796875, 0.19439697265625, 0.439453125, 0.68450927734375, 0.9295654296875, 1.17462158203125, 1.419677734375, 1.66473388671875, 1.9097900390625, 2.15484619140625, 2.39990234375, 2.64495849609375, 2.8900146484375, 3.13507080078125, 3.380126953125, 3.62518310546875, 3.8702392578125, 4.11529541015625, 4.3603515625, 4.60540771484375, 4.8504638671875, 5.09552001953125, 5.340576171875, 5.58563232421875, 5.8306884765625, 6.07574462890625, 6.32080078125, 6.56585693359375, 6.8109130859375, 7.05596923828125, 7.301025390625, 7.54608154296875, 7.7911376953125, 8.03619384765625, 8.28125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 43.0, 496.0, 451.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.41239166259766, -105.45640563964844, -103.50041961669922, -101.54444122314453, -99.58845520019531, -97.6324691772461, -95.67648315429688, -93.72050476074219, -91.76451873779297, -89.80853271484375, -87.85254669189453, -85.89656829833984, -83.94058227539062, -81.9845962524414, -80.02861022949219, -78.0726318359375, -76.11663818359375, -74.16065216064453, -72.20466613769531, -70.24868774414062, -68.2927017211914, -66.33671569824219, -64.38072967529297, -62.424747467041016, -60.46876525878906, -58.512779235839844, -56.55679702758789, -54.60081100463867, -52.64482879638672, -50.6888427734375, -48.73285675048828, -46.77687454223633, -44.820892333984375, -42.864906311035156, -40.9089241027832, -38.952938079833984, -36.99695587158203, -35.04096984863281, -33.084983825683594, -31.12900161743164, -29.173019409179688, -27.2170352935791, -25.261051177978516, -23.305065155029297, -21.349082946777344, -19.393096923828125, -17.43711280822754, -15.481128692626953, -13.525144577026367, -11.569160461425781, -9.613176345825195, -7.657191276550293, -5.701207160949707, -3.745223045349121, -1.7892379760742188, 0.1667461395263672, 2.122730255126953, 4.078714370727539, 6.034698963165283, 7.990683555603027, 9.946667671203613, 11.9026517868042, 13.858636856079102, 15.814620971679688, 17.770605087280273]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 11.0, 16.0, 13.0, 15.0, 16.0, 16.0, 23.0, 17.0, 25.0, 31.0, 35.0, 25.0, 34.0, 45.0, 43.0, 44.0, 38.0, 39.0, 46.0, 44.0, 51.0, 44.0, 49.0, 36.0, 32.0, 28.0, 23.0, 30.0, 24.0, 24.0, 16.0, 13.0, 5.0, 13.0, 8.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.599956512451172, -15.074480056762695, -14.549003601074219, -14.023526191711426, -13.49804973602295, -12.972573280334473, -12.44709587097168, -11.921619415283203, -11.396142959594727, -10.87066650390625, -10.345190048217773, -9.81971263885498, -9.294236183166504, -8.768759727478027, -8.243282318115234, -7.717805862426758, -7.192329406738281, -6.666852951049805, -6.14137601852417, -5.615899085998535, -5.090422630310059, -4.564946174621582, -4.039469242095947, -3.5139925479888916, -2.988515853881836, -2.4630391597747803, -1.9375624656677246, -1.412085771560669, -0.8866090774536133, -0.3611323833465576, 0.16434431076049805, 0.6898210048675537, 1.2152976989746094, 1.740774393081665, 2.2662510871887207, 2.7917277812957764, 3.317204475402832, 3.8426811695098877, 4.368157863616943, 4.893634796142578, 5.419111251831055, 5.944587707519531, 6.470064640045166, 6.995541572570801, 7.521018028259277, 8.046494483947754, 8.571971893310547, 9.097448348999023, 9.6229248046875, 10.148401260375977, 10.673877716064453, 11.199355125427246, 11.724831581115723, 12.2503080368042, 12.775785446166992, 13.301261901855469, 13.826738357543945, 14.352214813232422, 14.877691268920898, 15.403168678283691, 15.928645133972168, 16.45412254333496, 16.979598999023438, 17.505075454711914, 18.03055191040039]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 11.0, 9.0, 14.0, 17.0, 16.0, 29.0, 27.0, 38.0, 42.0, 40.0, 52.0, 41.0, 36.0, 60.0, 54.0, 48.0, 46.0, 46.0, 36.0, 54.0, 49.0, 31.0, 37.0, 31.0, 23.0, 32.0, 20.0, 13.0, 16.0, 13.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.4537353515625, -2.380126953125, -2.3065185546875, -2.23291015625, -2.1593017578125, -2.085693359375, -2.0120849609375, -1.9384765625, -1.8648681640625, -1.791259765625, -1.7176513671875, -1.64404296875, -1.5704345703125, -1.496826171875, -1.4232177734375, -1.349609375, -1.2760009765625, -1.202392578125, -1.1287841796875, -1.05517578125, -0.9815673828125, -0.907958984375, -0.8343505859375, -0.7607421875, -0.6871337890625, -0.613525390625, -0.5399169921875, -0.46630859375, -0.3927001953125, -0.319091796875, -0.2454833984375, -0.171875, -0.0982666015625, -0.024658203125, 0.0489501953125, 0.12255859375, 0.1961669921875, 0.269775390625, 0.3433837890625, 0.4169921875, 0.4906005859375, 0.564208984375, 0.6378173828125, 0.71142578125, 0.7850341796875, 0.858642578125, 0.9322509765625, 1.005859375, 1.0794677734375, 1.153076171875, 1.2266845703125, 1.30029296875, 1.3739013671875, 1.447509765625, 1.5211181640625, 1.5947265625, 1.6683349609375, 1.741943359375, 1.8155517578125, 1.88916015625, 1.9627685546875, 2.036376953125, 2.1099853515625, 2.18359375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 21.0, 23.0, 31.0, 50.0, 86.0, 116.0, 174.0, 316.0, 578.0, 1001.0, 1924.0, 3775.0, 8596.0, 23391.0, 97549.0, 795864.0, 2596692.0, 554987.0, 74760.0, 20025.0, 7379.0, 3304.0, 1622.0, 877.0, 489.0, 258.0, 174.0, 70.0, 60.0, 34.0, 18.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2109375, -4.092041015625, -3.97314453125, -3.854248046875, -3.7353515625, -3.616455078125, -3.49755859375, -3.378662109375, -3.259765625, -3.140869140625, -3.02197265625, -2.903076171875, -2.7841796875, -2.665283203125, -2.54638671875, -2.427490234375, -2.30859375, -2.189697265625, -2.07080078125, -1.951904296875, -1.8330078125, -1.714111328125, -1.59521484375, -1.476318359375, -1.357421875, -1.238525390625, -1.11962890625, -1.000732421875, -0.8818359375, -0.762939453125, -0.64404296875, -0.525146484375, -0.40625, -0.287353515625, -0.16845703125, -0.049560546875, 0.0693359375, 0.188232421875, 0.30712890625, 0.426025390625, 0.544921875, 0.663818359375, 0.78271484375, 0.901611328125, 1.0205078125, 1.139404296875, 1.25830078125, 1.377197265625, 1.49609375, 1.614990234375, 1.73388671875, 1.852783203125, 1.9716796875, 2.090576171875, 2.20947265625, 2.328369140625, 2.447265625, 2.566162109375, 2.68505859375, 2.803955078125, 2.9228515625, 3.041748046875, 3.16064453125, 3.279541015625, 3.3984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 15.0, 21.0, 23.0, 33.0, 46.0, 54.0, 89.0, 133.0, 222.0, 323.0, 434.0, 615.0, 568.0, 471.0, 353.0, 198.0, 128.0, 86.0, 51.0, 53.0, 37.0, 33.0, 16.0, 17.0, 6.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.28125, -3.17218017578125, -3.0631103515625, -2.95404052734375, -2.844970703125, -2.73590087890625, -2.6268310546875, -2.51776123046875, -2.40869140625, -2.29962158203125, -2.1905517578125, -2.08148193359375, -1.972412109375, -1.86334228515625, -1.7542724609375, -1.64520263671875, -1.5361328125, -1.42706298828125, -1.3179931640625, -1.20892333984375, -1.099853515625, -0.99078369140625, -0.8817138671875, -0.77264404296875, -0.66357421875, -0.55450439453125, -0.4454345703125, -0.33636474609375, -0.227294921875, -0.11822509765625, -0.0091552734375, 0.09991455078125, 0.208984375, 0.31805419921875, 0.4271240234375, 0.53619384765625, 0.645263671875, 0.75433349609375, 0.8634033203125, 0.97247314453125, 1.08154296875, 1.19061279296875, 1.2996826171875, 1.40875244140625, 1.517822265625, 1.62689208984375, 1.7359619140625, 1.84503173828125, 1.9541015625, 2.06317138671875, 2.1722412109375, 2.28131103515625, 2.390380859375, 2.49945068359375, 2.6085205078125, 2.71759033203125, 2.82666015625, 2.93572998046875, 3.0447998046875, 3.15386962890625, 3.262939453125, 3.37200927734375, 3.4810791015625, 3.59014892578125, 3.69921875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 13.0, 10.0, 26.0, 32.0, 59.0, 73.0, 94.0, 163.0, 357.0, 686.0, 2264.0, 11299.0, 105897.0, 3402258.0, 631717.0, 32159.0, 4775.0, 1240.0, 477.0, 234.0, 135.0, 97.0, 64.0, 42.0, 32.0, 17.0, 8.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.6885986328125, -9.392822265625, -9.0970458984375, -8.80126953125, -8.5054931640625, -8.209716796875, -7.9139404296875, -7.6181640625, -7.3223876953125, -7.026611328125, -6.7308349609375, -6.43505859375, -6.1392822265625, -5.843505859375, -5.5477294921875, -5.251953125, -4.9561767578125, -4.660400390625, -4.3646240234375, -4.06884765625, -3.7730712890625, -3.477294921875, -3.1815185546875, -2.8857421875, -2.5899658203125, -2.294189453125, -1.9984130859375, -1.70263671875, -1.4068603515625, -1.111083984375, -0.8153076171875, -0.51953125, -0.2237548828125, 0.072021484375, 0.3677978515625, 0.66357421875, 0.9593505859375, 1.255126953125, 1.5509033203125, 1.8466796875, 2.1424560546875, 2.438232421875, 2.7340087890625, 3.02978515625, 3.3255615234375, 3.621337890625, 3.9171142578125, 4.212890625, 4.5086669921875, 4.804443359375, 5.1002197265625, 5.39599609375, 5.6917724609375, 5.987548828125, 6.2833251953125, 6.5791015625, 6.8748779296875, 7.170654296875, 7.4664306640625, 7.76220703125, 8.0579833984375, 8.353759765625, 8.6495361328125, 8.9453125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 57.0, 139.0, 348.0, 290.0, 136.0, 24.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.767168045043945, -22.44314956665039, -21.11913299560547, -19.795114517211914, -18.471097946166992, -17.147079467773438, -15.8230619430542, -14.499044418334961, -13.175026893615723, -11.851009368896484, -10.526991844177246, -9.202974319458008, -7.878956317901611, -6.554938793182373, -5.230920791625977, -3.9069032669067383, -2.5828857421875, -1.2588680982589722, 0.06514954566955566, 1.389167308807373, 2.7131848335266113, 4.03720235824585, 5.361220359802246, 6.685237884521484, 8.009255409240723, 9.333272933959961, 10.6572904586792, 11.981307983398438, 13.305326461791992, 14.629343032836914, 15.953361511230469, 17.27737808227539, 18.601398468017578, 19.925416946411133, 21.249433517456055, 22.57345199584961, 23.89746856689453, 25.221487045288086, 26.54550552368164, 27.869522094726562, 29.193538665771484, 30.51755714416504, 31.84157371520996, 33.165592193603516, 34.48960876464844, 35.81362533569336, 37.13764572143555, 38.46166229248047, 39.785682678222656, 41.10969924926758, 42.433719635009766, 43.75773620605469, 45.08175277709961, 46.40576934814453, 47.72978973388672, 49.05380630493164, 50.37782287597656, 51.701839447021484, 53.02585983276367, 54.349876403808594, 55.673892974853516, 56.99790954589844, 58.321929931640625, 59.64594650268555, 60.96996307373047]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 10.0, 8.0, 8.0, 4.0, 12.0, 20.0, 13.0, 22.0, 24.0, 20.0, 25.0, 27.0, 21.0, 26.0, 32.0, 18.0, 37.0, 29.0, 38.0, 46.0, 41.0, 31.0, 33.0, 39.0, 21.0, 31.0, 27.0, 26.0, 36.0, 35.0, 21.0, 27.0, 26.0, 28.0, 23.0, 20.0, 12.0, 13.0, 14.0, 10.0, 8.0, 7.0, 5.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-10.219720840454102, -9.927141189575195, -9.634560585021973, -9.341980934143066, -9.04940128326416, -8.756820678710938, -8.464241027832031, -8.171661376953125, -7.8790812492370605, -7.586501121520996, -7.29392147064209, -7.001341342926025, -6.708761215209961, -6.416181564331055, -6.12360143661499, -5.831021308898926, -5.5384416580200195, -5.245861530303955, -4.953281879425049, -4.660701751708984, -4.368122100830078, -4.075541973114014, -3.782961845397949, -3.490381956100464, -3.1978020668029785, -2.905222177505493, -2.612642288208008, -2.3200621604919434, -2.027482271194458, -1.7349023818969727, -1.4423223733901978, -1.1497423648834229, -0.8571615219116211, -0.564581573009491, -0.27200162410736084, 0.020578324794769287, 0.3131582736968994, 0.6057381629943848, 0.8983181715011597, 1.1908981800079346, 1.48347806930542, 1.7760579586029053, 2.0686378479003906, 2.361217975616455, 2.6537978649139404, 2.946377754211426, 3.2389578819274902, 3.5315377712249756, 3.824117660522461, 4.116697788238525, 4.409277439117432, 4.701857566833496, 4.994437217712402, 5.287017345428467, 5.579597473144531, 5.8721771240234375, 6.164757251739502, 6.457337379455566, 6.749917030334473, 7.042497158050537, 7.335077285766602, 7.627656936645508, 7.920237064361572, 8.212817192077637, 8.505396842956543]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 2.0, 11.0, 12.0, 14.0, 23.0, 25.0, 29.0, 29.0, 44.0, 43.0, 44.0, 49.0, 43.0, 48.0, 59.0, 51.0, 54.0, 43.0, 35.0, 43.0, 43.0, 37.0, 29.0, 28.0, 23.0, 23.0, 15.0, 20.0, 13.0, 13.0, 8.0, 11.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.072784423828125, -2.00494384765625, -1.937103271484375, -1.8692626953125, -1.801422119140625, -1.73358154296875, -1.665740966796875, -1.597900390625, -1.530059814453125, -1.46221923828125, -1.394378662109375, -1.3265380859375, -1.258697509765625, -1.19085693359375, -1.123016357421875, -1.05517578125, -0.987335205078125, -0.91949462890625, -0.851654052734375, -0.7838134765625, -0.715972900390625, -0.64813232421875, -0.580291748046875, -0.512451171875, -0.444610595703125, -0.37677001953125, -0.308929443359375, -0.2410888671875, -0.173248291015625, -0.10540771484375, -0.037567138671875, 0.0302734375, 0.098114013671875, 0.16595458984375, 0.233795166015625, 0.3016357421875, 0.369476318359375, 0.43731689453125, 0.505157470703125, 0.572998046875, 0.640838623046875, 0.70867919921875, 0.776519775390625, 0.8443603515625, 0.912200927734375, 0.98004150390625, 1.047882080078125, 1.11572265625, 1.183563232421875, 1.25140380859375, 1.319244384765625, 1.3870849609375, 1.454925537109375, 1.52276611328125, 1.590606689453125, 1.658447265625, 1.726287841796875, 1.79412841796875, 1.861968994140625, 1.9298095703125, 1.997650146484375, 2.06549072265625, 2.133331298828125, 2.201171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 9.0, 4.0, 7.0, 4.0, 14.0, 21.0, 22.0, 40.0, 60.0, 79.0, 123.0, 207.0, 305.0, 463.0, 729.0, 1056.0, 1597.0, 2487.0, 3945.0, 5743.0, 8950.0, 13489.0, 20983.0, 32343.0, 49225.0, 72627.0, 103707.0, 135156.0, 148718.0, 133144.0, 102622.0, 71553.0, 48141.0, 31759.0, 20605.0, 13390.0, 8652.0, 5657.0, 3751.0, 2402.0, 1673.0, 1042.0, 677.0, 442.0, 328.0, 204.0, 131.0, 92.0, 70.0, 42.0, 16.0, 22.0, 14.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.25927734375, -0.25077056884765625, -0.2422637939453125, -0.23375701904296875, -0.225250244140625, -0.21674346923828125, -0.2082366943359375, -0.19972991943359375, -0.19122314453125, -0.18271636962890625, -0.1742095947265625, -0.16570281982421875, -0.157196044921875, -0.14868927001953125, -0.1401824951171875, -0.13167572021484375, -0.1231689453125, -0.11466217041015625, -0.1061553955078125, -0.09764862060546875, -0.089141845703125, -0.08063507080078125, -0.0721282958984375, -0.06362152099609375, -0.05511474609375, -0.04660797119140625, -0.0381011962890625, -0.02959442138671875, -0.021087646484375, -0.01258087158203125, -0.0040740966796875, 0.00443267822265625, 0.012939453125, 0.02144622802734375, 0.0299530029296875, 0.03845977783203125, 0.046966552734375, 0.05547332763671875, 0.0639801025390625, 0.07248687744140625, 0.08099365234375, 0.08950042724609375, 0.0980072021484375, 0.10651397705078125, 0.115020751953125, 0.12352752685546875, 0.1320343017578125, 0.14054107666015625, 0.1490478515625, 0.15755462646484375, 0.1660614013671875, 0.17456817626953125, 0.183074951171875, 0.19158172607421875, 0.2000885009765625, 0.20859527587890625, 0.21710205078125, 0.22560882568359375, 0.2341156005859375, 0.24262237548828125, 0.251129150390625, 0.25963592529296875, 0.2681427001953125, 0.27664947509765625, 0.28515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 4.0, 6.0, 13.0, 14.0, 13.0, 18.0, 27.0, 24.0, 24.0, 25.0, 25.0, 39.0, 43.0, 43.0, 35.0, 37.0, 41.0, 45.0, 1068.0, 51.0, 42.0, 43.0, 44.0, 37.0, 32.0, 41.0, 34.0, 25.0, 19.0, 24.0, 13.0, 11.0, 12.0, 14.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4580078125, -1.41290283203125, -1.3677978515625, -1.32269287109375, -1.277587890625, -1.23248291015625, -1.1873779296875, -1.14227294921875, -1.09716796875, -1.05206298828125, -1.0069580078125, -0.96185302734375, -0.916748046875, -0.87164306640625, -0.8265380859375, -0.78143310546875, -0.736328125, -0.69122314453125, -0.6461181640625, -0.60101318359375, -0.555908203125, -0.51080322265625, -0.4656982421875, -0.42059326171875, -0.37548828125, -0.33038330078125, -0.2852783203125, -0.24017333984375, -0.195068359375, -0.14996337890625, -0.1048583984375, -0.05975341796875, -0.0146484375, 0.03045654296875, 0.0755615234375, 0.12066650390625, 0.165771484375, 0.21087646484375, 0.2559814453125, 0.30108642578125, 0.34619140625, 0.39129638671875, 0.4364013671875, 0.48150634765625, 0.526611328125, 0.57171630859375, 0.6168212890625, 0.66192626953125, 0.70703125, 0.75213623046875, 0.7972412109375, 0.84234619140625, 0.887451171875, 0.93255615234375, 0.9776611328125, 1.02276611328125, 1.06787109375, 1.11297607421875, 1.1580810546875, 1.20318603515625, 1.248291015625, 1.29339599609375, 1.3385009765625, 1.38360595703125, 1.4287109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 8.0, 11.0, 12.0, 17.0, 26.0, 39.0, 54.0, 71.0, 136.0, 174.0, 285.0, 440.0, 659.0, 1080.0, 1672.0, 2634.0, 4301.0, 6575.0, 10419.0, 17671.0, 37556.0, 252411.0, 1616510.0, 83028.0, 24990.0, 13523.0, 8366.0, 5249.0, 3285.0, 2108.0, 1330.0, 893.0, 559.0, 354.0, 210.0, 166.0, 104.0, 70.0, 38.0, 37.0, 23.0, 12.0, 13.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5859375, -0.5697822570800781, -0.5536270141601562, -0.5374717712402344, -0.5213165283203125, -0.5051612854003906, -0.48900604248046875, -0.4728507995605469, -0.456695556640625, -0.4405403137207031, -0.42438507080078125, -0.4082298278808594, -0.3920745849609375, -0.3759193420410156, -0.35976409912109375, -0.3436088562011719, -0.32745361328125, -0.3112983703613281, -0.29514312744140625, -0.2789878845214844, -0.2628326416015625, -0.24667739868164062, -0.23052215576171875, -0.21436691284179688, -0.198211669921875, -0.18205642700195312, -0.16590118408203125, -0.14974594116210938, -0.1335906982421875, -0.11743545532226562, -0.10128021240234375, -0.08512496948242188, -0.0689697265625, -0.052814483642578125, -0.03665924072265625, -0.020503997802734375, -0.0043487548828125, 0.011806488037109375, 0.02796173095703125, 0.044116973876953125, 0.060272216796875, 0.07642745971679688, 0.09258270263671875, 0.10873794555664062, 0.1248931884765625, 0.14104843139648438, 0.15720367431640625, 0.17335891723632812, 0.18951416015625, 0.20566940307617188, 0.22182464599609375, 0.23797988891601562, 0.2541351318359375, 0.2702903747558594, 0.28644561767578125, 0.3026008605957031, 0.318756103515625, 0.3349113464355469, 0.35106658935546875, 0.3672218322753906, 0.3833770751953125, 0.3995323181152344, 0.41568756103515625, 0.4318428039550781, 0.447998046875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 17.0, 27.0, 26.0, 31.0, 42.0, 62.0, 60.0, 79.0, 84.0, 74.0, 84.0, 81.0, 76.0, 49.0, 48.0, 31.0, 30.0, 16.0, 18.0, 10.0, 6.0, 9.0, 7.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0546875, -0.053189754486083984, -0.05169200897216797, -0.05019426345825195, -0.04869651794433594, -0.04719877243041992, -0.045701026916503906, -0.04420328140258789, -0.042705535888671875, -0.04120779037475586, -0.039710044860839844, -0.03821229934692383, -0.03671455383300781, -0.0352168083190918, -0.03371906280517578, -0.032221317291259766, -0.03072357177734375, -0.029225826263427734, -0.02772808074951172, -0.026230335235595703, -0.024732589721679688, -0.023234844207763672, -0.021737098693847656, -0.02023935317993164, -0.018741607666015625, -0.01724386215209961, -0.015746116638183594, -0.014248371124267578, -0.012750625610351562, -0.011252880096435547, -0.009755134582519531, -0.008257389068603516, -0.0067596435546875, -0.005261898040771484, -0.0037641525268554688, -0.002266407012939453, -0.0007686614990234375, 0.0007290840148925781, 0.0022268295288085938, 0.0037245750427246094, 0.005222320556640625, 0.006720066070556641, 0.008217811584472656, 0.009715557098388672, 0.011213302612304688, 0.012711048126220703, 0.014208793640136719, 0.015706539154052734, 0.01720428466796875, 0.018702030181884766, 0.02019977569580078, 0.021697521209716797, 0.023195266723632812, 0.024693012237548828, 0.026190757751464844, 0.02768850326538086, 0.029186248779296875, 0.03068399429321289, 0.032181739807128906, 0.03367948532104492, 0.03517723083496094, 0.03667497634887695, 0.03817272186279297, 0.039670467376708984, 0.041168212890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 11.0, 10.0, 8.0, 21.0, 17.0, 40.0, 38.0, 65.0, 93.0, 190.0, 379.0, 1923.0, 994101.0, 50292.0, 698.0, 229.0, 154.0, 91.0, 43.0, 41.0, 24.0, 29.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8355026245117188, -0.8043060302734375, -0.7731094360351562, -0.741912841796875, -0.7107162475585938, -0.6795196533203125, -0.6483230590820312, -0.61712646484375, -0.5859298706054688, -0.5547332763671875, -0.5235366821289062, -0.492340087890625, -0.46114349365234375, -0.4299468994140625, -0.39875030517578125, -0.3675537109375, -0.33635711669921875, -0.3051605224609375, -0.27396392822265625, -0.242767333984375, -0.21157073974609375, -0.1803741455078125, -0.14917755126953125, -0.11798095703125, -0.08678436279296875, -0.0555877685546875, -0.02439117431640625, 0.006805419921875, 0.03800201416015625, 0.0691986083984375, 0.10039520263671875, 0.131591796875, 0.16278839111328125, 0.1939849853515625, 0.22518157958984375, 0.256378173828125, 0.28757476806640625, 0.3187713623046875, 0.34996795654296875, 0.38116455078125, 0.41236114501953125, 0.4435577392578125, 0.47475433349609375, 0.505950927734375, 0.5371475219726562, 0.5683441162109375, 0.5995407104492188, 0.6307373046875, 0.6619338989257812, 0.6931304931640625, 0.7243270874023438, 0.755523681640625, 0.7867202758789062, 0.8179168701171875, 0.8491134643554688, 0.88031005859375, 0.9115066528320312, 0.9427032470703125, 0.9738998413085938, 1.005096435546875, 1.0362930297851562, 1.0674896240234375, 1.0986862182617188, 1.1298828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 19.0, 855.0, 144.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9690470695495605, -0.9509902596473694, -0.9329334497451782, -0.9148766398429871, -0.8968198299407959, -0.8787630796432495, -0.8607062101364136, -0.8426494598388672, -0.824592649936676, -0.8065358400344849, -0.7884790301322937, -0.7704222202301025, -0.7523654103279114, -0.7343086004257202, -0.7162518501281738, -0.6981950402259827, -0.6801382303237915, -0.6620814204216003, -0.6440246105194092, -0.625967800617218, -0.6079109907150269, -0.5898542404174805, -0.5717973709106445, -0.5537406206130981, -0.5356837511062622, -0.517626941204071, -0.4995701313018799, -0.4815133213996887, -0.46345654129981995, -0.4453997313976288, -0.4273429214954376, -0.40928614139556885, -0.3912293314933777, -0.3731725215911865, -0.35511571168899536, -0.3370589017868042, -0.3190021216869354, -0.30094531178474426, -0.2828885018825531, -0.2648317217826843, -0.24677488207817078, -0.22871807217597961, -0.21066127717494965, -0.19260446727275848, -0.17454767227172852, -0.15649086236953735, -0.1384340524673462, -0.12037725746631622, -0.10232044756412506, -0.0842636451125145, -0.06620684266090393, -0.04815003275871277, -0.030093230307102203, -0.012036427855491638, 0.006020382046699524, 0.024077177047729492, 0.042133986949920654, 0.06019078940153122, 0.07824759185314178, 0.09630440175533295, 0.11436120420694351, 0.13241800665855408, 0.15047481656074524, 0.1685316115617752, 0.18658842146396637]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 0.0, 2.0, 2.0, 7.0, 8.0, 10.0, 13.0, 24.0, 22.0, 32.0, 20.0, 38.0, 42.0, 59.0, 40.0, 51.0, 46.0, 53.0, 55.0, 47.0, 56.0, 55.0, 54.0, 40.0, 39.0, 36.0, 33.0, 25.0, 21.0, 17.0, 13.0, 8.0, 16.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056599974632263184, -0.054925937205553055, -0.053251899778842926, -0.0515778586268425, -0.04990382120013237, -0.04822978377342224, -0.046555742621421814, -0.044881705194711685, -0.043207667768001556, -0.04153363034129143, -0.0398595929145813, -0.03818555176258087, -0.03651151433587074, -0.034837476909160614, -0.03316343575716019, -0.03148939833045006, -0.02981536090373993, -0.0281413234770298, -0.026467284187674522, -0.024793244898319244, -0.023119207471609116, -0.021445170044898987, -0.01977113075554371, -0.01809709146618843, -0.016423054039478302, -0.014749015681445599, -0.013074977323412895, -0.011400938965380192, -0.009726900607347488, -0.008052862249314785, -0.006378823891282082, -0.004704785533249378, -0.003030747175216675, -0.0013567088171839714, 0.000317329540848732, 0.0019913678988814354, 0.003665406256914139, 0.005339444614946842, 0.007013482972979546, 0.008687521331012249, 0.010361559689044952, 0.012035598047077656, 0.01370963640511036, 0.015383674763143063, 0.017057713121175766, 0.018731750547885895, 0.020405789837241173, 0.02207982912659645, 0.02375386655330658, 0.02542790398001671, 0.027101943269371986, 0.028775982558727264, 0.030450019985437393, 0.03212405741214752, 0.03379809856414795, 0.03547213599085808, 0.03714617341756821, 0.038820210844278336, 0.040494248270988464, 0.04216828942298889, 0.04384232684969902, 0.04551636427640915, 0.047190405428409576, 0.048864442855119705, 0.050538480281829834]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 13.0, 14.0, 12.0, 13.0, 14.0, 23.0, 32.0, 44.0, 35.0, 40.0, 45.0, 43.0, 47.0, 51.0, 56.0, 52.0, 52.0, 34.0, 47.0, 50.0, 26.0, 28.0, 33.0, 25.0, 35.0, 19.0, 19.0, 14.0, 16.0, 13.0, 6.0, 9.0, 4.0, 2.0, 10.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -1.99066162109375, -1.9246826171875, -1.85870361328125, -1.792724609375, -1.72674560546875, -1.6607666015625, -1.59478759765625, -1.52880859375, -1.46282958984375, -1.3968505859375, -1.33087158203125, -1.264892578125, -1.19891357421875, -1.1329345703125, -1.06695556640625, -1.0009765625, -0.93499755859375, -0.8690185546875, -0.80303955078125, -0.737060546875, -0.67108154296875, -0.6051025390625, -0.53912353515625, -0.47314453125, -0.40716552734375, -0.3411865234375, -0.27520751953125, -0.209228515625, -0.14324951171875, -0.0772705078125, -0.01129150390625, 0.0546875, 0.12066650390625, 0.1866455078125, 0.25262451171875, 0.318603515625, 0.38458251953125, 0.4505615234375, 0.51654052734375, 0.58251953125, 0.64849853515625, 0.7144775390625, 0.78045654296875, 0.846435546875, 0.91241455078125, 0.9783935546875, 1.04437255859375, 1.1103515625, 1.17633056640625, 1.2423095703125, 1.30828857421875, 1.374267578125, 1.44024658203125, 1.5062255859375, 1.57220458984375, 1.63818359375, 1.70416259765625, 1.7701416015625, 1.83612060546875, 1.902099609375, 1.96807861328125, 2.0340576171875, 2.10003662109375, 2.166015625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 2.0, 8.0, 10.0, 11.0, 13.0, 21.0, 23.0, 37.0, 54.0, 96.0, 138.0, 248.0, 344.0, 661.0, 1137.0, 2438.0, 4732.0, 10098.0, 23275.0, 62255.0, 379513.0, 449678.0, 67501.0, 24849.0, 10899.0, 5122.0, 2452.0, 1281.0, 655.0, 363.0, 205.0, 118.0, 88.0, 59.0, 41.0, 29.0, 23.0, 21.0, 15.0, 9.0, 8.0, 5.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.293426513671875, -3.16693115234375, -3.040435791015625, -2.9139404296875, -2.787445068359375, -2.66094970703125, -2.534454345703125, -2.407958984375, -2.281463623046875, -2.15496826171875, -2.028472900390625, -1.9019775390625, -1.775482177734375, -1.64898681640625, -1.522491455078125, -1.39599609375, -1.269500732421875, -1.14300537109375, -1.016510009765625, -0.8900146484375, -0.763519287109375, -0.63702392578125, -0.510528564453125, -0.384033203125, -0.257537841796875, -0.13104248046875, -0.004547119140625, 0.1219482421875, 0.248443603515625, 0.37493896484375, 0.501434326171875, 0.6279296875, 0.754425048828125, 0.88092041015625, 1.007415771484375, 1.1339111328125, 1.260406494140625, 1.38690185546875, 1.513397216796875, 1.639892578125, 1.766387939453125, 1.89288330078125, 2.019378662109375, 2.1458740234375, 2.272369384765625, 2.39886474609375, 2.525360107421875, 2.65185546875, 2.778350830078125, 2.90484619140625, 3.031341552734375, 3.1578369140625, 3.284332275390625, 3.41082763671875, 3.537322998046875, 3.663818359375, 3.790313720703125, 3.91680908203125, 4.043304443359375, 4.1697998046875, 4.296295166015625, 4.42279052734375, 4.549285888671875, 4.67578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 5.0, 7.0, 14.0, 14.0, 26.0, 24.0, 21.0, 26.0, 26.0, 30.0, 40.0, 46.0, 39.0, 46.0, 67.0, 121.0, 348.0, 1444.0, 155.0, 85.0, 47.0, 51.0, 38.0, 46.0, 41.0, 28.0, 23.0, 18.0, 25.0, 24.0, 22.0, 20.0, 9.0, 8.0, 10.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.2982177734375, -5.127685546875, -4.9571533203125, -4.78662109375, -4.6160888671875, -4.445556640625, -4.2750244140625, -4.1044921875, -3.9339599609375, -3.763427734375, -3.5928955078125, -3.42236328125, -3.2518310546875, -3.081298828125, -2.9107666015625, -2.740234375, -2.5697021484375, -2.399169921875, -2.2286376953125, -2.05810546875, -1.8875732421875, -1.717041015625, -1.5465087890625, -1.3759765625, -1.2054443359375, -1.034912109375, -0.8643798828125, -0.69384765625, -0.5233154296875, -0.352783203125, -0.1822509765625, -0.01171875, 0.1588134765625, 0.329345703125, 0.4998779296875, 0.67041015625, 0.8409423828125, 1.011474609375, 1.1820068359375, 1.3525390625, 1.5230712890625, 1.693603515625, 1.8641357421875, 2.03466796875, 2.2052001953125, 2.375732421875, 2.5462646484375, 2.716796875, 2.8873291015625, 3.057861328125, 3.2283935546875, 3.39892578125, 3.5694580078125, 3.739990234375, 3.9105224609375, 4.0810546875, 4.2515869140625, 4.422119140625, 4.5926513671875, 4.76318359375, 4.9337158203125, 5.104248046875, 5.2747802734375, 5.4453125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 13.0, 5.0, 12.0, 23.0, 29.0, 25.0, 35.0, 60.0, 93.0, 116.0, 196.0, 413.0, 864.0, 2332.0, 9270.0, 71169.0, 2889610.0, 151773.0, 14224.0, 3195.0, 1074.0, 448.0, 241.0, 137.0, 91.0, 58.0, 45.0, 34.0, 25.0, 22.0, 15.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.625, -10.29931640625, -9.9736328125, -9.64794921875, -9.322265625, -8.99658203125, -8.6708984375, -8.34521484375, -8.01953125, -7.69384765625, -7.3681640625, -7.04248046875, -6.716796875, -6.39111328125, -6.0654296875, -5.73974609375, -5.4140625, -5.08837890625, -4.7626953125, -4.43701171875, -4.111328125, -3.78564453125, -3.4599609375, -3.13427734375, -2.80859375, -2.48291015625, -2.1572265625, -1.83154296875, -1.505859375, -1.18017578125, -0.8544921875, -0.52880859375, -0.203125, 0.12255859375, 0.4482421875, 0.77392578125, 1.099609375, 1.42529296875, 1.7509765625, 2.07666015625, 2.40234375, 2.72802734375, 3.0537109375, 3.37939453125, 3.705078125, 4.03076171875, 4.3564453125, 4.68212890625, 5.0078125, 5.33349609375, 5.6591796875, 5.98486328125, 6.310546875, 6.63623046875, 6.9619140625, 7.28759765625, 7.61328125, 7.93896484375, 8.2646484375, 8.59033203125, 8.916015625, 9.24169921875, 9.5673828125, 9.89306640625, 10.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 13.0, 26.0, 56.0, 90.0, 120.0, 185.0, 181.0, 140.0, 91.0, 60.0, 20.0, 13.0, 11.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.342370986938477, -16.93958854675293, -16.536806106567383, -16.134023666381836, -15.731240272521973, -15.328457832336426, -14.925675392150879, -14.522891998291016, -14.120109558105469, -13.717327117919922, -13.314544677734375, -12.911761283874512, -12.508978843688965, -12.106196403503418, -11.703413963317871, -11.300630569458008, -10.897848129272461, -10.495065689086914, -10.092283248901367, -9.689499855041504, -9.286717414855957, -8.88393497467041, -8.481152534484863, -8.078369140625, -7.6755876541137695, -7.272805213928223, -6.870022296905518, -6.467239856719971, -6.064456939697266, -5.661674499511719, -5.258892059326172, -4.856109142303467, -4.453326225280762, -4.050543785095215, -3.6477608680725098, -3.244978427886963, -2.842195510864258, -2.439413070678711, -2.036630392074585, -1.633847713470459, -1.231065034866333, -0.828282356262207, -0.42549973726272583, -0.02271711826324463, 0.38006556034088135, 0.7828481197357178, 1.1856307983398438, 1.5884134769439697, 1.9911961555480957, 2.3939788341522217, 2.7967615127563477, 3.1995439529418945, 3.6023268699645996, 4.0051093101501465, 4.407892227172852, 4.810674667358398, 5.213457107543945, 5.616239547729492, 6.019022464752197, 6.421804904937744, 6.824587821960449, 7.227370262145996, 7.630152702331543, 8.032936096191406, 8.435718536376953]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 1.0, 8.0, 14.0, 11.0, 10.0, 22.0, 14.0, 21.0, 22.0, 18.0, 20.0, 25.0, 28.0, 31.0, 41.0, 46.0, 33.0, 56.0, 42.0, 32.0, 37.0, 53.0, 41.0, 39.0, 36.0, 37.0, 32.0, 31.0, 34.0, 24.0, 19.0, 18.0, 17.0, 12.0, 13.0, 8.0, 5.0, 10.0, 8.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.799412727355957, -13.32646369934082, -12.853514671325684, -12.380565643310547, -11.907617568969727, -11.43466854095459, -10.961719512939453, -10.488770484924316, -10.01582145690918, -9.542872428894043, -9.069923400878906, -8.596975326538086, -8.12402629852295, -7.6510772705078125, -7.178128242492676, -6.705179214477539, -6.232231140136719, -5.759282112121582, -5.2863335609436035, -4.813384532928467, -4.340435981750488, -3.8674869537353516, -3.394537925720215, -2.9215891361236572, -2.4486403465270996, -1.975691556930542, -1.5027426481246948, -1.0297937393188477, -0.55684494972229, -0.08389616012573242, 0.3890528678894043, 0.8620016574859619, 1.3349494934082031, 1.8078982830047607, 2.2808470726013184, 2.753796100616455, 3.2267448902130127, 3.6996936798095703, 4.172642707824707, 4.645591735839844, 5.118540287017822, 5.591489315032959, 6.0644378662109375, 6.537386894226074, 7.010335922241211, 7.4832844734191895, 7.956233501434326, 8.429182052612305, 8.902131080627441, 9.375080108642578, 9.848029136657715, 10.320978164672852, 10.793926239013672, 11.266875267028809, 11.739824295043945, 12.212773323059082, 12.685722351074219, 13.158671379089355, 13.631620407104492, 14.104568481445312, 14.57751750946045, 15.050466537475586, 15.523415565490723, 15.99636459350586, 16.46931266784668]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 3.0, 12.0, 14.0, 11.0, 26.0, 15.0, 14.0, 31.0, 38.0, 36.0, 37.0, 36.0, 38.0, 56.0, 40.0, 42.0, 51.0, 30.0, 44.0, 48.0, 59.0, 46.0, 30.0, 32.0, 28.0, 24.0, 26.0, 15.0, 23.0, 10.0, 15.0, 13.0, 9.0, 9.0, 6.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.0925445556640625, -2.028839111328125, -1.9651336669921875, -1.90142822265625, -1.8377227783203125, -1.774017333984375, -1.7103118896484375, -1.6466064453125, -1.5829010009765625, -1.519195556640625, -1.4554901123046875, -1.39178466796875, -1.3280792236328125, -1.264373779296875, -1.2006683349609375, -1.136962890625, -1.0732574462890625, -1.009552001953125, -0.9458465576171875, -0.88214111328125, -0.8184356689453125, -0.754730224609375, -0.6910247802734375, -0.6273193359375, -0.5636138916015625, -0.499908447265625, -0.4362030029296875, -0.37249755859375, -0.3087921142578125, -0.245086669921875, -0.1813812255859375, -0.11767578125, -0.0539703369140625, 0.009735107421875, 0.0734405517578125, 0.13714599609375, 0.2008514404296875, 0.264556884765625, 0.3282623291015625, 0.3919677734375, 0.4556732177734375, 0.519378662109375, 0.5830841064453125, 0.64678955078125, 0.7104949951171875, 0.774200439453125, 0.8379058837890625, 0.901611328125, 0.9653167724609375, 1.029022216796875, 1.0927276611328125, 1.15643310546875, 1.2201385498046875, 1.283843994140625, 1.3475494384765625, 1.4112548828125, 1.4749603271484375, 1.538665771484375, 1.6023712158203125, 1.66607666015625, 1.7297821044921875, 1.793487548828125, 1.8571929931640625, 1.9208984375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 7.0, 10.0, 10.0, 14.0, 17.0, 25.0, 43.0, 47.0, 98.0, 111.0, 208.0, 311.0, 530.0, 825.0, 1512.0, 2720.0, 5484.0, 12120.0, 31892.0, 125431.0, 842991.0, 2412240.0, 610684.0, 97824.0, 27526.0, 10628.0, 4987.0, 2532.0, 1431.0, 775.0, 492.0, 272.0, 174.0, 106.0, 65.0, 40.0, 32.0, 21.0, 12.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.587890625, -3.48052978515625, -3.3731689453125, -3.26580810546875, -3.158447265625, -3.05108642578125, -2.9437255859375, -2.83636474609375, -2.72900390625, -2.62164306640625, -2.5142822265625, -2.40692138671875, -2.299560546875, -2.19219970703125, -2.0848388671875, -1.97747802734375, -1.8701171875, -1.76275634765625, -1.6553955078125, -1.54803466796875, -1.440673828125, -1.33331298828125, -1.2259521484375, -1.11859130859375, -1.01123046875, -0.90386962890625, -0.7965087890625, -0.68914794921875, -0.581787109375, -0.47442626953125, -0.3670654296875, -0.25970458984375, -0.15234375, -0.04498291015625, 0.0623779296875, 0.16973876953125, 0.277099609375, 0.38446044921875, 0.4918212890625, 0.59918212890625, 0.70654296875, 0.81390380859375, 0.9212646484375, 1.02862548828125, 1.135986328125, 1.24334716796875, 1.3507080078125, 1.45806884765625, 1.5654296875, 1.67279052734375, 1.7801513671875, 1.88751220703125, 1.994873046875, 2.10223388671875, 2.2095947265625, 2.31695556640625, 2.42431640625, 2.53167724609375, 2.6390380859375, 2.74639892578125, 2.853759765625, 2.96112060546875, 3.0684814453125, 3.17584228515625, 3.283203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 5.0, 4.0, 12.0, 16.0, 16.0, 21.0, 27.0, 38.0, 76.0, 78.0, 99.0, 129.0, 186.0, 294.0, 389.0, 508.0, 528.0, 459.0, 329.0, 230.0, 154.0, 113.0, 72.0, 71.0, 54.0, 32.0, 29.0, 35.0, 14.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.96484375, -2.875396728515625, -2.78594970703125, -2.696502685546875, -2.6070556640625, -2.517608642578125, -2.42816162109375, -2.338714599609375, -2.249267578125, -2.159820556640625, -2.07037353515625, -1.980926513671875, -1.8914794921875, -1.802032470703125, -1.71258544921875, -1.623138427734375, -1.53369140625, -1.444244384765625, -1.35479736328125, -1.265350341796875, -1.1759033203125, -1.086456298828125, -0.99700927734375, -0.907562255859375, -0.818115234375, -0.728668212890625, -0.63922119140625, -0.549774169921875, -0.4603271484375, -0.370880126953125, -0.28143310546875, -0.191986083984375, -0.1025390625, -0.013092041015625, 0.07635498046875, 0.165802001953125, 0.2552490234375, 0.344696044921875, 0.43414306640625, 0.523590087890625, 0.613037109375, 0.702484130859375, 0.79193115234375, 0.881378173828125, 0.9708251953125, 1.060272216796875, 1.14971923828125, 1.239166259765625, 1.32861328125, 1.418060302734375, 1.50750732421875, 1.596954345703125, 1.6864013671875, 1.775848388671875, 1.86529541015625, 1.954742431640625, 2.044189453125, 2.133636474609375, 2.22308349609375, 2.312530517578125, 2.4019775390625, 2.491424560546875, 2.58087158203125, 2.670318603515625, 2.759765625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 15.0, 30.0, 41.0, 50.0, 68.0, 119.0, 182.0, 232.0, 481.0, 914.0, 2104.0, 6826.0, 30855.0, 274431.0, 3461930.0, 366515.0, 36954.0, 7972.0, 2280.0, 953.0, 478.0, 274.0, 171.0, 122.0, 62.0, 50.0, 24.0, 18.0, 23.0, 17.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.4248046875, -7.189453125, -6.9541015625, -6.71875, -6.4833984375, -6.248046875, -6.0126953125, -5.77734375, -5.5419921875, -5.306640625, -5.0712890625, -4.8359375, -4.6005859375, -4.365234375, -4.1298828125, -3.89453125, -3.6591796875, -3.423828125, -3.1884765625, -2.953125, -2.7177734375, -2.482421875, -2.2470703125, -2.01171875, -1.7763671875, -1.541015625, -1.3056640625, -1.0703125, -0.8349609375, -0.599609375, -0.3642578125, -0.12890625, 0.1064453125, 0.341796875, 0.5771484375, 0.8125, 1.0478515625, 1.283203125, 1.5185546875, 1.75390625, 1.9892578125, 2.224609375, 2.4599609375, 2.6953125, 2.9306640625, 3.166015625, 3.4013671875, 3.63671875, 3.8720703125, 4.107421875, 4.3427734375, 4.578125, 4.8134765625, 5.048828125, 5.2841796875, 5.51953125, 5.7548828125, 5.990234375, 6.2255859375, 6.4609375, 6.6962890625, 6.931640625, 7.1669921875, 7.40234375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 43.0, 121.0, 303.0, 323.0, 152.0, 49.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.864646911621094, -43.6187744140625, -42.37290573120117, -41.127037048339844, -39.88116455078125, -38.635292053222656, -37.38942337036133, -36.1435546875, -34.897682189941406, -33.65180969238281, -32.405941009521484, -31.160070419311523, -29.914199829101562, -28.6683292388916, -27.42245864868164, -26.17658805847168, -24.93071746826172, -23.684846878051758, -22.438976287841797, -21.193105697631836, -19.947235107421875, -18.701364517211914, -17.455493927001953, -16.209623336791992, -14.963752746582031, -13.71788215637207, -12.47201156616211, -11.226140975952148, -9.980270385742188, -8.734399795532227, -7.488529205322266, -6.242658615112305, -4.996788024902344, -3.750917434692383, -2.505046844482422, -1.259176254272461, -0.0133056640625, 1.232564926147461, 2.478435516357422, 3.724306106567383, 4.970176696777344, 6.216047286987305, 7.461917877197266, 8.707788467407227, 9.953659057617188, 11.199529647827148, 12.44540023803711, 13.69127082824707, 14.937141418457031, 16.183012008666992, 17.428882598876953, 18.674753189086914, 19.920623779296875, 21.166494369506836, 22.412364959716797, 23.658235549926758, 24.90410614013672, 26.14997673034668, 27.39584732055664, 28.6417179107666, 29.887588500976562, 31.133459091186523, 32.379329681396484, 33.62519836425781, 34.871070861816406]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 6.0, 9.0, 6.0, 16.0, 15.0, 16.0, 23.0, 28.0, 21.0, 25.0, 31.0, 28.0, 34.0, 33.0, 42.0, 42.0, 45.0, 27.0, 42.0, 40.0, 36.0, 35.0, 44.0, 37.0, 35.0, 29.0, 35.0, 27.0, 24.0, 29.0, 16.0, 19.0, 19.0, 16.0, 13.0, 7.0, 13.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.684999465942383, -8.395992279052734, -8.10698413848877, -7.817976951599121, -7.5289692878723145, -7.239961624145508, -6.950954437255859, -6.661946773529053, -6.372939109802246, -6.0839314460754395, -5.794924259185791, -5.505916595458984, -5.216908931732178, -4.927901268005371, -4.638894081115723, -4.349886417388916, -4.060879230499268, -3.77187180519104, -3.4828641414642334, -3.193856716156006, -2.904849052429199, -2.6158416271209717, -2.326834201812744, -2.0378265380859375, -1.74881911277771, -1.4598115682601929, -1.1708040237426758, -0.8817965984344482, -0.5927890539169312, -0.30378150939941406, -0.014774084091186523, 0.2742335796356201, 0.5632410049438477, 0.8522485494613647, 1.1412560939788818, 1.4302635192871094, 1.7192710638046265, 2.0082786083221436, 2.297286033630371, 2.5862936973571777, 2.8753011226654053, 3.164308547973633, 3.4533162117004395, 3.742323637008667, 4.0313310623168945, 4.320338726043701, 4.609346389770508, 4.898353576660156, 5.187361240386963, 5.4763689041137695, 5.765376091003418, 6.054383754730225, 6.343391418457031, 6.63239860534668, 6.921406269073486, 7.210413932800293, 7.499421119689941, 7.788428783416748, 8.077436447143555, 8.366443634033203, 8.655450820922852, 8.944458961486816, 9.233466148376465, 9.52247428894043, 9.811481475830078]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 9.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 15.0, 15.0, 21.0, 30.0, 31.0, 30.0, 31.0, 45.0, 36.0, 35.0, 43.0, 40.0, 49.0, 53.0, 59.0, 52.0, 49.0, 31.0, 45.0, 29.0, 24.0, 28.0, 30.0, 15.0, 18.0, 14.0, 11.0, 12.0, 11.0, 14.0, 5.0, 8.0, 3.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.158203125, -2.0951690673828125, -2.032135009765625, -1.9691009521484375, -1.90606689453125, -1.8430328369140625, -1.779998779296875, -1.7169647216796875, -1.6539306640625, -1.5908966064453125, -1.527862548828125, -1.4648284912109375, -1.40179443359375, -1.3387603759765625, -1.275726318359375, -1.2126922607421875, -1.149658203125, -1.0866241455078125, -1.023590087890625, -0.9605560302734375, -0.89752197265625, -0.8344879150390625, -0.771453857421875, -0.7084197998046875, -0.6453857421875, -0.5823516845703125, -0.519317626953125, -0.4562835693359375, -0.39324951171875, -0.3302154541015625, -0.267181396484375, -0.2041473388671875, -0.14111328125, -0.0780792236328125, -0.015045166015625, 0.0479888916015625, 0.11102294921875, 0.1740570068359375, 0.237091064453125, 0.3001251220703125, 0.3631591796875, 0.4261932373046875, 0.489227294921875, 0.5522613525390625, 0.61529541015625, 0.6783294677734375, 0.741363525390625, 0.8043975830078125, 0.867431640625, 0.9304656982421875, 0.993499755859375, 1.0565338134765625, 1.11956787109375, 1.1826019287109375, 1.245635986328125, 1.3086700439453125, 1.3717041015625, 1.4347381591796875, 1.497772216796875, 1.5608062744140625, 1.62384033203125, 1.6868743896484375, 1.749908447265625, 1.8129425048828125, 1.8759765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 19.0, 16.0, 35.0, 48.0, 91.0, 154.0, 233.0, 356.0, 520.0, 870.0, 1424.0, 2172.0, 3503.0, 5448.0, 8578.0, 13411.0, 20996.0, 32253.0, 48264.0, 72016.0, 102473.0, 132454.0, 148352.0, 134352.0, 104011.0, 74081.0, 49665.0, 33284.0, 21473.0, 13749.0, 8790.0, 5554.0, 3619.0, 2264.0, 1468.0, 937.0, 631.0, 378.0, 216.0, 134.0, 96.0, 60.0, 28.0, 20.0, 22.0, 13.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2476806640625, -0.23956871032714844, -0.23145675659179688, -0.2233448028564453, -0.21523284912109375, -0.2071208953857422, -0.19900894165039062, -0.19089698791503906, -0.1827850341796875, -0.17467308044433594, -0.16656112670898438, -0.1584491729736328, -0.15033721923828125, -0.1422252655029297, -0.13411331176757812, -0.12600135803222656, -0.117889404296875, -0.10977745056152344, -0.10166549682617188, -0.09355354309082031, -0.08544158935546875, -0.07732963562011719, -0.06921768188476562, -0.06110572814941406, -0.0529937744140625, -0.04488182067871094, -0.036769866943359375, -0.028657913208007812, -0.02054595947265625, -0.012434005737304688, -0.004322052001953125, 0.0037899017333984375, 0.01190185546875, 0.020013809204101562, 0.028125762939453125, 0.03623771667480469, 0.04434967041015625, 0.05246162414550781, 0.060573577880859375, 0.06868553161621094, 0.0767974853515625, 0.08490943908691406, 0.09302139282226562, 0.10113334655761719, 0.10924530029296875, 0.11735725402832031, 0.12546920776367188, 0.13358116149902344, 0.141693115234375, 0.14980506896972656, 0.15791702270507812, 0.1660289764404297, 0.17414093017578125, 0.1822528839111328, 0.19036483764648438, 0.19847679138183594, 0.2065887451171875, 0.21470069885253906, 0.22281265258789062, 0.2309246063232422, 0.23903656005859375, 0.2471485137939453, 0.2552604675292969, 0.26337242126464844, 0.271484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 7.0, 13.0, 7.0, 16.0, 23.0, 20.0, 22.0, 18.0, 27.0, 22.0, 32.0, 27.0, 26.0, 32.0, 50.0, 29.0, 38.0, 48.0, 1064.0, 40.0, 46.0, 27.0, 45.0, 33.0, 29.0, 32.0, 31.0, 28.0, 27.0, 23.0, 21.0, 20.0, 13.0, 11.0, 7.0, 12.0, 11.0, 6.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2666015625, -1.22613525390625, -1.1856689453125, -1.14520263671875, -1.104736328125, -1.06427001953125, -1.0238037109375, -0.98333740234375, -0.94287109375, -0.90240478515625, -0.8619384765625, -0.82147216796875, -0.781005859375, -0.74053955078125, -0.7000732421875, -0.65960693359375, -0.619140625, -0.57867431640625, -0.5382080078125, -0.49774169921875, -0.457275390625, -0.41680908203125, -0.3763427734375, -0.33587646484375, -0.29541015625, -0.25494384765625, -0.2144775390625, -0.17401123046875, -0.133544921875, -0.09307861328125, -0.0526123046875, -0.01214599609375, 0.0283203125, 0.06878662109375, 0.1092529296875, 0.14971923828125, 0.190185546875, 0.23065185546875, 0.2711181640625, 0.31158447265625, 0.35205078125, 0.39251708984375, 0.4329833984375, 0.47344970703125, 0.513916015625, 0.55438232421875, 0.5948486328125, 0.63531494140625, 0.67578125, 0.71624755859375, 0.7567138671875, 0.79718017578125, 0.837646484375, 0.87811279296875, 0.9185791015625, 0.95904541015625, 0.99951171875, 1.03997802734375, 1.0804443359375, 1.12091064453125, 1.161376953125, 1.20184326171875, 1.2423095703125, 1.28277587890625, 1.3232421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 14.0, 19.0, 30.0, 47.0, 54.0, 100.0, 123.0, 180.0, 231.0, 314.0, 471.0, 712.0, 990.0, 1456.0, 2315.0, 3339.0, 4974.0, 7474.0, 11378.0, 18604.0, 41612.0, 262182.0, 1571324.0, 98122.0, 27431.0, 14745.0, 9313.0, 6198.0, 4155.0, 2946.0, 1902.0, 1355.0, 907.0, 612.0, 432.0, 297.0, 223.0, 148.0, 102.0, 72.0, 60.0, 46.0, 26.0, 28.0, 15.0, 14.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412841796875, -0.39920806884765625, -0.3855743408203125, -0.37194061279296875, -0.358306884765625, -0.34467315673828125, -0.3310394287109375, -0.31740570068359375, -0.30377197265625, -0.29013824462890625, -0.2765045166015625, -0.26287078857421875, -0.249237060546875, -0.23560333251953125, -0.2219696044921875, -0.20833587646484375, -0.1947021484375, -0.18106842041015625, -0.1674346923828125, -0.15380096435546875, -0.140167236328125, -0.12653350830078125, -0.1128997802734375, -0.09926605224609375, -0.08563232421875, -0.07199859619140625, -0.0583648681640625, -0.04473114013671875, -0.031097412109375, -0.01746368408203125, -0.0038299560546875, 0.00980377197265625, 0.0234375, 0.03707122802734375, 0.0507049560546875, 0.06433868408203125, 0.077972412109375, 0.09160614013671875, 0.1052398681640625, 0.11887359619140625, 0.13250732421875, 0.14614105224609375, 0.1597747802734375, 0.17340850830078125, 0.187042236328125, 0.20067596435546875, 0.2143096923828125, 0.22794342041015625, 0.2415771484375, 0.25521087646484375, 0.2688446044921875, 0.28247833251953125, 0.296112060546875, 0.30974578857421875, 0.3233795166015625, 0.33701324462890625, 0.35064697265625, 0.36428070068359375, 0.3779144287109375, 0.39154815673828125, 0.405181884765625, 0.41881561279296875, 0.4324493408203125, 0.44608306884765625, 0.459716796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 4.0, 6.0, 10.0, 10.0, 7.0, 12.0, 15.0, 22.0, 36.0, 27.0, 26.0, 35.0, 40.0, 43.0, 44.0, 56.0, 55.0, 48.0, 64.0, 54.0, 49.0, 60.0, 38.0, 40.0, 34.0, 20.0, 22.0, 15.0, 12.0, 14.0, 17.0, 8.0, 9.0, 10.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0222625732421875, -0.02152729034423828, -0.020792007446289062, -0.020056724548339844, -0.019321441650390625, -0.018586158752441406, -0.017850875854492188, -0.01711559295654297, -0.01638031005859375, -0.01564502716064453, -0.014909744262695312, -0.014174461364746094, -0.013439178466796875, -0.012703895568847656, -0.011968612670898438, -0.011233329772949219, -0.010498046875, -0.009762763977050781, -0.009027481079101562, -0.008292198181152344, -0.007556915283203125, -0.006821632385253906, -0.0060863494873046875, -0.005351066589355469, -0.00461578369140625, -0.0038805007934570312, -0.0031452178955078125, -0.0024099349975585938, -0.001674652099609375, -0.0009393692016601562, -0.0002040863037109375, 0.0005311965942382812, 0.0012664794921875, 0.0020017623901367188, 0.0027370452880859375, 0.0034723281860351562, 0.004207611083984375, 0.004942893981933594, 0.0056781768798828125, 0.006413459777832031, 0.00714874267578125, 0.007884025573730469, 0.008619308471679688, 0.009354591369628906, 0.010089874267578125, 0.010825157165527344, 0.011560440063476562, 0.012295722961425781, 0.013031005859375, 0.013766288757324219, 0.014501571655273438, 0.015236854553222656, 0.015972137451171875, 0.016707420349121094, 0.017442703247070312, 0.01817798614501953, 0.01891326904296875, 0.01964855194091797, 0.020383834838867188, 0.021119117736816406, 0.021854400634765625, 0.022589683532714844, 0.023324966430664062, 0.02406024932861328, 0.0247955322265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 8.0, 11.0, 11.0, 16.0, 21.0, 15.0, 27.0, 38.0, 60.0, 71.0, 102.0, 139.0, 223.0, 471.0, 2133.0, 260482.0, 778236.0, 5083.0, 571.0, 232.0, 165.0, 101.0, 61.0, 56.0, 34.0, 43.0, 30.0, 15.0, 14.0, 13.0, 7.0, 6.0, 5.0, 5.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52734375, -0.5118904113769531, -0.49643707275390625, -0.4809837341308594, -0.4655303955078125, -0.4500770568847656, -0.43462371826171875, -0.4191703796386719, -0.403717041015625, -0.3882637023925781, -0.37281036376953125, -0.3573570251464844, -0.3419036865234375, -0.3264503479003906, -0.31099700927734375, -0.2955436706542969, -0.28009033203125, -0.2646369934082031, -0.24918365478515625, -0.23373031616210938, -0.2182769775390625, -0.20282363891601562, -0.18737030029296875, -0.17191696166992188, -0.156463623046875, -0.14101028442382812, -0.12555694580078125, -0.11010360717773438, -0.0946502685546875, -0.07919692993164062, -0.06374359130859375, -0.048290252685546875, -0.0328369140625, -0.017383575439453125, -0.00193023681640625, 0.013523101806640625, 0.0289764404296875, 0.044429779052734375, 0.05988311767578125, 0.07533645629882812, 0.090789794921875, 0.10624313354492188, 0.12169647216796875, 0.13714981079101562, 0.1526031494140625, 0.16805648803710938, 0.18350982666015625, 0.19896316528320312, 0.21441650390625, 0.22986984252929688, 0.24532318115234375, 0.2607765197753906, 0.2762298583984375, 0.2916831970214844, 0.30713653564453125, 0.3225898742675781, 0.338043212890625, 0.3534965515136719, 0.36894989013671875, 0.3844032287597656, 0.3998565673828125, 0.4153099060058594, 0.43076324462890625, 0.4462165832519531, 0.461669921875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 606.0, 387.0, 13.0], "bins": [-0.7706297636032104, -0.7581807374954224, -0.7457316517829895, -0.7332825660705566, -0.7208335399627686, -0.7083845138549805, -0.6959354281425476, -0.6834863424301147, -0.6710373163223267, -0.6585882902145386, -0.6461392045021057, -0.6336901187896729, -0.6212410926818848, -0.6087920665740967, -0.5963429808616638, -0.583893895149231, -0.5714448690414429, -0.5589958429336548, -0.5465467572212219, -0.5340976715087891, -0.521648645401001, -0.5091996192932129, -0.49675053358078003, -0.48430147767066956, -0.4718524217605591, -0.4594033658504486, -0.44695430994033813, -0.43450525403022766, -0.4220561981201172, -0.4096071422100067, -0.39715808629989624, -0.38470903038978577, -0.3722599446773529, -0.35981088876724243, -0.34736183285713196, -0.3349127769470215, -0.322463721036911, -0.31001466512680054, -0.29756560921669006, -0.2851165533065796, -0.2726674973964691, -0.26021844148635864, -0.24776938557624817, -0.2353203296661377, -0.22287127375602722, -0.21042221784591675, -0.19797316193580627, -0.1855241060256958, -0.17307506501674652, -0.16062600910663605, -0.14817695319652557, -0.1357278972864151, -0.12327884137630463, -0.11082978546619415, -0.09838072955608368, -0.0859316736459732, -0.07348261028528214, -0.06103355437517166, -0.04858449846506119, -0.036135442554950714, -0.02368638664484024, -0.011237330734729767, 0.0012117251753807068, 0.01366078108549118, 0.026109835132956505]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 10.0, 5.0, 8.0, 11.0, 13.0, 12.0, 14.0, 19.0, 25.0, 31.0, 36.0, 27.0, 27.0, 33.0, 53.0, 42.0, 49.0, 42.0, 38.0, 39.0, 50.0, 39.0, 43.0, 38.0, 39.0, 37.0, 30.0, 30.0, 30.0, 22.0, 16.0, 16.0, 16.0, 7.0, 12.0, 5.0, 7.0, 7.0, 2.0, 5.0, 1.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02419590950012207, -0.02327083796262741, -0.0223457682877779, -0.02142069861292839, -0.02049562707543373, -0.01957055553793907, -0.01864548586308956, -0.01772041618824005, -0.016795344650745392, -0.015870273113250732, -0.014945203438401222, -0.014020132832229137, -0.013095062226057053, -0.012169991619884968, -0.011244921013712883, -0.010319850407540798, -0.009394779801368713, -0.008469709195196629, -0.007544638589024544, -0.006619567982852459, -0.005694497376680374, -0.004769426770508289, -0.0038443561643362045, -0.0029192855581641197, -0.001994214951992035, -0.00106914434581995, -0.0001440737396478653, 0.0007809968665242195, 0.0017060674726963043, 0.002631138078868389, 0.003556208685040474, 0.004481279291212559, 0.0054063498973846436, 0.006331420503556728, 0.007256491109728813, 0.008181561715900898, 0.009106632322072983, 0.010031702928245068, 0.010956773534417152, 0.011881844140589237, 0.012806914746761322, 0.013731985352933407, 0.014657055959105492, 0.015582126565277576, 0.01650719717144966, 0.01743226870894432, 0.01835733838379383, 0.01928240805864334, 0.020207479596138, 0.02113255113363266, 0.02205762080848217, 0.02298269048333168, 0.02390776202082634, 0.024832833558321, 0.02575790323317051, 0.02668297290802002, 0.02760804444551468, 0.02853311598300934, 0.02945818565785885, 0.03038325533270836, 0.03130832687020302, 0.03223339840769768, 0.03315846621990204, 0.0340835377573967, 0.03500860929489136]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 5.0, 8.0, 16.0, 9.0, 12.0, 9.0, 17.0, 11.0, 19.0, 39.0, 36.0, 30.0, 35.0, 36.0, 41.0, 48.0, 53.0, 39.0, 32.0, 30.0, 59.0, 60.0, 49.0, 32.0, 30.0, 37.0, 44.0, 27.0, 21.0, 14.0, 16.0, 12.0, 10.0, 15.0, 8.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.0547637939453125, -1.992340087890625, -1.9299163818359375, -1.86749267578125, -1.8050689697265625, -1.742645263671875, -1.6802215576171875, -1.6177978515625, -1.5553741455078125, -1.492950439453125, -1.4305267333984375, -1.36810302734375, -1.3056793212890625, -1.243255615234375, -1.1808319091796875, -1.118408203125, -1.0559844970703125, -0.993560791015625, -0.9311370849609375, -0.86871337890625, -0.8062896728515625, -0.743865966796875, -0.6814422607421875, -0.6190185546875, -0.5565948486328125, -0.494171142578125, -0.4317474365234375, -0.36932373046875, -0.3069000244140625, -0.244476318359375, -0.1820526123046875, -0.11962890625, -0.0572052001953125, 0.005218505859375, 0.0676422119140625, 0.13006591796875, 0.1924896240234375, 0.254913330078125, 0.3173370361328125, 0.3797607421875, 0.4421844482421875, 0.504608154296875, 0.5670318603515625, 0.62945556640625, 0.6918792724609375, 0.754302978515625, 0.8167266845703125, 0.879150390625, 0.9415740966796875, 1.003997802734375, 1.0664215087890625, 1.12884521484375, 1.1912689208984375, 1.253692626953125, 1.3161163330078125, 1.3785400390625, 1.4409637451171875, 1.503387451171875, 1.5658111572265625, 1.62823486328125, 1.6906585693359375, 1.753082275390625, 1.8155059814453125, 1.8779296875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 11.0, 19.0, 27.0, 40.0, 56.0, 100.0, 109.0, 205.0, 310.0, 496.0, 784.0, 1225.0, 2176.0, 3475.0, 6252.0, 12274.0, 25550.0, 61560.0, 166665.0, 387771.0, 231774.0, 81061.0, 32797.0, 15308.0, 7870.0, 4235.0, 2503.0, 1442.0, 923.0, 512.0, 359.0, 231.0, 142.0, 80.0, 61.0, 48.0, 28.0, 26.0, 15.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0], "bins": [-3.044921875, -2.96405029296875, -2.8831787109375, -2.80230712890625, -2.721435546875, -2.64056396484375, -2.5596923828125, -2.47882080078125, -2.39794921875, -2.31707763671875, -2.2362060546875, -2.15533447265625, -2.074462890625, -1.99359130859375, -1.9127197265625, -1.83184814453125, -1.7509765625, -1.67010498046875, -1.5892333984375, -1.50836181640625, -1.427490234375, -1.34661865234375, -1.2657470703125, -1.18487548828125, -1.10400390625, -1.02313232421875, -0.9422607421875, -0.86138916015625, -0.780517578125, -0.69964599609375, -0.6187744140625, -0.53790283203125, -0.45703125, -0.37615966796875, -0.2952880859375, -0.21441650390625, -0.133544921875, -0.05267333984375, 0.0281982421875, 0.10906982421875, 0.18994140625, 0.27081298828125, 0.3516845703125, 0.43255615234375, 0.513427734375, 0.59429931640625, 0.6751708984375, 0.75604248046875, 0.8369140625, 0.91778564453125, 0.9986572265625, 1.07952880859375, 1.160400390625, 1.24127197265625, 1.3221435546875, 1.40301513671875, 1.48388671875, 1.56475830078125, 1.6456298828125, 1.72650146484375, 1.807373046875, 1.88824462890625, 1.9691162109375, 2.04998779296875, 2.130859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 12.0, 9.0, 17.0, 21.0, 16.0, 18.0, 26.0, 25.0, 23.0, 39.0, 30.0, 50.0, 51.0, 66.0, 110.0, 231.0, 1442.0, 275.0, 130.0, 81.0, 61.0, 41.0, 41.0, 33.0, 27.0, 32.0, 25.0, 20.0, 18.0, 13.0, 16.0, 10.0, 6.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.86328125, -3.6927490234375, -3.522216796875, -3.3516845703125, -3.18115234375, -3.0106201171875, -2.840087890625, -2.6695556640625, -2.4990234375, -2.3284912109375, -2.157958984375, -1.9874267578125, -1.81689453125, -1.6463623046875, -1.475830078125, -1.3052978515625, -1.134765625, -0.9642333984375, -0.793701171875, -0.6231689453125, -0.45263671875, -0.2821044921875, -0.111572265625, 0.0589599609375, 0.2294921875, 0.4000244140625, 0.570556640625, 0.7410888671875, 0.91162109375, 1.0821533203125, 1.252685546875, 1.4232177734375, 1.59375, 1.7642822265625, 1.934814453125, 2.1053466796875, 2.27587890625, 2.4464111328125, 2.616943359375, 2.7874755859375, 2.9580078125, 3.1285400390625, 3.299072265625, 3.4696044921875, 3.64013671875, 3.8106689453125, 3.981201171875, 4.1517333984375, 4.322265625, 4.4927978515625, 4.663330078125, 4.8338623046875, 5.00439453125, 5.1749267578125, 5.345458984375, 5.5159912109375, 5.6865234375, 5.8570556640625, 6.027587890625, 6.1981201171875, 6.36865234375, 6.5391845703125, 6.709716796875, 6.8802490234375, 7.05078125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 13.0, 13.0, 13.0, 20.0, 46.0, 57.0, 77.0, 126.0, 300.0, 664.0, 1954.0, 6869.0, 37737.0, 1083012.0, 1953373.0, 49513.0, 8178.0, 2279.0, 789.0, 289.0, 144.0, 85.0, 51.0, 29.0, 16.0, 14.0, 9.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.171875, -8.92437744140625, -8.6768798828125, -8.42938232421875, -8.181884765625, -7.93438720703125, -7.6868896484375, -7.43939208984375, -7.19189453125, -6.94439697265625, -6.6968994140625, -6.44940185546875, -6.201904296875, -5.95440673828125, -5.7069091796875, -5.45941162109375, -5.2119140625, -4.96441650390625, -4.7169189453125, -4.46942138671875, -4.221923828125, -3.97442626953125, -3.7269287109375, -3.47943115234375, -3.23193359375, -2.98443603515625, -2.7369384765625, -2.48944091796875, -2.241943359375, -1.99444580078125, -1.7469482421875, -1.49945068359375, -1.251953125, -1.00445556640625, -0.7569580078125, -0.50946044921875, -0.261962890625, -0.01446533203125, 0.2330322265625, 0.48052978515625, 0.72802734375, 0.97552490234375, 1.2230224609375, 1.47052001953125, 1.718017578125, 1.96551513671875, 2.2130126953125, 2.46051025390625, 2.7080078125, 2.95550537109375, 3.2030029296875, 3.45050048828125, 3.697998046875, 3.94549560546875, 4.1929931640625, 4.44049072265625, 4.68798828125, 4.93548583984375, 5.1829833984375, 5.43048095703125, 5.677978515625, 5.92547607421875, 6.1729736328125, 6.42047119140625, 6.66796875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 444.0, 558.0, 9.0], "bins": [-203.25067138671875, -199.97491455078125, -196.69915771484375, -193.4234161376953, -190.1476593017578, -186.8719024658203, -183.5961456298828, -180.32040405273438, -177.04464721679688, -173.76889038085938, -170.49313354492188, -167.21739196777344, -163.94163513183594, -160.66587829589844, -157.39012145996094, -154.1143798828125, -150.838623046875, -147.5628662109375, -144.287109375, -141.01136779785156, -137.73561096191406, -134.45985412597656, -131.18409729003906, -127.9083480834961, -124.63258361816406, -121.35682678222656, -118.0810775756836, -114.8053207397461, -111.52957153320312, -108.25381469726562, -104.97805786132812, -101.70230865478516, -98.42655944824219, -95.15080261230469, -91.87505340576172, -88.59929656982422, -85.32354736328125, -82.04779052734375, -78.77203369140625, -75.49628448486328, -72.22053527832031, -68.94477844238281, -65.66902923583984, -62.393272399902344, -59.117523193359375, -55.841766357421875, -52.56601333618164, -49.290260314941406, -46.014503479003906, -42.73875045776367, -39.46299743652344, -36.18724060058594, -32.91149139404297, -29.6357364654541, -26.359981536865234, -23.084228515625, -19.808475494384766, -16.53272247314453, -13.25696849822998, -9.98121452331543, -6.705461502075195, -3.429708480834961, -0.15395355224609375, 3.1217994689941406, 6.397552490234375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 5.0, 10.0, 14.0, 16.0, 10.0, 20.0, 19.0, 19.0, 34.0, 31.0, 25.0, 31.0, 37.0, 27.0, 38.0, 29.0, 39.0, 50.0, 36.0, 53.0, 44.0, 49.0, 38.0, 35.0, 26.0, 28.0, 30.0, 26.0, 15.0, 25.0, 17.0, 16.0, 12.0, 12.0, 16.0, 4.0, 10.0, 4.0, 12.0, 9.0, 6.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7178955078125, -11.34408187866211, -10.970268249511719, -10.596454620361328, -10.222640037536621, -9.84882640838623, -9.47501277923584, -9.10119915008545, -8.727384567260742, -8.353570938110352, -7.979756832122803, -7.605943202972412, -7.232129096984863, -6.858315467834473, -6.484501838684082, -6.110688209533691, -5.736874580383301, -5.36306095123291, -4.989246845245361, -4.615433216094971, -4.241619110107422, -3.8678054809570312, -3.4939918518066406, -3.120177984237671, -2.746364116668701, -2.3725502490997314, -1.9987365007400513, -1.624922752380371, -1.2511088848114014, -0.8772950172424316, -0.503481388092041, -0.1296675205230713, 0.24414634704589844, 0.6179601550102234, 0.9917739629745483, 1.3655877113342285, 1.7394015789031982, 2.113215446472168, 2.4870290756225586, 2.8608429431915283, 3.234656810760498, 3.6084706783294678, 3.9822845458984375, 4.356098175048828, 4.729911804199219, 5.103725910186768, 5.477539539337158, 5.851353645324707, 6.225167274475098, 6.598980903625488, 6.972795009613037, 7.346608638763428, 7.720422744750977, 8.094236373901367, 8.468050003051758, 8.841863632202148, 9.215677261352539, 9.58949089050293, 9.96330451965332, 10.337118148803711, 10.710932731628418, 11.084746360778809, 11.4585599899292, 11.83237361907959, 12.206188201904297]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 9.0, 10.0, 10.0, 13.0, 21.0, 21.0, 19.0, 28.0, 34.0, 42.0, 38.0, 34.0, 44.0, 40.0, 46.0, 47.0, 45.0, 43.0, 39.0, 50.0, 37.0, 39.0, 38.0, 42.0, 30.0, 26.0, 29.0, 22.0, 11.0, 8.0, 11.0, 9.0, 11.0, 6.0, 7.0, 4.0, 6.0, 7.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.189453125, -2.1242218017578125, -2.058990478515625, -1.9937591552734375, -1.92852783203125, -1.8632965087890625, -1.798065185546875, -1.7328338623046875, -1.6676025390625, -1.6023712158203125, -1.537139892578125, -1.4719085693359375, -1.40667724609375, -1.3414459228515625, -1.276214599609375, -1.2109832763671875, -1.145751953125, -1.0805206298828125, -1.015289306640625, -0.9500579833984375, -0.88482666015625, -0.8195953369140625, -0.754364013671875, -0.6891326904296875, -0.6239013671875, -0.5586700439453125, -0.493438720703125, -0.4282073974609375, -0.36297607421875, -0.2977447509765625, -0.232513427734375, -0.1672821044921875, -0.10205078125, -0.0368194580078125, 0.028411865234375, 0.0936431884765625, 0.15887451171875, 0.2241058349609375, 0.289337158203125, 0.3545684814453125, 0.4197998046875, 0.4850311279296875, 0.550262451171875, 0.6154937744140625, 0.68072509765625, 0.7459564208984375, 0.811187744140625, 0.8764190673828125, 0.941650390625, 1.0068817138671875, 1.072113037109375, 1.1373443603515625, 1.20257568359375, 1.2678070068359375, 1.333038330078125, 1.3982696533203125, 1.4635009765625, 1.5287322998046875, 1.593963623046875, 1.6591949462890625, 1.72442626953125, 1.7896575927734375, 1.854888916015625, 1.9201202392578125, 1.9853515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 12.0, 7.0, 7.0, 7.0, 7.0, 18.0, 18.0, 27.0, 52.0, 67.0, 85.0, 90.0, 160.0, 239.0, 306.0, 478.0, 659.0, 1048.0, 1721.0, 2689.0, 4738.0, 8844.0, 19592.0, 58414.0, 290522.0, 1647571.0, 1747638.0, 306015.0, 60990.0, 20366.0, 9255.0, 4824.0, 2776.0, 1707.0, 1057.0, 708.0, 456.0, 326.0, 222.0, 167.0, 112.0, 85.0, 51.0, 47.0, 39.0, 22.0, 11.0, 17.0, 9.0, 5.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.033203125, -2.9354248046875, -2.837646484375, -2.7398681640625, -2.64208984375, -2.5443115234375, -2.446533203125, -2.3487548828125, -2.2509765625, -2.1531982421875, -2.055419921875, -1.9576416015625, -1.85986328125, -1.7620849609375, -1.664306640625, -1.5665283203125, -1.46875, -1.3709716796875, -1.273193359375, -1.1754150390625, -1.07763671875, -0.9798583984375, -0.882080078125, -0.7843017578125, -0.6865234375, -0.5887451171875, -0.490966796875, -0.3931884765625, -0.29541015625, -0.1976318359375, -0.099853515625, -0.0020751953125, 0.095703125, 0.1934814453125, 0.291259765625, 0.3890380859375, 0.48681640625, 0.5845947265625, 0.682373046875, 0.7801513671875, 0.8779296875, 0.9757080078125, 1.073486328125, 1.1712646484375, 1.26904296875, 1.3668212890625, 1.464599609375, 1.5623779296875, 1.66015625, 1.7579345703125, 1.855712890625, 1.9534912109375, 2.05126953125, 2.1490478515625, 2.246826171875, 2.3446044921875, 2.4423828125, 2.5401611328125, 2.637939453125, 2.7357177734375, 2.83349609375, 2.9312744140625, 3.029052734375, 3.1268310546875, 3.224609375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 7.0, 8.0, 12.0, 11.0, 21.0, 29.0, 33.0, 47.0, 84.0, 99.0, 177.0, 212.0, 327.0, 501.0, 565.0, 548.0, 454.0, 281.0, 194.0, 150.0, 87.0, 36.0, 45.0, 34.0, 22.0, 16.0, 13.0, 13.0, 13.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.743804931640625, -2.65167236328125, -2.559539794921875, -2.4674072265625, -2.375274658203125, -2.28314208984375, -2.191009521484375, -2.098876953125, -2.006744384765625, -1.91461181640625, -1.822479248046875, -1.7303466796875, -1.638214111328125, -1.54608154296875, -1.453948974609375, -1.36181640625, -1.269683837890625, -1.17755126953125, -1.085418701171875, -0.9932861328125, -0.901153564453125, -0.80902099609375, -0.716888427734375, -0.624755859375, -0.532623291015625, -0.44049072265625, -0.348358154296875, -0.2562255859375, -0.164093017578125, -0.07196044921875, 0.020172119140625, 0.1123046875, 0.204437255859375, 0.29656982421875, 0.388702392578125, 0.4808349609375, 0.572967529296875, 0.66510009765625, 0.757232666015625, 0.849365234375, 0.941497802734375, 1.03363037109375, 1.125762939453125, 1.2178955078125, 1.310028076171875, 1.40216064453125, 1.494293212890625, 1.58642578125, 1.678558349609375, 1.77069091796875, 1.862823486328125, 1.9549560546875, 2.047088623046875, 2.13922119140625, 2.231353759765625, 2.323486328125, 2.415618896484375, 2.50775146484375, 2.599884033203125, 2.6920166015625, 2.784149169921875, 2.87628173828125, 2.968414306640625, 3.060546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 11.0, 12.0, 7.0, 22.0, 24.0, 34.0, 39.0, 59.0, 90.0, 131.0, 219.0, 350.0, 618.0, 1222.0, 2482.0, 5656.0, 14776.0, 46947.0, 209281.0, 2047530.0, 1626829.0, 173670.0, 41053.0, 13158.0, 5034.0, 2364.0, 1106.0, 598.0, 323.0, 205.0, 120.0, 73.0, 63.0, 53.0, 22.0, 24.0, 17.0, 10.0, 13.0, 5.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.64093017578125, -3.5006103515625, -3.36029052734375, -3.219970703125, -3.07965087890625, -2.9393310546875, -2.79901123046875, -2.65869140625, -2.51837158203125, -2.3780517578125, -2.23773193359375, -2.097412109375, -1.95709228515625, -1.8167724609375, -1.67645263671875, -1.5361328125, -1.39581298828125, -1.2554931640625, -1.11517333984375, -0.974853515625, -0.83453369140625, -0.6942138671875, -0.55389404296875, -0.41357421875, -0.27325439453125, -0.1329345703125, 0.00738525390625, 0.147705078125, 0.28802490234375, 0.4283447265625, 0.56866455078125, 0.708984375, 0.84930419921875, 0.9896240234375, 1.12994384765625, 1.270263671875, 1.41058349609375, 1.5509033203125, 1.69122314453125, 1.83154296875, 1.97186279296875, 2.1121826171875, 2.25250244140625, 2.392822265625, 2.53314208984375, 2.6734619140625, 2.81378173828125, 2.9541015625, 3.09442138671875, 3.2347412109375, 3.37506103515625, 3.515380859375, 3.65570068359375, 3.7960205078125, 3.93634033203125, 4.07666015625, 4.21697998046875, 4.3572998046875, 4.49761962890625, 4.637939453125, 4.77825927734375, 4.9185791015625, 5.05889892578125, 5.19921875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 6.0, 33.0, 112.0, 228.0, 315.0, 191.0, 97.0, 21.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-53.51313018798828, -52.47252655029297, -51.431922912597656, -50.39132308959961, -49.3507194519043, -48.310115814208984, -47.26951217651367, -46.22890853881836, -45.18830871582031, -44.147705078125, -43.10710144042969, -42.06650161743164, -41.02589797973633, -39.985294342041016, -38.9446907043457, -37.90408706665039, -36.86348342895508, -35.822879791259766, -34.78227615356445, -33.741676330566406, -32.701072692871094, -31.66046905517578, -30.61986541748047, -29.579261779785156, -28.538660049438477, -27.498056411743164, -26.457454681396484, -25.416851043701172, -24.37624740600586, -23.33564567565918, -22.295042037963867, -21.254440307617188, -20.21384048461914, -19.173236846923828, -18.13263511657715, -17.092031478881836, -16.051429748535156, -15.010826110839844, -13.970222473144531, -12.929619789123535, -11.889016151428223, -10.848413467407227, -9.807809829711914, -8.767207145690918, -7.726604461669922, -6.686001777648926, -5.6453986167907715, -4.604795455932617, -3.564192771911621, -2.523589849472046, -1.4829869270324707, -0.4423840045928955, 0.5982189178466797, 1.6388216018676758, 2.67942476272583, 3.7200279235839844, 4.7606306076049805, 5.801233291625977, 6.841836452484131, 7.882439613342285, 8.923042297363281, 9.963644981384277, 11.004247665405273, 12.044851303100586, 13.085453987121582]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 9.0, 13.0, 23.0, 20.0, 28.0, 28.0, 27.0, 33.0, 24.0, 27.0, 28.0, 45.0, 33.0, 40.0, 47.0, 32.0, 42.0, 33.0, 29.0, 44.0, 32.0, 35.0, 38.0, 34.0, 31.0, 26.0, 21.0, 20.0, 29.0, 14.0, 15.0, 14.0, 9.0, 8.0, 8.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.486639022827148, -8.215720176696777, -7.9448018074035645, -7.673883438110352, -7.4029645919799805, -7.132046222686768, -6.861127853393555, -6.590209007263184, -6.3192901611328125, -6.0483717918396, -5.7774529457092285, -5.506534576416016, -5.2356157302856445, -4.964697360992432, -4.693778991699219, -4.422860145568848, -4.151941776275635, -3.8810231685638428, -3.610104560852051, -3.339186191558838, -3.068267345428467, -2.797348976135254, -2.526430368423462, -2.25551176071167, -1.984593152999878, -1.713674545288086, -1.442755937576294, -1.1718374490737915, -0.9009188413619995, -0.6300002336502075, -0.3590817451477051, -0.08816313743591309, 0.1827554702758789, 0.4536740481853485, 0.7245926260948181, 0.9955111742019653, 1.2664297819137573, 1.5373483896255493, 1.8082668781280518, 2.0791854858398438, 2.3501040935516357, 2.6210227012634277, 2.8919413089752197, 3.1628599166870117, 3.4337782859802246, 3.7046971321105957, 3.9756155014038086, 4.24653434753418, 4.517452716827393, 4.7883710861206055, 5.059289932250977, 5.3302083015441895, 5.6011271476745605, 5.872045516967773, 6.1429643630981445, 6.413882732391357, 6.68480110168457, 6.955719470977783, 7.226638317108154, 7.497556686401367, 7.768475532531738, 8.03939437866211, 8.310312271118164, 8.581231117248535, 8.852149963378906]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 10.0, 14.0, 27.0, 23.0, 20.0, 27.0, 25.0, 37.0, 42.0, 24.0, 30.0, 35.0, 45.0, 43.0, 44.0, 58.0, 35.0, 40.0, 47.0, 50.0, 42.0, 36.0, 39.0, 31.0, 26.0, 17.0, 14.0, 15.0, 14.0, 14.0, 18.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9453125, -1.881927490234375, -1.81854248046875, -1.755157470703125, -1.6917724609375, -1.628387451171875, -1.56500244140625, -1.501617431640625, -1.438232421875, -1.374847412109375, -1.31146240234375, -1.248077392578125, -1.1846923828125, -1.121307373046875, -1.05792236328125, -0.994537353515625, -0.93115234375, -0.867767333984375, -0.80438232421875, -0.740997314453125, -0.6776123046875, -0.614227294921875, -0.55084228515625, -0.487457275390625, -0.424072265625, -0.360687255859375, -0.29730224609375, -0.233917236328125, -0.1705322265625, -0.107147216796875, -0.04376220703125, 0.019622802734375, 0.0830078125, 0.146392822265625, 0.20977783203125, 0.273162841796875, 0.3365478515625, 0.399932861328125, 0.46331787109375, 0.526702880859375, 0.590087890625, 0.653472900390625, 0.71685791015625, 0.780242919921875, 0.8436279296875, 0.907012939453125, 0.97039794921875, 1.033782958984375, 1.09716796875, 1.160552978515625, 1.22393798828125, 1.287322998046875, 1.3507080078125, 1.414093017578125, 1.47747802734375, 1.540863037109375, 1.604248046875, 1.667633056640625, 1.73101806640625, 1.794403076171875, 1.8577880859375, 1.921173095703125, 1.98455810546875, 2.047943115234375, 2.111328125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 17.0, 42.0, 54.0, 91.0, 128.0, 194.0, 269.0, 433.0, 577.0, 954.0, 1424.0, 2141.0, 3259.0, 4668.0, 6819.0, 10029.0, 14470.0, 21230.0, 30143.0, 42377.0, 58204.0, 77067.0, 96527.0, 113979.0, 118736.0, 108615.0, 90181.0, 70549.0, 52026.0, 38076.0, 26474.0, 18547.0, 12766.0, 8815.0, 6053.0, 4155.0, 2854.0, 1846.0, 1281.0, 842.0, 553.0, 383.0, 201.0, 156.0, 136.0, 65.0, 48.0, 31.0, 18.0, 17.0, 9.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.211181640625, -0.20444107055664062, -0.19770050048828125, -0.19095993041992188, -0.1842193603515625, -0.17747879028320312, -0.17073822021484375, -0.16399765014648438, -0.157257080078125, -0.15051651000976562, -0.14377593994140625, -0.13703536987304688, -0.1302947998046875, -0.12355422973632812, -0.11681365966796875, -0.11007308959960938, -0.10333251953125, -0.09659194946289062, -0.08985137939453125, -0.08311080932617188, -0.0763702392578125, -0.06962966918945312, -0.06288909912109375, -0.056148529052734375, -0.049407958984375, -0.042667388916015625, -0.03592681884765625, -0.029186248779296875, -0.0224456787109375, -0.015705108642578125, -0.00896453857421875, -0.002223968505859375, 0.0045166015625, 0.011257171630859375, 0.01799774169921875, 0.024738311767578125, 0.0314788818359375, 0.038219451904296875, 0.04496002197265625, 0.051700592041015625, 0.058441162109375, 0.06518173217773438, 0.07192230224609375, 0.07866287231445312, 0.0854034423828125, 0.09214401245117188, 0.09888458251953125, 0.10562515258789062, 0.11236572265625, 0.11910629272460938, 0.12584686279296875, 0.13258743286132812, 0.1393280029296875, 0.14606857299804688, 0.15280914306640625, 0.15954971313476562, 0.166290283203125, 0.17303085327148438, 0.17977142333984375, 0.18651199340820312, 0.1932525634765625, 0.19999313354492188, 0.20673370361328125, 0.21347427368164062, 0.22021484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 14.0, 14.0, 14.0, 15.0, 19.0, 27.0, 28.0, 20.0, 21.0, 36.0, 28.0, 43.0, 43.0, 39.0, 32.0, 41.0, 44.0, 1056.0, 42.0, 44.0, 40.0, 39.0, 33.0, 22.0, 27.0, 24.0, 33.0, 25.0, 20.0, 19.0, 22.0, 23.0, 11.0, 13.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0819091796875, -1.042724609375, -1.0035400390625, -0.96435546875, -0.9251708984375, -0.885986328125, -0.8468017578125, -0.8076171875, -0.7684326171875, -0.729248046875, -0.6900634765625, -0.65087890625, -0.6116943359375, -0.572509765625, -0.5333251953125, -0.494140625, -0.4549560546875, -0.415771484375, -0.3765869140625, -0.33740234375, -0.2982177734375, -0.259033203125, -0.2198486328125, -0.1806640625, -0.1414794921875, -0.102294921875, -0.0631103515625, -0.02392578125, 0.0152587890625, 0.054443359375, 0.0936279296875, 0.1328125, 0.1719970703125, 0.211181640625, 0.2503662109375, 0.28955078125, 0.3287353515625, 0.367919921875, 0.4071044921875, 0.4462890625, 0.4854736328125, 0.524658203125, 0.5638427734375, 0.60302734375, 0.6422119140625, 0.681396484375, 0.7205810546875, 0.759765625, 0.7989501953125, 0.838134765625, 0.8773193359375, 0.91650390625, 0.9556884765625, 0.994873046875, 1.0340576171875, 1.0732421875, 1.1124267578125, 1.151611328125, 1.1907958984375, 1.22998046875, 1.2691650390625, 1.308349609375, 1.3475341796875, 1.38671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 9.0, 11.0, 17.0, 22.0, 32.0, 49.0, 69.0, 95.0, 121.0, 203.0, 286.0, 427.0, 724.0, 1011.0, 1546.0, 2471.0, 3748.0, 5561.0, 8788.0, 13700.0, 25266.0, 83370.0, 1569257.0, 289506.0, 40619.0, 18312.0, 11341.0, 7154.0, 4605.0, 3029.0, 1947.0, 1313.0, 842.0, 525.0, 386.0, 256.0, 156.0, 111.0, 75.0, 48.0, 39.0, 25.0, 15.0, 13.0, 7.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.456298828125, -0.44193267822265625, -0.4275665283203125, -0.41320037841796875, -0.398834228515625, -0.38446807861328125, -0.3701019287109375, -0.35573577880859375, -0.34136962890625, -0.32700347900390625, -0.3126373291015625, -0.29827117919921875, -0.283905029296875, -0.26953887939453125, -0.2551727294921875, -0.24080657958984375, -0.2264404296875, -0.21207427978515625, -0.1977081298828125, -0.18334197998046875, -0.168975830078125, -0.15460968017578125, -0.1402435302734375, -0.12587738037109375, -0.11151123046875, -0.09714508056640625, -0.0827789306640625, -0.06841278076171875, -0.054046630859375, -0.03968048095703125, -0.0253143310546875, -0.01094818115234375, 0.00341796875, 0.01778411865234375, 0.0321502685546875, 0.04651641845703125, 0.060882568359375, 0.07524871826171875, 0.0896148681640625, 0.10398101806640625, 0.11834716796875, 0.13271331787109375, 0.1470794677734375, 0.16144561767578125, 0.175811767578125, 0.19017791748046875, 0.2045440673828125, 0.21891021728515625, 0.2332763671875, 0.24764251708984375, 0.2620086669921875, 0.27637481689453125, 0.290740966796875, 0.30510711669921875, 0.3194732666015625, 0.33383941650390625, 0.34820556640625, 0.36257171630859375, 0.3769378662109375, 0.39130401611328125, 0.405670166015625, 0.42003631591796875, 0.4344024658203125, 0.44876861572265625, 0.463134765625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 5.0, 4.0, 8.0, 5.0, 13.0, 8.0, 5.0, 12.0, 23.0, 17.0, 17.0, 22.0, 19.0, 26.0, 39.0, 31.0, 41.0, 56.0, 51.0, 49.0, 50.0, 50.0, 51.0, 45.0, 42.0, 41.0, 36.0, 44.0, 35.0, 20.0, 30.0, 12.0, 17.0, 14.0, 13.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0], "bins": [-0.0213775634765625, -0.02080690860748291, -0.02023625373840332, -0.01966559886932373, -0.01909494400024414, -0.01852428913116455, -0.01795363426208496, -0.01738297939300537, -0.01681232452392578, -0.01624166965484619, -0.0156710147857666, -0.015100359916687012, -0.014529705047607422, -0.013959050178527832, -0.013388395309448242, -0.012817740440368652, -0.012247085571289062, -0.011676430702209473, -0.011105775833129883, -0.010535120964050293, -0.009964466094970703, -0.009393811225891113, -0.008823156356811523, -0.008252501487731934, -0.007681846618652344, -0.007111191749572754, -0.006540536880493164, -0.005969882011413574, -0.005399227142333984, -0.0048285722732543945, -0.004257917404174805, -0.003687262535095215, -0.003116607666015625, -0.002545952796936035, -0.0019752979278564453, -0.0014046430587768555, -0.0008339881896972656, -0.0002633333206176758, 0.00030732154846191406, 0.0008779764175415039, 0.0014486312866210938, 0.0020192861557006836, 0.0025899410247802734, 0.0031605958938598633, 0.003731250762939453, 0.004301905632019043, 0.004872560501098633, 0.005443215370178223, 0.0060138702392578125, 0.006584525108337402, 0.007155179977416992, 0.007725834846496582, 0.008296489715576172, 0.008867144584655762, 0.009437799453735352, 0.010008454322814941, 0.010579109191894531, 0.011149764060974121, 0.011720418930053711, 0.0122910737991333, 0.01286172866821289, 0.01343238353729248, 0.01400303840637207, 0.01457369327545166, 0.01514434814453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 10.0, 12.0, 13.0, 16.0, 24.0, 24.0, 32.0, 38.0, 65.0, 84.0, 98.0, 158.0, 241.0, 461.0, 1720.0, 60969.0, 954081.0, 28185.0, 1148.0, 405.0, 230.0, 133.0, 84.0, 66.0, 55.0, 34.0, 26.0, 27.0, 22.0, 15.0, 18.0, 3.0, 6.0, 5.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3455085754394531, -0.33335113525390625, -0.3211936950683594, -0.3090362548828125, -0.2968788146972656, -0.28472137451171875, -0.2725639343261719, -0.260406494140625, -0.24824905395507812, -0.23609161376953125, -0.22393417358398438, -0.2117767333984375, -0.19961929321289062, -0.18746185302734375, -0.17530441284179688, -0.16314697265625, -0.15098953247070312, -0.13883209228515625, -0.12667465209960938, -0.1145172119140625, -0.10235977172851562, -0.09020233154296875, -0.07804489135742188, -0.065887451171875, -0.053730010986328125, -0.04157257080078125, -0.029415130615234375, -0.0172576904296875, -0.005100250244140625, 0.00705718994140625, 0.019214630126953125, 0.0313720703125, 0.043529510498046875, 0.05568695068359375, 0.06784439086914062, 0.0800018310546875, 0.09215927124023438, 0.10431671142578125, 0.11647415161132812, 0.128631591796875, 0.14078903198242188, 0.15294647216796875, 0.16510391235351562, 0.1772613525390625, 0.18941879272460938, 0.20157623291015625, 0.21373367309570312, 0.22589111328125, 0.23804855346679688, 0.25020599365234375, 0.2623634338378906, 0.2745208740234375, 0.2866783142089844, 0.29883575439453125, 0.3109931945800781, 0.323150634765625, 0.3353080749511719, 0.34746551513671875, 0.3596229553222656, 0.3717803955078125, 0.3839378356933594, 0.39609527587890625, 0.4082527160644531, 0.42041015625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 23.0, 82.0, 164.0, 297.0, 271.0, 110.0, 43.0, 12.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1401641070842743, -0.13740800321102142, -0.13465189933776855, -0.13189579546451569, -0.12913969159126282, -0.12638358771800995, -0.12362748384475708, -0.12087137997150421, -0.11811527609825134, -0.11535917222499847, -0.1126030683517456, -0.10984696447849274, -0.10709086060523987, -0.104334756731987, -0.10157865285873413, -0.09882254898548126, -0.0960664451122284, -0.09331034123897552, -0.09055423736572266, -0.08779813349246979, -0.08504202961921692, -0.08228592574596405, -0.07952982187271118, -0.07677371799945831, -0.07401761412620544, -0.07126151025295258, -0.06850540637969971, -0.06574930250644684, -0.06299319863319397, -0.0602370947599411, -0.05748099088668823, -0.054724887013435364, -0.05196879059076309, -0.04921268671751022, -0.046456582844257355, -0.043700478971004486, -0.04094437509775162, -0.03818827122449875, -0.03543216735124588, -0.03267606347799301, -0.029919959604740143, -0.027163855731487274, -0.024407751858234406, -0.021651647984981537, -0.018895544111728668, -0.0161394402384758, -0.013383336365222931, -0.010627232491970062, -0.007871128618717194, -0.005115024745464325, -0.0023589208722114563, 0.00039718300104141235, 0.003153286874294281, 0.00590939074754715, 0.008665494620800018, 0.011421598494052887, 0.014177702367305756, 0.016933806240558624, 0.019689910113811493, 0.02244601398706436, 0.02520211786031723, 0.0279582217335701, 0.030714325606822968, 0.033470429480075836, 0.036226533353328705]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 13.0, 11.0, 17.0, 15.0, 12.0, 15.0, 18.0, 27.0, 18.0, 27.0, 25.0, 44.0, 28.0, 34.0, 23.0, 24.0, 28.0, 25.0, 51.0, 38.0, 47.0, 40.0, 47.0, 30.0, 42.0, 35.0, 18.0, 28.0, 21.0, 35.0, 20.0, 15.0, 18.0, 18.0, 10.0, 11.0, 8.0, 12.0, 2.0, 6.0, 9.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019772648811340332, -0.01914995163679123, -0.018527252599596977, -0.017904553562402725, -0.017281856387853622, -0.01665915921330452, -0.016036460176110268, -0.01541376207023859, -0.014791063964366913, -0.014168365858495235, -0.013545667752623558, -0.01292296964675188, -0.012300271540880203, -0.011677573435008526, -0.011054875329136848, -0.010432177223265171, -0.009809479117393494, -0.009186781011521816, -0.008564082905650139, -0.007941384799778461, -0.007318686693906784, -0.006695988588035107, -0.006073290482163429, -0.005450592376291752, -0.0048278942704200745, -0.004205196164548397, -0.0035824980586767197, -0.0029597999528050423, -0.002337101846933365, -0.0017144037410616875, -0.00109170563519001, -0.00046900752931833267, 0.00015369057655334473, 0.0007763886824250221, 0.0013990867882966995, 0.002021784894168377, 0.0026444830000400543, 0.0032671811059117317, 0.003889879211783409, 0.0045125773176550865, 0.005135275423526764, 0.005757973529398441, 0.006380671635270119, 0.007003369741141796, 0.0076260678470134735, 0.008248765952885151, 0.008871464058756828, 0.009494162164628506, 0.010116860270500183, 0.01073955837637186, 0.011362256482243538, 0.011984954588115215, 0.012607652693986893, 0.01323035079985857, 0.013853048905730247, 0.014475747011601925, 0.015098445117473602, 0.015721142292022705, 0.016343841329216957, 0.01696654036641121, 0.017589237540960312, 0.018211934715509415, 0.018834633752703667, 0.01945733278989792, 0.02008002996444702]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 4.0, 5.0, 9.0, 16.0, 19.0, 23.0, 24.0, 27.0, 17.0, 36.0, 28.0, 41.0, 52.0, 30.0, 42.0, 53.0, 61.0, 45.0, 45.0, 45.0, 46.0, 29.0, 41.0, 27.0, 29.0, 23.0, 34.0, 35.0, 24.0, 16.0, 19.0, 12.0, 11.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03826904296875, -1.9710693359375, -1.90386962890625, -1.836669921875, -1.76947021484375, -1.7022705078125, -1.63507080078125, -1.56787109375, -1.50067138671875, -1.4334716796875, -1.36627197265625, -1.299072265625, -1.23187255859375, -1.1646728515625, -1.09747314453125, -1.0302734375, -0.96307373046875, -0.8958740234375, -0.82867431640625, -0.761474609375, -0.69427490234375, -0.6270751953125, -0.55987548828125, -0.49267578125, -0.42547607421875, -0.3582763671875, -0.29107666015625, -0.223876953125, -0.15667724609375, -0.0894775390625, -0.02227783203125, 0.044921875, 0.11212158203125, 0.1793212890625, 0.24652099609375, 0.313720703125, 0.38092041015625, 0.4481201171875, 0.51531982421875, 0.58251953125, 0.64971923828125, 0.7169189453125, 0.78411865234375, 0.851318359375, 0.91851806640625, 0.9857177734375, 1.05291748046875, 1.1201171875, 1.18731689453125, 1.2545166015625, 1.32171630859375, 1.388916015625, 1.45611572265625, 1.5233154296875, 1.59051513671875, 1.65771484375, 1.72491455078125, 1.7921142578125, 1.85931396484375, 1.926513671875, 1.99371337890625, 2.0609130859375, 2.12811279296875, 2.1953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 12.0, 21.0, 27.0, 45.0, 56.0, 82.0, 137.0, 181.0, 231.0, 353.0, 500.0, 806.0, 1147.0, 1754.0, 2760.0, 4396.0, 7277.0, 12211.0, 21839.0, 41930.0, 96429.0, 272927.0, 345207.0, 124591.0, 51265.0, 25668.0, 14284.0, 8279.0, 5070.0, 3056.0, 1925.0, 1376.0, 851.0, 534.0, 419.0, 271.0, 189.0, 129.0, 82.0, 65.0, 43.0, 41.0, 18.0, 20.0, 13.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.058258056640625, -1.98760986328125, -1.916961669921875, -1.8463134765625, -1.775665283203125, -1.70501708984375, -1.634368896484375, -1.563720703125, -1.493072509765625, -1.42242431640625, -1.351776123046875, -1.2811279296875, -1.210479736328125, -1.13983154296875, -1.069183349609375, -0.99853515625, -0.927886962890625, -0.85723876953125, -0.786590576171875, -0.7159423828125, -0.645294189453125, -0.57464599609375, -0.503997802734375, -0.433349609375, -0.362701416015625, -0.29205322265625, -0.221405029296875, -0.1507568359375, -0.080108642578125, -0.00946044921875, 0.061187744140625, 0.1318359375, 0.202484130859375, 0.27313232421875, 0.343780517578125, 0.4144287109375, 0.485076904296875, 0.55572509765625, 0.626373291015625, 0.697021484375, 0.767669677734375, 0.83831787109375, 0.908966064453125, 0.9796142578125, 1.050262451171875, 1.12091064453125, 1.191558837890625, 1.26220703125, 1.332855224609375, 1.40350341796875, 1.474151611328125, 1.5447998046875, 1.615447998046875, 1.68609619140625, 1.756744384765625, 1.827392578125, 1.898040771484375, 1.96868896484375, 2.039337158203125, 2.1099853515625, 2.180633544921875, 2.25128173828125, 2.321929931640625, 2.392578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 13.0, 13.0, 10.0, 21.0, 17.0, 23.0, 21.0, 27.0, 36.0, 28.0, 41.0, 36.0, 68.0, 62.0, 135.0, 271.0, 1451.0, 221.0, 119.0, 57.0, 51.0, 19.0, 43.0, 33.0, 22.0, 32.0, 23.0, 24.0, 20.0, 10.0, 13.0, 11.0, 12.0, 4.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.9716796875, -3.826171875, -3.6806640625, -3.53515625, -3.3896484375, -3.244140625, -3.0986328125, -2.953125, -2.8076171875, -2.662109375, -2.5166015625, -2.37109375, -2.2255859375, -2.080078125, -1.9345703125, -1.7890625, -1.6435546875, -1.498046875, -1.3525390625, -1.20703125, -1.0615234375, -0.916015625, -0.7705078125, -0.625, -0.4794921875, -0.333984375, -0.1884765625, -0.04296875, 0.1025390625, 0.248046875, 0.3935546875, 0.5390625, 0.6845703125, 0.830078125, 0.9755859375, 1.12109375, 1.2666015625, 1.412109375, 1.5576171875, 1.703125, 1.8486328125, 1.994140625, 2.1396484375, 2.28515625, 2.4306640625, 2.576171875, 2.7216796875, 2.8671875, 3.0126953125, 3.158203125, 3.3037109375, 3.44921875, 3.5947265625, 3.740234375, 3.8857421875, 4.03125, 4.1767578125, 4.322265625, 4.4677734375, 4.61328125, 4.7587890625, 4.904296875, 5.0498046875, 5.1953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 20.0, 7.0, 20.0, 26.0, 37.0, 59.0, 66.0, 99.0, 150.0, 204.0, 449.0, 1076.0, 3644.0, 18637.0, 184267.0, 2775068.0, 140706.0, 15777.0, 3280.0, 971.0, 406.0, 228.0, 135.0, 97.0, 72.0, 53.0, 33.0, 29.0, 24.0, 9.0, 11.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.82684326171875, -5.6146240234375, -5.40240478515625, -5.190185546875, -4.97796630859375, -4.7657470703125, -4.55352783203125, -4.34130859375, -4.12908935546875, -3.9168701171875, -3.70465087890625, -3.492431640625, -3.28021240234375, -3.0679931640625, -2.85577392578125, -2.6435546875, -2.43133544921875, -2.2191162109375, -2.00689697265625, -1.794677734375, -1.58245849609375, -1.3702392578125, -1.15802001953125, -0.94580078125, -0.73358154296875, -0.5213623046875, -0.30914306640625, -0.096923828125, 0.11529541015625, 0.3275146484375, 0.53973388671875, 0.751953125, 0.96417236328125, 1.1763916015625, 1.38861083984375, 1.600830078125, 1.81304931640625, 2.0252685546875, 2.23748779296875, 2.44970703125, 2.66192626953125, 2.8741455078125, 3.08636474609375, 3.298583984375, 3.51080322265625, 3.7230224609375, 3.93524169921875, 4.1474609375, 4.35968017578125, 4.5718994140625, 4.78411865234375, 4.996337890625, 5.20855712890625, 5.4207763671875, 5.63299560546875, 5.84521484375, 6.05743408203125, 6.2696533203125, 6.48187255859375, 6.694091796875, 6.90631103515625, 7.1185302734375, 7.33074951171875, 7.54296875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 36.0, 72.0, 164.0, 222.0, 209.0, 150.0, 96.0, 29.0, 17.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.279764175415039, -5.797384738922119, -5.315005302429199, -4.832625865936279, -4.350246429443359, -3.8678667545318604, -3.3854873180389404, -2.9031078815460205, -2.4207284450531006, -1.9383490085601807, -1.4559695720672607, -0.9735900163650513, -0.49121057987213135, -0.008831024169921875, 0.47354841232299805, 0.955927848815918, 1.438307285308838, 1.9206867218017578, 2.4030661582946777, 2.8854455947875977, 3.3678250312805176, 3.8502047061920166, 4.332584381103516, 4.814963340759277, 5.2973432540893555, 5.779722690582275, 6.262102127075195, 6.744481563568115, 7.226861000061035, 7.709240913391113, 8.191619873046875, 8.673999786376953, 9.156378746032715, 9.638758659362793, 10.121137619018555, 10.603517532348633, 11.085896492004395, 11.568276405334473, 12.050655364990234, 12.533035278320312, 13.015414237976074, 13.497794151306152, 13.980173110961914, 14.462553024291992, 14.944931983947754, 15.427311897277832, 15.909690856933594, 16.392070770263672, 16.87445068359375, 17.356830596923828, 17.839210510253906, 18.32158851623535, 18.80396842956543, 19.286348342895508, 19.768728256225586, 20.25110626220703, 20.73348617553711, 21.215866088867188, 21.698246002197266, 22.18062400817871, 22.66300392150879, 23.145383834838867, 23.627763748168945, 24.11014175415039, 24.59252166748047]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 14.0, 18.0, 9.0, 14.0, 17.0, 20.0, 25.0, 19.0, 33.0, 24.0, 32.0, 32.0, 43.0, 30.0, 43.0, 39.0, 49.0, 51.0, 53.0, 47.0, 47.0, 53.0, 21.0, 33.0, 25.0, 42.0, 25.0, 15.0, 23.0, 16.0, 15.0, 10.0, 8.0, 18.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.374507904052734, -10.02049446105957, -9.666481018066406, -9.312467575073242, -8.958453178405762, -8.604439735412598, -8.250426292419434, -7.8964128494262695, -7.542398929595947, -7.188385486602783, -6.834371566772461, -6.480358123779297, -6.126344680786133, -5.7723307609558105, -5.4183173179626465, -5.064303398132324, -4.71028995513916, -4.356276512145996, -4.002262592315674, -3.6482491493225098, -3.2942354679107666, -2.9402217864990234, -2.5862083435058594, -2.232194662094116, -1.878180980682373, -1.5241672992706299, -1.1701537370681763, -0.8161401748657227, -0.4621264934539795, -0.10811281204223633, 0.24590063095092773, 0.5999143123626709, 0.9539289474487305, 1.3079426288604736, 1.6619561910629272, 2.015969753265381, 2.369983434677124, 2.723997116088867, 3.0780105590820312, 3.4320242404937744, 3.7860379219055176, 4.140051364898682, 4.494065284729004, 4.848078727722168, 5.202092170715332, 5.556106090545654, 5.910119533538818, 6.264133453369141, 6.618146896362305, 6.972160339355469, 7.326174259185791, 7.680187702178955, 8.034201622009277, 8.388215065002441, 8.742228507995605, 9.09624195098877, 9.45025634765625, 9.804269790649414, 10.158283233642578, 10.512296676635742, 10.866311073303223, 11.220324516296387, 11.57433795928955, 11.928351402282715, 12.282364845275879]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 9.0, 12.0, 10.0, 18.0, 14.0, 27.0, 20.0, 24.0, 23.0, 34.0, 30.0, 45.0, 45.0, 34.0, 51.0, 45.0, 42.0, 37.0, 45.0, 50.0, 41.0, 41.0, 32.0, 28.0, 36.0, 35.0, 19.0, 22.0, 18.0, 23.0, 17.0, 24.0, 10.0, 9.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7138671875, -1.6490325927734375, -1.584197998046875, -1.5193634033203125, -1.45452880859375, -1.3896942138671875, -1.324859619140625, -1.2600250244140625, -1.1951904296875, -1.1303558349609375, -1.065521240234375, -1.0006866455078125, -0.93585205078125, -0.8710174560546875, -0.806182861328125, -0.7413482666015625, -0.676513671875, -0.6116790771484375, -0.546844482421875, -0.4820098876953125, -0.41717529296875, -0.3523406982421875, -0.287506103515625, -0.2226715087890625, -0.1578369140625, -0.0930023193359375, -0.028167724609375, 0.0366668701171875, 0.10150146484375, 0.1663360595703125, 0.231170654296875, 0.2960052490234375, 0.36083984375, 0.4256744384765625, 0.490509033203125, 0.5553436279296875, 0.62017822265625, 0.6850128173828125, 0.749847412109375, 0.8146820068359375, 0.8795166015625, 0.9443511962890625, 1.009185791015625, 1.0740203857421875, 1.13885498046875, 1.2036895751953125, 1.268524169921875, 1.3333587646484375, 1.398193359375, 1.4630279541015625, 1.527862548828125, 1.5926971435546875, 1.65753173828125, 1.7223663330078125, 1.787200927734375, 1.8520355224609375, 1.9168701171875, 1.9817047119140625, 2.046539306640625, 2.1113739013671875, 2.17620849609375, 2.2410430908203125, 2.305877685546875, 2.3707122802734375, 2.435546875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 12.0, 8.0, 9.0, 9.0, 13.0, 9.0, 21.0, 39.0, 46.0, 40.0, 54.0, 82.0, 127.0, 152.0, 180.0, 323.0, 553.0, 1746.0, 19588.0, 4005665.0, 159571.0, 3911.0, 844.0, 376.0, 218.0, 157.0, 144.0, 91.0, 57.0, 50.0, 52.0, 36.0, 15.0, 15.0, 15.0, 10.0, 8.0, 9.0, 14.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.722412109375, -15.21044921875, -14.698486328125, -14.1865234375, -13.674560546875, -13.16259765625, -12.650634765625, -12.138671875, -11.626708984375, -11.11474609375, -10.602783203125, -10.0908203125, -9.578857421875, -9.06689453125, -8.554931640625, -8.04296875, -7.531005859375, -7.01904296875, -6.507080078125, -5.9951171875, -5.483154296875, -4.97119140625, -4.459228515625, -3.947265625, -3.435302734375, -2.92333984375, -2.411376953125, -1.8994140625, -1.387451171875, -0.87548828125, -0.363525390625, 0.1484375, 0.660400390625, 1.17236328125, 1.684326171875, 2.1962890625, 2.708251953125, 3.22021484375, 3.732177734375, 4.244140625, 4.756103515625, 5.26806640625, 5.780029296875, 6.2919921875, 6.803955078125, 7.31591796875, 7.827880859375, 8.33984375, 8.851806640625, 9.36376953125, 9.875732421875, 10.3876953125, 10.899658203125, 11.41162109375, 11.923583984375, 12.435546875, 12.947509765625, 13.45947265625, 13.971435546875, 14.4833984375, 14.995361328125, 15.50732421875, 16.019287109375, 16.53125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 22.0, 30.0, 36.0, 36.0, 63.0, 83.0, 118.0, 176.0, 269.0, 379.0, 515.0, 590.0, 468.0, 350.0, 241.0, 152.0, 95.0, 98.0, 80.0, 38.0, 44.0, 28.0, 22.0, 19.0, 15.0, 12.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.67578125, -2.593048095703125, -2.51031494140625, -2.427581787109375, -2.3448486328125, -2.262115478515625, -2.17938232421875, -2.096649169921875, -2.013916015625, -1.931182861328125, -1.84844970703125, -1.765716552734375, -1.6829833984375, -1.600250244140625, -1.51751708984375, -1.434783935546875, -1.35205078125, -1.269317626953125, -1.18658447265625, -1.103851318359375, -1.0211181640625, -0.938385009765625, -0.85565185546875, -0.772918701171875, -0.690185546875, -0.607452392578125, -0.52471923828125, -0.441986083984375, -0.3592529296875, -0.276519775390625, -0.19378662109375, -0.111053466796875, -0.0283203125, 0.054412841796875, 0.13714599609375, 0.219879150390625, 0.3026123046875, 0.385345458984375, 0.46807861328125, 0.550811767578125, 0.633544921875, 0.716278076171875, 0.79901123046875, 0.881744384765625, 0.9644775390625, 1.047210693359375, 1.12994384765625, 1.212677001953125, 1.29541015625, 1.378143310546875, 1.46087646484375, 1.543609619140625, 1.6263427734375, 1.709075927734375, 1.79180908203125, 1.874542236328125, 1.957275390625, 2.040008544921875, 2.12274169921875, 2.205474853515625, 2.2882080078125, 2.370941162109375, 2.45367431640625, 2.536407470703125, 2.619140625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 11.0, 8.0, 18.0, 25.0, 28.0, 44.0, 47.0, 84.0, 157.0, 303.0, 845.0, 2884.0, 17314.0, 235744.0, 3741221.0, 176995.0, 14580.0, 2565.0, 702.0, 276.0, 154.0, 81.0, 40.0, 30.0, 24.0, 17.0, 17.0, 10.0, 3.0, 10.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1875, -7.8997802734375, -7.612060546875, -7.3243408203125, -7.03662109375, -6.7489013671875, -6.461181640625, -6.1734619140625, -5.8857421875, -5.5980224609375, -5.310302734375, -5.0225830078125, -4.73486328125, -4.4471435546875, -4.159423828125, -3.8717041015625, -3.583984375, -3.2962646484375, -3.008544921875, -2.7208251953125, -2.43310546875, -2.1453857421875, -1.857666015625, -1.5699462890625, -1.2822265625, -0.9945068359375, -0.706787109375, -0.4190673828125, -0.13134765625, 0.1563720703125, 0.444091796875, 0.7318115234375, 1.01953125, 1.3072509765625, 1.594970703125, 1.8826904296875, 2.17041015625, 2.4581298828125, 2.745849609375, 3.0335693359375, 3.3212890625, 3.6090087890625, 3.896728515625, 4.1844482421875, 4.47216796875, 4.7598876953125, 5.047607421875, 5.3353271484375, 5.623046875, 5.9107666015625, 6.198486328125, 6.4862060546875, 6.77392578125, 7.0616455078125, 7.349365234375, 7.6370849609375, 7.9248046875, 8.2125244140625, 8.500244140625, 8.7879638671875, 9.07568359375, 9.3634033203125, 9.651123046875, 9.9388427734375, 10.2265625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 44.0, 168.0, 387.0, 292.0, 99.0, 19.0, 3.0, 2.0, 2.0, 1.0], "bins": [-71.2143325805664, -69.9607162475586, -68.70709991455078, -67.45347595214844, -66.19985961914062, -64.94624328613281, -63.692626953125, -62.43901062011719, -61.18539047241211, -59.9317741394043, -58.67815399169922, -57.424537658691406, -56.170921325683594, -54.917301177978516, -53.6636848449707, -52.410064697265625, -51.15644836425781, -49.90283203125, -48.64921188354492, -47.39559555053711, -46.14197540283203, -44.88835906982422, -43.634742736816406, -42.381126403808594, -41.127506256103516, -39.8738899230957, -38.620269775390625, -37.36665344238281, -36.113037109375, -34.85941696166992, -33.60580062866211, -32.35218048095703, -31.098560333251953, -29.844942092895508, -28.591323852539062, -27.33770751953125, -26.084089279174805, -24.83047103881836, -23.576854705810547, -22.3232364654541, -21.069618225097656, -19.81599998474121, -18.562381744384766, -17.308765411376953, -16.055147171020508, -14.801528930664062, -13.547911643981934, -12.294294357299805, -11.040677070617676, -9.787059783935547, -8.533441543579102, -7.2798237800598145, -6.026206016540527, -4.77258825302124, -3.518970489501953, -2.265353202819824, -1.011734962463379, 0.2418828010559082, 1.4955005645751953, 2.7491183280944824, 4.0027360916137695, 5.256353855133057, 6.509971618652344, 7.763588905334473, 9.017207145690918]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 1.0, 9.0, 10.0, 12.0, 12.0, 14.0, 20.0, 15.0, 20.0, 18.0, 16.0, 29.0, 20.0, 32.0, 38.0, 43.0, 29.0, 36.0, 34.0, 38.0, 42.0, 43.0, 39.0, 38.0, 38.0, 48.0, 39.0, 22.0, 33.0, 33.0, 18.0, 19.0, 20.0, 18.0, 16.0, 15.0, 11.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.180791854858398, -7.923776149749756, -7.666760444641113, -7.4097442626953125, -7.15272855758667, -6.895712852478027, -6.638696670532227, -6.381680965423584, -6.124665260314941, -5.867649555206299, -5.610633850097656, -5.3536176681518555, -5.096601963043213, -4.83958625793457, -4.5825700759887695, -4.325554370880127, -4.068538665771484, -3.811522960662842, -3.55450701713562, -3.2974910736083984, -3.040475368499756, -2.7834596633911133, -2.5264437198638916, -2.26942777633667, -2.0124120712280273, -1.7553962469100952, -1.498380422592163, -1.241364598274231, -0.9843487739562988, -0.7273329496383667, -0.47031712532043457, -0.21330130100250244, 0.043715476989746094, 0.3007313013076782, 0.5577471256256104, 0.8147629499435425, 1.0717787742614746, 1.3287945985794067, 1.5858104228973389, 1.842826247215271, 2.099842071533203, 2.3568577766418457, 2.6138737201690674, 2.870889663696289, 3.1279053688049316, 3.384921073913574, 3.641937017440796, 3.8989529609680176, 4.15596866607666, 4.412984371185303, 4.670000076293945, 4.927016258239746, 5.184031963348389, 5.441047668457031, 5.698063850402832, 5.955079555511475, 6.212095260620117, 6.46911096572876, 6.726126670837402, 6.983142852783203, 7.240158557891846, 7.497174263000488, 7.754190444946289, 8.011205673217773, 8.268221855163574]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 10.0, 6.0, 8.0, 8.0, 11.0, 13.0, 10.0, 17.0, 15.0, 18.0, 22.0, 27.0, 17.0, 35.0, 36.0, 40.0, 47.0, 39.0, 33.0, 42.0, 40.0, 34.0, 38.0, 40.0, 33.0, 39.0, 36.0, 26.0, 34.0, 33.0, 33.0, 21.0, 22.0, 21.0, 14.0, 15.0, 10.0, 13.0, 12.0, 5.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6953125, -1.63916015625, -1.5830078125, -1.52685546875, -1.470703125, -1.41455078125, -1.3583984375, -1.30224609375, -1.24609375, -1.18994140625, -1.1337890625, -1.07763671875, -1.021484375, -0.96533203125, -0.9091796875, -0.85302734375, -0.796875, -0.74072265625, -0.6845703125, -0.62841796875, -0.572265625, -0.51611328125, -0.4599609375, -0.40380859375, -0.34765625, -0.29150390625, -0.2353515625, -0.17919921875, -0.123046875, -0.06689453125, -0.0107421875, 0.04541015625, 0.1015625, 0.15771484375, 0.2138671875, 0.27001953125, 0.326171875, 0.38232421875, 0.4384765625, 0.49462890625, 0.55078125, 0.60693359375, 0.6630859375, 0.71923828125, 0.775390625, 0.83154296875, 0.8876953125, 0.94384765625, 1.0, 1.05615234375, 1.1123046875, 1.16845703125, 1.224609375, 1.28076171875, 1.3369140625, 1.39306640625, 1.44921875, 1.50537109375, 1.5615234375, 1.61767578125, 1.673828125, 1.72998046875, 1.7861328125, 1.84228515625, 1.8984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 15.0, 14.0, 15.0, 16.0, 37.0, 50.0, 102.0, 140.0, 239.0, 412.0, 710.0, 1226.0, 2179.0, 3872.0, 6614.0, 11598.0, 20478.0, 34676.0, 57610.0, 91483.0, 134014.0, 167119.0, 165496.0, 129514.0, 87857.0, 54776.0, 33001.0, 19265.0, 11164.0, 6359.0, 3622.0, 2032.0, 1191.0, 654.0, 408.0, 208.0, 142.0, 78.0, 62.0, 40.0, 29.0, 16.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31884765625, -0.308868408203125, -0.29888916015625, -0.288909912109375, -0.2789306640625, -0.268951416015625, -0.25897216796875, -0.248992919921875, -0.239013671875, -0.229034423828125, -0.21905517578125, -0.209075927734375, -0.1990966796875, -0.189117431640625, -0.17913818359375, -0.169158935546875, -0.1591796875, -0.149200439453125, -0.13922119140625, -0.129241943359375, -0.1192626953125, -0.109283447265625, -0.09930419921875, -0.089324951171875, -0.079345703125, -0.069366455078125, -0.05938720703125, -0.049407958984375, -0.0394287109375, -0.029449462890625, -0.01947021484375, -0.009490966796875, 0.00048828125, 0.010467529296875, 0.02044677734375, 0.030426025390625, 0.0404052734375, 0.050384521484375, 0.06036376953125, 0.070343017578125, 0.080322265625, 0.090301513671875, 0.10028076171875, 0.110260009765625, 0.1202392578125, 0.130218505859375, 0.14019775390625, 0.150177001953125, 0.16015625, 0.170135498046875, 0.18011474609375, 0.190093994140625, 0.2000732421875, 0.210052490234375, 0.22003173828125, 0.230010986328125, 0.239990234375, 0.249969482421875, 0.25994873046875, 0.269927978515625, 0.2799072265625, 0.289886474609375, 0.29986572265625, 0.309844970703125, 0.31982421875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 3.0, 12.0, 11.0, 13.0, 10.0, 26.0, 11.0, 21.0, 21.0, 23.0, 24.0, 27.0, 33.0, 37.0, 48.0, 35.0, 36.0, 29.0, 28.0, 1065.0, 40.0, 48.0, 34.0, 33.0, 48.0, 34.0, 29.0, 38.0, 22.0, 23.0, 20.0, 24.0, 21.0, 15.0, 12.0, 10.0, 8.0, 13.0, 11.0, 5.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1340789794921875, -1.092376708984375, -1.0506744384765625, -1.00897216796875, -0.9672698974609375, -0.925567626953125, -0.8838653564453125, -0.8421630859375, -0.8004608154296875, -0.758758544921875, -0.7170562744140625, -0.67535400390625, -0.6336517333984375, -0.591949462890625, -0.5502471923828125, -0.508544921875, -0.4668426513671875, -0.425140380859375, -0.3834381103515625, -0.34173583984375, -0.3000335693359375, -0.258331298828125, -0.2166290283203125, -0.1749267578125, -0.1332244873046875, -0.091522216796875, -0.0498199462890625, -0.00811767578125, 0.0335845947265625, 0.075286865234375, 0.1169891357421875, 0.15869140625, 0.2003936767578125, 0.242095947265625, 0.2837982177734375, 0.32550048828125, 0.3672027587890625, 0.408905029296875, 0.4506072998046875, 0.4923095703125, 0.5340118408203125, 0.575714111328125, 0.6174163818359375, 0.65911865234375, 0.7008209228515625, 0.742523193359375, 0.7842254638671875, 0.825927734375, 0.8676300048828125, 0.909332275390625, 0.9510345458984375, 0.99273681640625, 1.0344390869140625, 1.076141357421875, 1.1178436279296875, 1.1595458984375, 1.2012481689453125, 1.242950439453125, 1.2846527099609375, 1.32635498046875, 1.3680572509765625, 1.409759521484375, 1.4514617919921875, 1.4931640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 17.0, 35.0, 51.0, 60.0, 87.0, 154.0, 226.0, 342.0, 506.0, 838.0, 1380.0, 2147.0, 3374.0, 5335.0, 8353.0, 14008.0, 25531.0, 87401.0, 1633316.0, 232183.0, 36462.0, 17476.0, 10260.0, 6375.0, 4038.0, 2518.0, 1636.0, 1108.0, 679.0, 424.0, 285.0, 162.0, 109.0, 80.0, 46.0, 29.0, 16.0, 17.0, 13.0, 9.0, 11.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5643043518066406, -0.5480422973632812, -0.5317802429199219, -0.5155181884765625, -0.4992561340332031, -0.48299407958984375, -0.4667320251464844, -0.450469970703125, -0.4342079162597656, -0.41794586181640625, -0.4016838073730469, -0.3854217529296875, -0.3691596984863281, -0.35289764404296875, -0.3366355895996094, -0.32037353515625, -0.3041114807128906, -0.28784942626953125, -0.2715873718261719, -0.2553253173828125, -0.23906326293945312, -0.22280120849609375, -0.20653915405273438, -0.190277099609375, -0.17401504516601562, -0.15775299072265625, -0.14149093627929688, -0.1252288818359375, -0.10896682739257812, -0.09270477294921875, -0.07644271850585938, -0.0601806640625, -0.043918609619140625, -0.02765655517578125, -0.011394500732421875, 0.0048675537109375, 0.021129608154296875, 0.03739166259765625, 0.053653717041015625, 0.069915771484375, 0.08617782592773438, 0.10243988037109375, 0.11870193481445312, 0.1349639892578125, 0.15122604370117188, 0.16748809814453125, 0.18375015258789062, 0.20001220703125, 0.21627426147460938, 0.23253631591796875, 0.24879837036132812, 0.2650604248046875, 0.2813224792480469, 0.29758453369140625, 0.3138465881347656, 0.330108642578125, 0.3463706970214844, 0.36263275146484375, 0.3788948059082031, 0.3951568603515625, 0.4114189147949219, 0.42768096923828125, 0.4439430236816406, 0.460205078125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 14.0, 12.0, 34.0, 28.0, 49.0, 38.0, 47.0, 46.0, 61.0, 58.0, 65.0, 69.0, 67.0, 78.0, 39.0, 35.0, 35.0, 39.0, 32.0, 25.0, 11.0, 15.0, 11.0, 7.0, 14.0, 8.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.028961181640625, -0.028029441833496094, -0.027097702026367188, -0.02616596221923828, -0.025234222412109375, -0.02430248260498047, -0.023370742797851562, -0.022439002990722656, -0.02150726318359375, -0.020575523376464844, -0.019643783569335938, -0.01871204376220703, -0.017780303955078125, -0.01684856414794922, -0.015916824340820312, -0.014985084533691406, -0.0140533447265625, -0.013121604919433594, -0.012189865112304688, -0.011258125305175781, -0.010326385498046875, -0.009394645690917969, -0.008462905883789062, -0.007531166076660156, -0.00659942626953125, -0.005667686462402344, -0.0047359466552734375, -0.0038042068481445312, -0.002872467041015625, -0.0019407272338867188, -0.0010089874267578125, -7.724761962890625e-05, 0.0008544921875, 0.0017862319946289062, 0.0027179718017578125, 0.0036497116088867188, 0.004581451416015625, 0.005513191223144531, 0.0064449310302734375, 0.007376670837402344, 0.00830841064453125, 0.009240150451660156, 0.010171890258789062, 0.011103630065917969, 0.012035369873046875, 0.012967109680175781, 0.013898849487304688, 0.014830589294433594, 0.0157623291015625, 0.016694068908691406, 0.017625808715820312, 0.01855754852294922, 0.019489288330078125, 0.02042102813720703, 0.021352767944335938, 0.022284507751464844, 0.02321624755859375, 0.024147987365722656, 0.025079727172851562, 0.02601146697998047, 0.026943206787109375, 0.02787494659423828, 0.028806686401367188, 0.029738426208496094, 0.030670166015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 8.0, 6.0, 14.0, 16.0, 13.0, 21.0, 36.0, 59.0, 69.0, 85.0, 155.0, 290.0, 621.0, 3695.0, 975981.0, 65268.0, 1219.0, 369.0, 219.0, 118.0, 85.0, 61.0, 42.0, 25.0, 22.0, 7.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7216796875, -0.7003021240234375, -0.678924560546875, -0.6575469970703125, -0.63616943359375, -0.6147918701171875, -0.593414306640625, -0.5720367431640625, -0.5506591796875, -0.5292816162109375, -0.507904052734375, -0.4865264892578125, -0.46514892578125, -0.4437713623046875, -0.422393798828125, -0.4010162353515625, -0.379638671875, -0.3582611083984375, -0.336883544921875, -0.3155059814453125, -0.29412841796875, -0.2727508544921875, -0.251373291015625, -0.2299957275390625, -0.2086181640625, -0.1872406005859375, -0.165863037109375, -0.1444854736328125, -0.12310791015625, -0.1017303466796875, -0.080352783203125, -0.0589752197265625, -0.03759765625, -0.0162200927734375, 0.005157470703125, 0.0265350341796875, 0.04791259765625, 0.0692901611328125, 0.090667724609375, 0.1120452880859375, 0.1334228515625, 0.1548004150390625, 0.176177978515625, 0.1975555419921875, 0.21893310546875, 0.2403106689453125, 0.261688232421875, 0.2830657958984375, 0.304443359375, 0.3258209228515625, 0.347198486328125, 0.3685760498046875, 0.38995361328125, 0.4113311767578125, 0.432708740234375, 0.4540863037109375, 0.4754638671875, 0.4968414306640625, 0.518218994140625, 0.5395965576171875, 0.56097412109375, 0.5823516845703125, 0.603729248046875, 0.6251068115234375, 0.646484375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 28.0, 524.0, 450.0, 13.0, 4.0, 1.0], "bins": [-0.6063457131385803, -0.596233606338501, -0.5861214995384216, -0.5760093927383423, -0.5658973455429077, -0.5557852387428284, -0.545673131942749, -0.5355610251426697, -0.5254489183425903, -0.515336811542511, -0.5052247047424316, -0.4951126277446747, -0.48500052094459534, -0.474888414144516, -0.46477633714675903, -0.4546642303466797, -0.44455212354660034, -0.434440016746521, -0.42432790994644165, -0.4142158329486847, -0.40410372614860535, -0.393991619348526, -0.38387954235076904, -0.3737674355506897, -0.36365532875061035, -0.353543221950531, -0.34343111515045166, -0.3333190381526947, -0.32320693135261536, -0.313094824552536, -0.30298274755477905, -0.2928706407546997, -0.28275853395462036, -0.272646427154541, -0.26253432035446167, -0.2524222433567047, -0.24231013655662537, -0.23219802975654602, -0.22208593785762787, -0.21197384595870972, -0.20186173915863037, -0.19174963235855103, -0.18163754045963287, -0.17152544856071472, -0.16141334176063538, -0.15130123496055603, -0.14118914306163788, -0.13107705116271973, -0.12096494436264038, -0.11085284501314163, -0.10074074566364288, -0.09062864631414413, -0.08051654696464539, -0.07040444761514664, -0.06029234826564789, -0.05018024891614914, -0.04006815329194069, -0.02995605394244194, -0.01984395459294319, -0.009731855243444443, 0.00038024410605430603, 0.010492343455553055, 0.020604442805051804, 0.030716542154550552, 0.0408286415040493]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 12.0, 10.0, 19.0, 8.0, 15.0, 16.0, 18.0, 17.0, 14.0, 26.0, 25.0, 20.0, 33.0, 29.0, 37.0, 51.0, 36.0, 44.0, 53.0, 31.0, 47.0, 60.0, 40.0, 38.0, 35.0, 35.0, 36.0, 22.0, 20.0, 23.0, 18.0, 16.0, 18.0, 10.0, 15.0, 11.0, 5.0, 11.0, 6.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.026995837688446045, -0.026118773967027664, -0.025241708382964134, -0.024364642798900604, -0.023487579077482224, -0.022610515356063843, -0.021733449772000313, -0.020856384187936783, -0.019979320466518402, -0.01910225674510002, -0.01822519116103649, -0.01734812557697296, -0.01647106185555458, -0.015593997202813625, -0.01471693255007267, -0.013839867897331715, -0.01296280324459076, -0.012085738591849804, -0.011208673939108849, -0.010331609286367893, -0.009454544633626938, -0.008577479980885983, -0.007700415328145027, -0.006823350675404072, -0.0059462860226631165, -0.005069221369922161, -0.004192156717181206, -0.0033150920644402504, -0.002438027411699295, -0.0015609627589583397, -0.0006838981062173843, 0.00019316654652357101, 0.0010702311992645264, 0.0019472958520054817, 0.002824360504746437, 0.0037014251574873924, 0.004578489810228348, 0.005455554462969303, 0.0063326191157102585, 0.007209683768451214, 0.00808674842119217, 0.008963813073933125, 0.00984087772667408, 0.010717942379415035, 0.01159500703215599, 0.012472071684896946, 0.013349136337637901, 0.014226200990378857, 0.015103265643119812, 0.015980329364538193, 0.016857394948601723, 0.017734460532665253, 0.018611524254083633, 0.019488587975502014, 0.020365653559565544, 0.021242719143629074, 0.022119782865047455, 0.022996846586465836, 0.023873912170529366, 0.024750977754592896, 0.025628041476011276, 0.026505105197429657, 0.027382170781493187, 0.028259236365556717, 0.029136300086975098]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 9.0, 9.0, 7.0, 15.0, 10.0, 15.0, 16.0, 10.0, 19.0, 20.0, 20.0, 21.0, 37.0, 30.0, 27.0, 45.0, 37.0, 32.0, 44.0, 40.0, 38.0, 43.0, 31.0, 43.0, 40.0, 39.0, 24.0, 34.0, 37.0, 19.0, 32.0, 27.0, 15.0, 24.0, 20.0, 12.0, 10.0, 6.0, 10.0, 7.0, 6.0, 5.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9202728271484375, -1.864959716796875, -1.8096466064453125, -1.75433349609375, -1.6990203857421875, -1.643707275390625, -1.5883941650390625, -1.5330810546875, -1.4777679443359375, -1.422454833984375, -1.3671417236328125, -1.31182861328125, -1.2565155029296875, -1.201202392578125, -1.1458892822265625, -1.090576171875, -1.0352630615234375, -0.979949951171875, -0.9246368408203125, -0.86932373046875, -0.8140106201171875, -0.758697509765625, -0.7033843994140625, -0.6480712890625, -0.5927581787109375, -0.537445068359375, -0.4821319580078125, -0.42681884765625, -0.3715057373046875, -0.316192626953125, -0.2608795166015625, -0.20556640625, -0.1502532958984375, -0.094940185546875, -0.0396270751953125, 0.01568603515625, 0.0709991455078125, 0.126312255859375, 0.1816253662109375, 0.2369384765625, 0.2922515869140625, 0.347564697265625, 0.4028778076171875, 0.45819091796875, 0.5135040283203125, 0.568817138671875, 0.6241302490234375, 0.679443359375, 0.7347564697265625, 0.790069580078125, 0.8453826904296875, 0.90069580078125, 0.9560089111328125, 1.011322021484375, 1.0666351318359375, 1.1219482421875, 1.1772613525390625, 1.232574462890625, 1.2878875732421875, 1.34320068359375, 1.3985137939453125, 1.453826904296875, 1.5091400146484375, 1.564453125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 10.0, 8.0, 6.0, 8.0, 13.0, 30.0, 39.0, 68.0, 86.0, 120.0, 176.0, 236.0, 416.0, 636.0, 981.0, 1699.0, 3060.0, 5221.0, 9562.0, 18013.0, 35089.0, 71360.0, 150738.0, 291579.0, 236689.0, 110410.0, 53547.0, 26696.0, 14165.0, 7504.0, 4120.0, 2425.0, 1535.0, 821.0, 490.0, 329.0, 224.0, 137.0, 97.0, 72.0, 52.0, 30.0, 24.0, 12.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7184600830078125, -1.656646728515625, -1.5948333740234375, -1.53302001953125, -1.4712066650390625, -1.409393310546875, -1.3475799560546875, -1.2857666015625, -1.2239532470703125, -1.162139892578125, -1.1003265380859375, -1.03851318359375, -0.9766998291015625, -0.914886474609375, -0.8530731201171875, -0.791259765625, -0.7294464111328125, -0.667633056640625, -0.6058197021484375, -0.54400634765625, -0.4821929931640625, -0.420379638671875, -0.3585662841796875, -0.2967529296875, -0.2349395751953125, -0.173126220703125, -0.1113128662109375, -0.04949951171875, 0.0123138427734375, 0.074127197265625, 0.1359405517578125, 0.19775390625, 0.2595672607421875, 0.321380615234375, 0.3831939697265625, 0.44500732421875, 0.5068206787109375, 0.568634033203125, 0.6304473876953125, 0.6922607421875, 0.7540740966796875, 0.815887451171875, 0.8777008056640625, 0.93951416015625, 1.0013275146484375, 1.063140869140625, 1.1249542236328125, 1.186767578125, 1.2485809326171875, 1.310394287109375, 1.3722076416015625, 1.43402099609375, 1.4958343505859375, 1.557647705078125, 1.6194610595703125, 1.6812744140625, 1.7430877685546875, 1.804901123046875, 1.8667144775390625, 1.92852783203125, 1.9903411865234375, 2.052154541015625, 2.1139678955078125, 2.17578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 5.0, 9.0, 17.0, 7.0, 13.0, 22.0, 23.0, 23.0, 33.0, 34.0, 41.0, 43.0, 35.0, 59.0, 118.0, 229.0, 1404.0, 363.0, 154.0, 81.0, 40.0, 39.0, 30.0, 31.0, 30.0, 27.0, 28.0, 17.0, 15.0, 8.0, 8.0, 14.0, 7.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.921875, -4.7763671875, -4.630859375, -4.4853515625, -4.33984375, -4.1943359375, -4.048828125, -3.9033203125, -3.7578125, -3.6123046875, -3.466796875, -3.3212890625, -3.17578125, -3.0302734375, -2.884765625, -2.7392578125, -2.59375, -2.4482421875, -2.302734375, -2.1572265625, -2.01171875, -1.8662109375, -1.720703125, -1.5751953125, -1.4296875, -1.2841796875, -1.138671875, -0.9931640625, -0.84765625, -0.7021484375, -0.556640625, -0.4111328125, -0.265625, -0.1201171875, 0.025390625, 0.1708984375, 0.31640625, 0.4619140625, 0.607421875, 0.7529296875, 0.8984375, 1.0439453125, 1.189453125, 1.3349609375, 1.48046875, 1.6259765625, 1.771484375, 1.9169921875, 2.0625, 2.2080078125, 2.353515625, 2.4990234375, 2.64453125, 2.7900390625, 2.935546875, 3.0810546875, 3.2265625, 3.3720703125, 3.517578125, 3.6630859375, 3.80859375, 3.9541015625, 4.099609375, 4.2451171875, 4.390625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 4.0, 15.0, 15.0, 26.0, 40.0, 39.0, 51.0, 90.0, 95.0, 125.0, 182.0, 292.0, 464.0, 1016.0, 10232.0, 2963873.0, 164692.0, 2436.0, 733.0, 369.0, 249.0, 174.0, 109.0, 84.0, 84.0, 39.0, 32.0, 32.0, 20.0, 15.0, 14.0, 12.0, 6.0, 6.0, 9.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.765625, -11.356689453125, -10.94775390625, -10.538818359375, -10.1298828125, -9.720947265625, -9.31201171875, -8.903076171875, -8.494140625, -8.085205078125, -7.67626953125, -7.267333984375, -6.8583984375, -6.449462890625, -6.04052734375, -5.631591796875, -5.22265625, -4.813720703125, -4.40478515625, -3.995849609375, -3.5869140625, -3.177978515625, -2.76904296875, -2.360107421875, -1.951171875, -1.542236328125, -1.13330078125, -0.724365234375, -0.3154296875, 0.093505859375, 0.50244140625, 0.911376953125, 1.3203125, 1.729248046875, 2.13818359375, 2.547119140625, 2.9560546875, 3.364990234375, 3.77392578125, 4.182861328125, 4.591796875, 5.000732421875, 5.40966796875, 5.818603515625, 6.2275390625, 6.636474609375, 7.04541015625, 7.454345703125, 7.86328125, 8.272216796875, 8.68115234375, 9.090087890625, 9.4990234375, 9.907958984375, 10.31689453125, 10.725830078125, 11.134765625, 11.543701171875, 11.95263671875, 12.361572265625, 12.7705078125, 13.179443359375, 13.58837890625, 13.997314453125, 14.40625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 31.0, 359.0, 513.0, 104.0, 8.0, 1.0], "bins": [-94.95520782470703, -93.37904357910156, -91.8028793334961, -90.22671508789062, -88.65054321289062, -87.07437896728516, -85.49821472167969, -83.92205047607422, -82.34588623046875, -80.76972198486328, -79.19355773925781, -77.61739349365234, -76.04122924804688, -74.46505737304688, -72.8888931274414, -71.31272888183594, -69.73656463623047, -68.160400390625, -66.58423614501953, -65.00807189941406, -63.43190383911133, -61.85573959350586, -60.279571533203125, -58.703407287597656, -57.12724304199219, -55.55107879638672, -53.97491455078125, -52.398746490478516, -50.82258224487305, -49.24641799926758, -47.670249938964844, -46.094085693359375, -44.517921447753906, -42.94175720214844, -41.36559295654297, -39.789424896240234, -38.213260650634766, -36.6370964050293, -35.06092834472656, -33.484764099121094, -31.908601760864258, -30.332435607910156, -28.756271362304688, -27.18010711669922, -25.603940963745117, -24.027774810791016, -22.451610565185547, -20.875446319580078, -19.299280166625977, -17.723114013671875, -16.146949768066406, -14.570784568786621, -12.994619369506836, -11.41845417022705, -9.842288970947266, -8.26612377166748, -6.689958095550537, -5.113792896270752, -3.537627696990967, -1.9614624977111816, -0.3852972984313965, 1.1908679008483887, 2.767033100128174, 4.343198299407959, 5.919363498687744]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 4.0, 12.0, 8.0, 12.0, 14.0, 13.0, 18.0, 18.0, 24.0, 28.0, 22.0, 25.0, 24.0, 27.0, 44.0, 33.0, 40.0, 31.0, 30.0, 51.0, 47.0, 26.0, 44.0, 38.0, 42.0, 29.0, 38.0, 28.0, 29.0, 29.0, 24.0, 23.0, 14.0, 16.0, 17.0, 13.0, 10.0, 10.0, 8.0, 5.0, 6.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.294658660888672, -10.940302848815918, -10.58594799041748, -10.231592178344727, -9.877237319946289, -9.522881507873535, -9.168525695800781, -8.814170837402344, -8.459815979003906, -8.105460166931152, -7.751105308532715, -7.396749496459961, -7.042394638061523, -6.6880388259887695, -6.333683490753174, -5.979328155517578, -5.624972343444824, -5.2706170082092285, -4.916261672973633, -4.561905860900879, -4.207551002502441, -3.8531954288482666, -3.498839855194092, -3.144484519958496, -2.7901291847229004, -2.4357738494873047, -2.081418514251709, -1.7270629405975342, -1.3727076053619385, -1.0183522701263428, -0.663996696472168, -0.30964136123657227, 0.04471302032470703, 0.3990684151649475, 0.753423810005188, 1.1077792644500732, 1.462134599685669, 1.8164899349212646, 2.1708455085754395, 2.525200843811035, 2.879556179046631, 3.2339115142822266, 3.5882668495178223, 3.942622423171997, 4.296977996826172, 4.651332855224609, 5.005688667297363, 5.360044002532959, 5.714399337768555, 6.06875467300415, 6.423110008239746, 6.7774658203125, 7.1318206787109375, 7.486176490783691, 7.840531826019287, 8.194887161254883, 8.54924201965332, 8.903597831726074, 9.257952690124512, 9.612308502197266, 9.966663360595703, 10.321019172668457, 10.675374984741211, 11.029729843139648, 11.384085655212402]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 9.0, 12.0, 10.0, 10.0, 14.0, 14.0, 14.0, 20.0, 16.0, 32.0, 37.0, 29.0, 23.0, 36.0, 44.0, 36.0, 42.0, 35.0, 35.0, 28.0, 43.0, 31.0, 45.0, 38.0, 31.0, 31.0, 36.0, 24.0, 24.0, 21.0, 27.0, 17.0, 18.0, 9.0, 15.0, 17.0, 9.0, 11.0, 10.0, 1.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.590972900390625, -1.53741455078125, -1.483856201171875, -1.4302978515625, -1.376739501953125, -1.32318115234375, -1.269622802734375, -1.216064453125, -1.162506103515625, -1.10894775390625, -1.055389404296875, -1.0018310546875, -0.948272705078125, -0.89471435546875, -0.841156005859375, -0.78759765625, -0.734039306640625, -0.68048095703125, -0.626922607421875, -0.5733642578125, -0.519805908203125, -0.46624755859375, -0.412689208984375, -0.359130859375, -0.305572509765625, -0.25201416015625, -0.198455810546875, -0.1448974609375, -0.091339111328125, -0.03778076171875, 0.015777587890625, 0.0693359375, 0.122894287109375, 0.17645263671875, 0.230010986328125, 0.2835693359375, 0.337127685546875, 0.39068603515625, 0.444244384765625, 0.497802734375, 0.551361083984375, 0.60491943359375, 0.658477783203125, 0.7120361328125, 0.765594482421875, 0.81915283203125, 0.872711181640625, 0.92626953125, 0.979827880859375, 1.03338623046875, 1.086944580078125, 1.1405029296875, 1.194061279296875, 1.24761962890625, 1.301177978515625, 1.354736328125, 1.408294677734375, 1.46185302734375, 1.515411376953125, 1.5689697265625, 1.622528076171875, 1.67608642578125, 1.729644775390625, 1.783203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 7.0, 10.0, 9.0, 24.0, 39.0, 42.0, 69.0, 83.0, 148.0, 230.0, 316.0, 439.0, 722.0, 1214.0, 2217.0, 4784.0, 12668.0, 56318.0, 590082.0, 2721340.0, 711678.0, 65885.0, 14384.0, 5298.0, 2530.0, 1384.0, 814.0, 512.0, 305.0, 214.0, 126.0, 110.0, 86.0, 56.0, 33.0, 30.0, 24.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.695892333984375, -3.56170654296875, -3.427520751953125, -3.2933349609375, -3.159149169921875, -3.02496337890625, -2.890777587890625, -2.756591796875, -2.622406005859375, -2.48822021484375, -2.354034423828125, -2.2198486328125, -2.085662841796875, -1.95147705078125, -1.817291259765625, -1.68310546875, -1.548919677734375, -1.41473388671875, -1.280548095703125, -1.1463623046875, -1.012176513671875, -0.87799072265625, -0.743804931640625, -0.609619140625, -0.475433349609375, -0.34124755859375, -0.207061767578125, -0.0728759765625, 0.061309814453125, 0.19549560546875, 0.329681396484375, 0.4638671875, 0.598052978515625, 0.73223876953125, 0.866424560546875, 1.0006103515625, 1.134796142578125, 1.26898193359375, 1.403167724609375, 1.537353515625, 1.671539306640625, 1.80572509765625, 1.939910888671875, 2.0740966796875, 2.208282470703125, 2.34246826171875, 2.476654052734375, 2.61083984375, 2.745025634765625, 2.87921142578125, 3.013397216796875, 3.1475830078125, 3.281768798828125, 3.41595458984375, 3.550140380859375, 3.684326171875, 3.818511962890625, 3.95269775390625, 4.086883544921875, 4.2210693359375, 4.355255126953125, 4.48944091796875, 4.623626708984375, 4.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 18.0, 10.0, 34.0, 25.0, 37.0, 66.0, 68.0, 101.0, 170.0, 214.0, 329.0, 489.0, 629.0, 557.0, 418.0, 256.0, 179.0, 125.0, 94.0, 77.0, 58.0, 33.0, 25.0, 21.0, 10.0, 7.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.58770751953125, -4.4722900390625, -4.35687255859375, -4.241455078125, -4.12603759765625, -4.0106201171875, -3.89520263671875, -3.77978515625, -3.66436767578125, -3.5489501953125, -3.43353271484375, -3.318115234375, -3.20269775390625, -3.0872802734375, -2.97186279296875, -2.8564453125, -2.74102783203125, -2.6256103515625, -2.51019287109375, -2.394775390625, -2.27935791015625, -2.1639404296875, -2.04852294921875, -1.93310546875, -1.81768798828125, -1.7022705078125, -1.58685302734375, -1.471435546875, -1.35601806640625, -1.2406005859375, -1.12518310546875, -1.009765625, -0.89434814453125, -0.7789306640625, -0.66351318359375, -0.548095703125, -0.43267822265625, -0.3172607421875, -0.20184326171875, -0.08642578125, 0.02899169921875, 0.1444091796875, 0.25982666015625, 0.375244140625, 0.49066162109375, 0.6060791015625, 0.72149658203125, 0.8369140625, 0.95233154296875, 1.0677490234375, 1.18316650390625, 1.298583984375, 1.41400146484375, 1.5294189453125, 1.64483642578125, 1.76025390625, 1.87567138671875, 1.9910888671875, 2.10650634765625, 2.221923828125, 2.33734130859375, 2.4527587890625, 2.56817626953125, 2.68359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 13.0, 13.0, 29.0, 53.0, 91.0, 140.0, 293.0, 681.0, 1799.0, 6182.0, 34899.0, 537197.0, 3398630.0, 189741.0, 18417.0, 3830.0, 1184.0, 525.0, 239.0, 129.0, 66.0, 36.0, 29.0, 24.0, 10.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8343505859375, -7.606201171875, -7.3780517578125, -7.14990234375, -6.9217529296875, -6.693603515625, -6.4654541015625, -6.2373046875, -6.0091552734375, -5.781005859375, -5.5528564453125, -5.32470703125, -5.0965576171875, -4.868408203125, -4.6402587890625, -4.412109375, -4.1839599609375, -3.955810546875, -3.7276611328125, -3.49951171875, -3.2713623046875, -3.043212890625, -2.8150634765625, -2.5869140625, -2.3587646484375, -2.130615234375, -1.9024658203125, -1.67431640625, -1.4461669921875, -1.218017578125, -0.9898681640625, -0.76171875, -0.5335693359375, -0.305419921875, -0.0772705078125, 0.15087890625, 0.3790283203125, 0.607177734375, 0.8353271484375, 1.0634765625, 1.2916259765625, 1.519775390625, 1.7479248046875, 1.97607421875, 2.2042236328125, 2.432373046875, 2.6605224609375, 2.888671875, 3.1168212890625, 3.344970703125, 3.5731201171875, 3.80126953125, 4.0294189453125, 4.257568359375, 4.4857177734375, 4.7138671875, 4.9420166015625, 5.170166015625, 5.3983154296875, 5.62646484375, 5.8546142578125, 6.082763671875, 6.3109130859375, 6.5390625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 60.0, 202.0, 400.0, 240.0, 85.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.944175720214844, -33.57929229736328, -32.21440505981445, -30.84952163696289, -29.484634399414062, -28.1197509765625, -26.754865646362305, -25.38998031616211, -24.025094985961914, -22.66020965576172, -21.295324325561523, -19.930438995361328, -18.565555572509766, -17.200668334960938, -15.835784912109375, -14.47089958190918, -13.106014251708984, -11.741128921508789, -10.376243591308594, -9.011359214782715, -7.6464738845825195, -6.281588554382324, -4.916704177856445, -3.55181884765625, -2.1869335174560547, -0.8220484256744385, 0.5428366661071777, 1.9077215194702148, 3.27260684967041, 4.6374921798706055, 6.002376556396484, 7.36726188659668, 8.732147216796875, 10.09703254699707, 11.461917877197266, 12.826802253723145, 14.19168758392334, 15.556572914123535, 16.921457290649414, 18.28634262084961, 19.651227951049805, 21.01611328125, 22.380998611450195, 23.74588394165039, 25.110767364501953, 26.47565460205078, 27.840538024902344, 29.20542335510254, 30.570308685302734, 31.93519401550293, 33.300079345703125, 34.66496276855469, 36.029850006103516, 37.39473342895508, 38.759620666503906, 40.12450408935547, 41.48938751220703, 42.854270935058594, 44.21915817260742, 45.584041595458984, 46.94892883300781, 48.313812255859375, 49.67869567871094, 51.043582916259766, 52.408470153808594]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 4.0, 11.0, 13.0, 14.0, 14.0, 17.0, 18.0, 21.0, 24.0, 31.0, 20.0, 23.0, 34.0, 43.0, 44.0, 29.0, 41.0, 41.0, 38.0, 40.0, 36.0, 36.0, 41.0, 30.0, 42.0, 36.0, 47.0, 32.0, 25.0, 23.0, 24.0, 17.0, 16.0, 15.0, 8.0, 14.0, 5.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.979555130004883, -9.61448860168457, -9.249422073364258, -8.884355545043945, -8.519288063049316, -8.154221534729004, -7.789155006408691, -7.424088478088379, -7.059021472930908, -6.693954944610596, -6.328887939453125, -5.9638214111328125, -5.5987548828125, -5.233687877655029, -4.868621349334717, -4.503554344177246, -4.138487815856934, -3.773421049118042, -3.4083542823791504, -3.043287754058838, -2.6782209873199463, -2.3131542205810547, -1.9480876922607422, -1.5830209255218506, -1.217954158782959, -0.8528874516487122, -0.48782074451446533, -0.12275409698486328, 0.24231266975402832, 0.6073794364929199, 0.9724459648132324, 1.337512731552124, 1.7025794982910156, 2.0676462650299072, 2.432713031768799, 2.7977795600891113, 3.162846326828003, 3.5279130935668945, 3.892979621887207, 4.2580461502075195, 4.62311315536499, 4.988179683685303, 5.353246688842773, 5.718313217163086, 6.083379745483398, 6.448446750640869, 6.813513278961182, 7.178580284118652, 7.543646812438965, 7.908713340759277, 8.27377986907959, 8.638847351074219, 9.003913879394531, 9.368980407714844, 9.734046936035156, 10.099113464355469, 10.464179992675781, 10.829246520996094, 11.194313049316406, 11.559379577636719, 11.924447059631348, 12.28951358795166, 12.654580116271973, 13.019646644592285, 13.384714126586914]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 12.0, 12.0, 14.0, 19.0, 14.0, 17.0, 21.0, 20.0, 20.0, 33.0, 21.0, 40.0, 33.0, 33.0, 56.0, 41.0, 40.0, 35.0, 46.0, 41.0, 42.0, 41.0, 46.0, 35.0, 31.0, 25.0, 22.0, 22.0, 26.0, 25.0, 13.0, 18.0, 15.0, 16.0, 6.0, 11.0, 3.0, 10.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5146484375, -1.464385986328125, -1.41412353515625, -1.363861083984375, -1.3135986328125, -1.263336181640625, -1.21307373046875, -1.162811279296875, -1.112548828125, -1.062286376953125, -1.01202392578125, -0.961761474609375, -0.9114990234375, -0.861236572265625, -0.81097412109375, -0.760711669921875, -0.71044921875, -0.660186767578125, -0.60992431640625, -0.559661865234375, -0.5093994140625, -0.459136962890625, -0.40887451171875, -0.358612060546875, -0.308349609375, -0.258087158203125, -0.20782470703125, -0.157562255859375, -0.1072998046875, -0.057037353515625, -0.00677490234375, 0.043487548828125, 0.09375, 0.144012451171875, 0.19427490234375, 0.244537353515625, 0.2947998046875, 0.345062255859375, 0.39532470703125, 0.445587158203125, 0.495849609375, 0.546112060546875, 0.59637451171875, 0.646636962890625, 0.6968994140625, 0.747161865234375, 0.79742431640625, 0.847686767578125, 0.89794921875, 0.948211669921875, 0.99847412109375, 1.048736572265625, 1.0989990234375, 1.149261474609375, 1.19952392578125, 1.249786376953125, 1.300048828125, 1.350311279296875, 1.40057373046875, 1.450836181640625, 1.5010986328125, 1.551361083984375, 1.60162353515625, 1.651885986328125, 1.7021484375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 11.0, 16.0, 16.0, 37.0, 47.0, 83.0, 158.0, 203.0, 311.0, 507.0, 805.0, 1285.0, 1891.0, 2848.0, 4360.0, 6562.0, 9963.0, 14690.0, 22082.0, 32311.0, 46717.0, 65050.0, 87197.0, 110178.0, 125615.0, 124366.0, 106860.0, 85017.0, 62368.0, 44075.0, 30658.0, 20862.0, 14149.0, 9365.0, 6113.0, 4127.0, 2632.0, 1743.0, 1157.0, 752.0, 494.0, 314.0, 208.0, 125.0, 87.0, 45.0, 34.0, 19.0, 12.0, 7.0, 7.0, 6.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.1839599609375, -0.17801284790039062, -0.17206573486328125, -0.16611862182617188, -0.1601715087890625, -0.15422439575195312, -0.14827728271484375, -0.14233016967773438, -0.136383056640625, -0.13043594360351562, -0.12448883056640625, -0.11854171752929688, -0.1125946044921875, -0.10664749145507812, -0.10070037841796875, -0.09475326538085938, -0.08880615234375, -0.08285903930664062, -0.07691192626953125, -0.07096481323242188, -0.0650177001953125, -0.059070587158203125, -0.05312347412109375, -0.047176361083984375, -0.041229248046875, -0.035282135009765625, -0.02933502197265625, -0.023387908935546875, -0.0174407958984375, -0.011493682861328125, -0.00554656982421875, 0.000400543212890625, 0.00634765625, 0.012294769287109375, 0.01824188232421875, 0.024188995361328125, 0.0301361083984375, 0.036083221435546875, 0.04203033447265625, 0.047977447509765625, 0.053924560546875, 0.059871673583984375, 0.06581878662109375, 0.07176589965820312, 0.0777130126953125, 0.08366012573242188, 0.08960723876953125, 0.09555435180664062, 0.10150146484375, 0.10744857788085938, 0.11339569091796875, 0.11934280395507812, 0.1252899169921875, 0.13123703002929688, 0.13718414306640625, 0.14313125610351562, 0.149078369140625, 0.15502548217773438, 0.16097259521484375, 0.16691970825195312, 0.1728668212890625, 0.17881393432617188, 0.18476104736328125, 0.19070816040039062, 0.1966552734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 7.0, 9.0, 7.0, 13.0, 14.0, 14.0, 10.0, 27.0, 15.0, 28.0, 27.0, 38.0, 29.0, 49.0, 46.0, 43.0, 43.0, 44.0, 44.0, 1063.0, 51.0, 29.0, 36.0, 38.0, 35.0, 41.0, 33.0, 28.0, 27.0, 19.0, 17.0, 10.0, 30.0, 10.0, 9.0, 5.0, 8.0, 9.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2576751708984375, -1.218475341796875, -1.1792755126953125, -1.14007568359375, -1.1008758544921875, -1.061676025390625, -1.0224761962890625, -0.9832763671875, -0.9440765380859375, -0.904876708984375, -0.8656768798828125, -0.82647705078125, -0.7872772216796875, -0.748077392578125, -0.7088775634765625, -0.669677734375, -0.6304779052734375, -0.591278076171875, -0.5520782470703125, -0.51287841796875, -0.4736785888671875, -0.434478759765625, -0.3952789306640625, -0.3560791015625, -0.3168792724609375, -0.277679443359375, -0.2384796142578125, -0.19927978515625, -0.1600799560546875, -0.120880126953125, -0.0816802978515625, -0.04248046875, -0.0032806396484375, 0.035919189453125, 0.0751190185546875, 0.11431884765625, 0.1535186767578125, 0.192718505859375, 0.2319183349609375, 0.2711181640625, 0.3103179931640625, 0.349517822265625, 0.3887176513671875, 0.42791748046875, 0.4671173095703125, 0.506317138671875, 0.5455169677734375, 0.584716796875, 0.6239166259765625, 0.663116455078125, 0.7023162841796875, 0.74151611328125, 0.7807159423828125, 0.819915771484375, 0.8591156005859375, 0.8983154296875, 0.9375152587890625, 0.976715087890625, 1.0159149169921875, 1.05511474609375, 1.0943145751953125, 1.133514404296875, 1.1727142333984375, 1.2119140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 15.0, 13.0, 10.0, 15.0, 34.0, 46.0, 72.0, 87.0, 129.0, 182.0, 252.0, 465.0, 674.0, 1104.0, 1697.0, 2578.0, 4070.0, 6440.0, 10054.0, 16550.0, 33883.0, 186838.0, 1652267.0, 111940.0, 27858.0, 14851.0, 8866.0, 5728.0, 3704.0, 2306.0, 1493.0, 969.0, 672.0, 429.0, 290.0, 188.0, 119.0, 63.0, 55.0, 46.0, 20.0, 12.0, 10.0, 9.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.39208984375, -0.3787498474121094, -0.36540985107421875, -0.3520698547363281, -0.3387298583984375, -0.3253898620605469, -0.31204986572265625, -0.2987098693847656, -0.285369873046875, -0.2720298767089844, -0.25868988037109375, -0.24534988403320312, -0.2320098876953125, -0.21866989135742188, -0.20532989501953125, -0.19198989868164062, -0.17864990234375, -0.16530990600585938, -0.15196990966796875, -0.13862991333007812, -0.1252899169921875, -0.11194992065429688, -0.09860992431640625, -0.08526992797851562, -0.071929931640625, -0.058589935302734375, -0.04524993896484375, -0.031909942626953125, -0.0185699462890625, -0.005229949951171875, 0.00811004638671875, 0.021450042724609375, 0.0347900390625, 0.048130035400390625, 0.06147003173828125, 0.07481002807617188, 0.0881500244140625, 0.10149002075195312, 0.11483001708984375, 0.12817001342773438, 0.141510009765625, 0.15485000610351562, 0.16819000244140625, 0.18152999877929688, 0.1948699951171875, 0.20820999145507812, 0.22154998779296875, 0.23488998413085938, 0.24822998046875, 0.2615699768066406, 0.27490997314453125, 0.2882499694824219, 0.3015899658203125, 0.3149299621582031, 0.32826995849609375, 0.3416099548339844, 0.354949951171875, 0.3682899475097656, 0.38162994384765625, 0.3949699401855469, 0.4083099365234375, 0.4216499328613281, 0.43498992919921875, 0.4483299255371094, 0.461669921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 11.0, 11.0, 14.0, 19.0, 13.0, 23.0, 26.0, 24.0, 38.0, 55.0, 37.0, 55.0, 61.0, 58.0, 48.0, 56.0, 53.0, 60.0, 46.0, 51.0, 36.0, 25.0, 24.0, 23.0, 18.0, 23.0, 13.0, 7.0, 9.0, 11.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.0247802734375, -0.02407050132751465, -0.023360729217529297, -0.022650957107543945, -0.021941184997558594, -0.021231412887573242, -0.02052164077758789, -0.01981186866760254, -0.019102096557617188, -0.018392324447631836, -0.017682552337646484, -0.016972780227661133, -0.01626300811767578, -0.01555323600769043, -0.014843463897705078, -0.014133691787719727, -0.013423919677734375, -0.012714147567749023, -0.012004375457763672, -0.01129460334777832, -0.010584831237792969, -0.009875059127807617, -0.009165287017822266, -0.008455514907836914, -0.0077457427978515625, -0.007035970687866211, -0.006326198577880859, -0.005616426467895508, -0.004906654357910156, -0.004196882247924805, -0.003487110137939453, -0.0027773380279541016, -0.00206756591796875, -0.0013577938079833984, -0.0006480216979980469, 6.175041198730469e-05, 0.0007715225219726562, 0.0014812946319580078, 0.0021910667419433594, 0.002900838851928711, 0.0036106109619140625, 0.004320383071899414, 0.005030155181884766, 0.005739927291870117, 0.006449699401855469, 0.00715947151184082, 0.007869243621826172, 0.008579015731811523, 0.009288787841796875, 0.009998559951782227, 0.010708332061767578, 0.01141810417175293, 0.012127876281738281, 0.012837648391723633, 0.013547420501708984, 0.014257192611694336, 0.014966964721679688, 0.01567673683166504, 0.01638650894165039, 0.017096281051635742, 0.017806053161621094, 0.018515825271606445, 0.019225597381591797, 0.01993536949157715, 0.0206451416015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 7.0, 13.0, 18.0, 17.0, 17.0, 30.0, 48.0, 45.0, 52.0, 101.0, 116.0, 185.0, 298.0, 527.0, 1499.0, 75850.0, 958788.0, 8792.0, 864.0, 412.0, 239.0, 155.0, 119.0, 73.0, 56.0, 55.0, 41.0, 36.0, 18.0, 12.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.397216796875, -0.3831825256347656, -0.36914825439453125, -0.3551139831542969, -0.3410797119140625, -0.3270454406738281, -0.31301116943359375, -0.2989768981933594, -0.284942626953125, -0.2709083557128906, -0.25687408447265625, -0.24283981323242188, -0.2288055419921875, -0.21477127075195312, -0.20073699951171875, -0.18670272827148438, -0.17266845703125, -0.15863418579101562, -0.14459991455078125, -0.13056564331054688, -0.1165313720703125, -0.10249710083007812, -0.08846282958984375, -0.07442855834960938, -0.060394287109375, -0.046360015869140625, -0.03232574462890625, -0.018291473388671875, -0.0042572021484375, 0.009777069091796875, 0.02381134033203125, 0.037845611572265625, 0.0518798828125, 0.06591415405273438, 0.07994842529296875, 0.09398269653320312, 0.1080169677734375, 0.12205123901367188, 0.13608551025390625, 0.15011978149414062, 0.164154052734375, 0.17818832397460938, 0.19222259521484375, 0.20625686645507812, 0.2202911376953125, 0.23432540893554688, 0.24835968017578125, 0.2623939514160156, 0.27642822265625, 0.2904624938964844, 0.30449676513671875, 0.3185310363769531, 0.3325653076171875, 0.3465995788574219, 0.36063385009765625, 0.3746681213378906, 0.388702392578125, 0.4027366638183594, 0.41677093505859375, 0.4308052062988281, 0.4448394775390625, 0.4588737487792969, 0.47290802001953125, 0.4869422912597656, 0.5009765625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 6.0, 32.0, 223.0, 574.0, 160.0, 15.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03916732966899872, -0.03387698903679848, -0.028586646541953087, -0.023296304047107697, -0.018005963414907455, -0.012715622782707214, -0.007425278425216675, -0.0021349377930164337, 0.0031554028391838074, 0.008445744402706623, 0.013736085966229439, 0.01902642846107483, 0.02431676909327507, 0.02960710972547531, 0.03489745408296585, 0.04018779471516609, 0.04547813534736633, 0.050768475979566574, 0.056058816611766815, 0.061349160969257355, 0.0666394978761673, 0.07192984223365784, 0.07722018659114838, 0.08251053094863892, 0.08780086785554886, 0.0930912122130394, 0.09838154911994934, 0.10367189347743988, 0.10896223783493042, 0.11425257474184036, 0.1195429190993309, 0.12483325600624084, 0.1301235854625702, 0.13541392982006073, 0.14070427417755127, 0.14599460363388062, 0.15128494799137115, 0.1565752923488617, 0.16186563670635223, 0.16715598106384277, 0.17244631052017212, 0.17773665487766266, 0.1830269992351532, 0.18831732869148254, 0.19360767304897308, 0.19889801740646362, 0.20418836176395416, 0.2094787061214447, 0.21476905047893524, 0.22005939483642578, 0.22534973919391632, 0.23064008355140686, 0.2359304130077362, 0.24122075736522675, 0.24651110172271729, 0.25180143117904663, 0.25709179043769836, 0.2623821198940277, 0.26767247915267944, 0.2729628086090088, 0.2782531678676605, 0.28354349732398987, 0.2888338565826416, 0.29412418603897095, 0.2994145154953003]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 12.0, 6.0, 12.0, 21.0, 21.0, 25.0, 32.0, 57.0, 41.0, 60.0, 54.0, 70.0, 54.0, 68.0, 59.0, 60.0, 52.0, 57.0, 42.0, 36.0, 34.0, 30.0, 24.0, 22.0, 15.0, 16.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.047025442123413086, -0.04588892683386803, -0.04475241154432297, -0.04361589252948761, -0.04247937723994255, -0.04134286195039749, -0.040206342935562134, -0.039069827646017075, -0.037933312356472015, -0.036796797066926956, -0.0356602817773819, -0.03452376276254654, -0.03338724747300148, -0.03225073218345642, -0.031114215031266212, -0.029977697879076004, -0.028841182589530945, -0.027704667299985886, -0.026568150147795677, -0.02543163299560547, -0.02429511770606041, -0.02315860241651535, -0.022022085264325142, -0.020885568112134933, -0.019749052822589874, -0.018612537533044815, -0.017476020380854607, -0.016339503228664398, -0.015202987939119339, -0.014066471718251705, -0.012929955497384071, -0.011793439276516438, -0.010656923055648804, -0.00952040683478117, -0.008383890613913536, -0.007247374393045902, -0.006110858172178268, -0.004974341951310635, -0.003837825730443001, -0.002701309509575367, -0.0015647932887077332, -0.00042827706784009933, 0.0007082391530275345, 0.0018447553738951683, 0.002981271594762802, 0.004117787815630436, 0.00525430403649807, 0.006390820257365704, 0.007527336478233337, 0.008663852699100971, 0.009800368919968605, 0.010936885140836239, 0.012073401361703873, 0.013209917582571507, 0.01434643380343914, 0.015482950024306774, 0.016619466245174408, 0.017755981534719467, 0.018892498686909676, 0.020029015839099884, 0.021165531128644943, 0.022302046418190002, 0.02343856357038021, 0.02457508072257042, 0.02571159601211548]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 8.0, 9.0, 13.0, 11.0, 18.0, 20.0, 20.0, 15.0, 25.0, 29.0, 28.0, 28.0, 32.0, 40.0, 32.0, 41.0, 49.0, 30.0, 48.0, 43.0, 37.0, 34.0, 34.0, 30.0, 31.0, 32.0, 38.0, 39.0, 30.0, 23.0, 27.0, 25.0, 7.0, 13.0, 9.0, 12.0, 9.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.4086151123046875, -1.358245849609375, -1.3078765869140625, -1.25750732421875, -1.2071380615234375, -1.156768798828125, -1.1063995361328125, -1.0560302734375, -1.0056610107421875, -0.955291748046875, -0.9049224853515625, -0.85455322265625, -0.8041839599609375, -0.753814697265625, -0.7034454345703125, -0.653076171875, -0.6027069091796875, -0.552337646484375, -0.5019683837890625, -0.45159912109375, -0.4012298583984375, -0.350860595703125, -0.3004913330078125, -0.2501220703125, -0.1997528076171875, -0.149383544921875, -0.0990142822265625, -0.04864501953125, 0.0017242431640625, 0.052093505859375, 0.1024627685546875, 0.15283203125, 0.2032012939453125, 0.253570556640625, 0.3039398193359375, 0.35430908203125, 0.4046783447265625, 0.455047607421875, 0.5054168701171875, 0.5557861328125, 0.6061553955078125, 0.656524658203125, 0.7068939208984375, 0.75726318359375, 0.8076324462890625, 0.858001708984375, 0.9083709716796875, 0.958740234375, 1.0091094970703125, 1.059478759765625, 1.1098480224609375, 1.16021728515625, 1.2105865478515625, 1.260955810546875, 1.3113250732421875, 1.3616943359375, 1.4120635986328125, 1.462432861328125, 1.5128021240234375, 1.56317138671875, 1.6135406494140625, 1.663909912109375, 1.7142791748046875, 1.7646484375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 8.0, 10.0, 11.0, 23.0, 32.0, 46.0, 62.0, 86.0, 131.0, 217.0, 320.0, 431.0, 687.0, 1108.0, 1792.0, 3084.0, 5430.0, 10568.0, 24690.0, 71820.0, 283128.0, 459316.0, 117941.0, 36483.0, 14486.0, 6837.0, 3759.0, 2181.0, 1351.0, 833.0, 552.0, 374.0, 247.0, 155.0, 112.0, 74.0, 48.0, 38.0, 27.0, 21.0, 13.0, 10.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.65631103515625, -2.5762939453125, -2.49627685546875, -2.416259765625, -2.33624267578125, -2.2562255859375, -2.17620849609375, -2.09619140625, -2.01617431640625, -1.9361572265625, -1.85614013671875, -1.776123046875, -1.69610595703125, -1.6160888671875, -1.53607177734375, -1.4560546875, -1.37603759765625, -1.2960205078125, -1.21600341796875, -1.135986328125, -1.05596923828125, -0.9759521484375, -0.89593505859375, -0.81591796875, -0.73590087890625, -0.6558837890625, -0.57586669921875, -0.495849609375, -0.41583251953125, -0.3358154296875, -0.25579833984375, -0.17578125, -0.09576416015625, -0.0157470703125, 0.06427001953125, 0.144287109375, 0.22430419921875, 0.3043212890625, 0.38433837890625, 0.46435546875, 0.54437255859375, 0.6243896484375, 0.70440673828125, 0.784423828125, 0.86444091796875, 0.9444580078125, 1.02447509765625, 1.1044921875, 1.18450927734375, 1.2645263671875, 1.34454345703125, 1.424560546875, 1.50457763671875, 1.5845947265625, 1.66461181640625, 1.74462890625, 1.82464599609375, 1.9046630859375, 1.98468017578125, 2.064697265625, 2.14471435546875, 2.2247314453125, 2.30474853515625, 2.384765625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 2.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 14.0, 19.0, 16.0, 14.0, 22.0, 22.0, 35.0, 28.0, 37.0, 49.0, 73.0, 88.0, 96.0, 208.0, 1407.0, 262.0, 154.0, 86.0, 49.0, 35.0, 52.0, 34.0, 35.0, 25.0, 28.0, 29.0, 16.0, 13.0, 12.0, 12.0, 16.0, 10.0, 8.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.05859375, -3.9451904296875, -3.831787109375, -3.7183837890625, -3.60498046875, -3.4915771484375, -3.378173828125, -3.2647705078125, -3.1513671875, -3.0379638671875, -2.924560546875, -2.8111572265625, -2.69775390625, -2.5843505859375, -2.470947265625, -2.3575439453125, -2.244140625, -2.1307373046875, -2.017333984375, -1.9039306640625, -1.79052734375, -1.6771240234375, -1.563720703125, -1.4503173828125, -1.3369140625, -1.2235107421875, -1.110107421875, -0.9967041015625, -0.88330078125, -0.7698974609375, -0.656494140625, -0.5430908203125, -0.4296875, -0.3162841796875, -0.202880859375, -0.0894775390625, 0.02392578125, 0.1373291015625, 0.250732421875, 0.3641357421875, 0.4775390625, 0.5909423828125, 0.704345703125, 0.8177490234375, 0.93115234375, 1.0445556640625, 1.157958984375, 1.2713623046875, 1.384765625, 1.4981689453125, 1.611572265625, 1.7249755859375, 1.83837890625, 1.9517822265625, 2.065185546875, 2.1785888671875, 2.2919921875, 2.4053955078125, 2.518798828125, 2.6322021484375, 2.74560546875, 2.8590087890625, 2.972412109375, 3.0858154296875, 3.19921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 9.0, 8.0, 7.0, 12.0, 17.0, 26.0, 23.0, 21.0, 61.0, 87.0, 107.0, 153.0, 262.0, 456.0, 864.0, 3057.0, 124644.0, 3005783.0, 7356.0, 1301.0, 537.0, 309.0, 174.0, 127.0, 97.0, 52.0, 41.0, 27.0, 24.0, 19.0, 8.0, 7.0, 14.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8515625, -11.4591064453125, -11.066650390625, -10.6741943359375, -10.28173828125, -9.8892822265625, -9.496826171875, -9.1043701171875, -8.7119140625, -8.3194580078125, -7.927001953125, -7.5345458984375, -7.14208984375, -6.7496337890625, -6.357177734375, -5.9647216796875, -5.572265625, -5.1798095703125, -4.787353515625, -4.3948974609375, -4.00244140625, -3.6099853515625, -3.217529296875, -2.8250732421875, -2.4326171875, -2.0401611328125, -1.647705078125, -1.2552490234375, -0.86279296875, -0.4703369140625, -0.077880859375, 0.3145751953125, 0.70703125, 1.0994873046875, 1.491943359375, 1.8843994140625, 2.27685546875, 2.6693115234375, 3.061767578125, 3.4542236328125, 3.8466796875, 4.2391357421875, 4.631591796875, 5.0240478515625, 5.41650390625, 5.8089599609375, 6.201416015625, 6.5938720703125, 6.986328125, 7.3787841796875, 7.771240234375, 8.1636962890625, 8.55615234375, 8.9486083984375, 9.341064453125, 9.7335205078125, 10.1259765625, 10.5184326171875, 10.910888671875, 11.3033447265625, 11.69580078125, 12.0882568359375, 12.480712890625, 12.8731689453125, 13.265625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 17.0, 121.0, 352.0, 351.0, 129.0, 33.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.051490783691406, -53.881195068359375, -52.710899353027344, -51.54060363769531, -50.37030792236328, -49.200016021728516, -48.029720306396484, -46.85942459106445, -45.68912887573242, -44.51883316040039, -43.34853744506836, -42.17824172973633, -41.00794982910156, -39.83765411376953, -38.6673583984375, -37.49706268310547, -36.32676696777344, -35.156471252441406, -33.986175537109375, -32.815879821777344, -31.645586013793945, -30.475290298461914, -29.304996490478516, -28.134700775146484, -26.964405059814453, -25.794109344482422, -24.62381362915039, -23.453519821166992, -22.28322410583496, -21.11292839050293, -19.94263458251953, -18.7723388671875, -17.602046966552734, -16.431751251220703, -15.261456489562988, -14.091161727905273, -12.920866012573242, -11.750570297241211, -10.580275535583496, -9.409980773925781, -8.23968505859375, -7.069389820098877, -5.899094581604004, -4.728799343109131, -3.558504104614258, -2.3882088661193848, -1.2179136276245117, -0.047618865966796875, 1.1226768493652344, 2.2929720878601074, 3.4632673263549805, 4.6335625648498535, 5.803857803344727, 6.9741530418396, 8.144448280334473, 9.314743041992188, 10.485038757324219, 11.65533447265625, 12.825629234313965, 13.99592399597168, 15.166219711303711, 16.336515426635742, 17.50680923461914, 18.677104949951172, 19.847400665283203]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 6.0, 4.0, 3.0, 6.0, 5.0, 6.0, 4.0, 9.0, 14.0, 15.0, 16.0, 11.0, 19.0, 11.0, 11.0, 17.0, 17.0, 20.0, 19.0, 20.0, 22.0, 26.0, 47.0, 29.0, 21.0, 38.0, 39.0, 35.0, 33.0, 43.0, 28.0, 36.0, 23.0, 34.0, 29.0, 33.0, 30.0, 31.0, 21.0, 21.0, 19.0, 32.0, 12.0, 18.0, 14.0, 5.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.882428169250488, -7.606545925140381, -7.330663204193115, -7.054780960083008, -6.778898239135742, -6.503015995025635, -6.227133750915527, -5.951251029968262, -5.675368785858154, -5.399486541748047, -5.123603820800781, -4.847721576690674, -4.571839332580566, -4.295956611633301, -4.020074367523193, -3.744191884994507, -3.4683094024658203, -3.192426919937134, -2.9165444374084473, -2.64066219329834, -2.3647797107696533, -2.088897228240967, -1.8130148649215698, -1.5371325016021729, -1.2612500190734863, -0.9853675961494446, -0.7094851732254028, -0.4336027503013611, -0.15772032737731934, 0.11816215515136719, 0.39404451847076416, 0.6699268817901611, 0.9458093643188477, 1.2216918468475342, 1.4975742101669312, 1.7734565734863281, 2.0493390560150146, 2.325221538543701, 2.6011037826538086, 2.876986265182495, 3.1528687477111816, 3.428751230239868, 3.7046337127685547, 3.980515956878662, 4.2563982009887695, 4.532280921936035, 4.808163166046143, 5.08404541015625, 5.359928131103516, 5.635810375213623, 5.911693096160889, 6.187575340270996, 6.463458061218262, 6.739340305328369, 7.015222549438477, 7.291105270385742, 7.56698751449585, 7.842869758605957, 8.118752479553223, 8.394635200500488, 8.670516967773438, 8.946399688720703, 9.222282409667969, 9.498164176940918, 9.774046897888184]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 8.0, 4.0, 11.0, 15.0, 18.0, 21.0, 25.0, 23.0, 33.0, 31.0, 51.0, 34.0, 41.0, 38.0, 36.0, 36.0, 46.0, 41.0, 42.0, 40.0, 41.0, 44.0, 42.0, 36.0, 34.0, 32.0, 35.0, 26.0, 21.0, 15.0, 12.0, 11.0, 16.0, 8.0, 8.0, 5.0, 2.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.6447601318359375, -1.588348388671875, -1.5319366455078125, -1.47552490234375, -1.4191131591796875, -1.362701416015625, -1.3062896728515625, -1.2498779296875, -1.1934661865234375, -1.137054443359375, -1.0806427001953125, -1.02423095703125, -0.9678192138671875, -0.911407470703125, -0.8549957275390625, -0.798583984375, -0.7421722412109375, -0.685760498046875, -0.6293487548828125, -0.57293701171875, -0.5165252685546875, -0.460113525390625, -0.4037017822265625, -0.3472900390625, -0.2908782958984375, -0.234466552734375, -0.1780548095703125, -0.12164306640625, -0.0652313232421875, -0.008819580078125, 0.0475921630859375, 0.10400390625, 0.1604156494140625, 0.216827392578125, 0.2732391357421875, 0.32965087890625, 0.3860626220703125, 0.442474365234375, 0.4988861083984375, 0.5552978515625, 0.6117095947265625, 0.668121337890625, 0.7245330810546875, 0.78094482421875, 0.8373565673828125, 0.893768310546875, 0.9501800537109375, 1.006591796875, 1.0630035400390625, 1.119415283203125, 1.1758270263671875, 1.23223876953125, 1.2886505126953125, 1.345062255859375, 1.4014739990234375, 1.4578857421875, 1.5142974853515625, 1.570709228515625, 1.6271209716796875, 1.68353271484375, 1.7399444580078125, 1.796356201171875, 1.8527679443359375, 1.9091796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 25.0, 33.0, 34.0, 64.0, 93.0, 114.0, 168.0, 227.0, 318.0, 459.0, 635.0, 1011.0, 1616.0, 3124.0, 7154.0, 22899.0, 157042.0, 1659539.0, 2081296.0, 213235.0, 27975.0, 8279.0, 3486.0, 1874.0, 1134.0, 721.0, 507.0, 315.0, 228.0, 164.0, 129.0, 97.0, 66.0, 53.0, 42.0, 29.0, 19.0, 19.0, 10.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.923828125, -3.797515869140625, -3.67120361328125, -3.544891357421875, -3.4185791015625, -3.292266845703125, -3.16595458984375, -3.039642333984375, -2.913330078125, -2.787017822265625, -2.66070556640625, -2.534393310546875, -2.4080810546875, -2.281768798828125, -2.15545654296875, -2.029144287109375, -1.90283203125, -1.776519775390625, -1.65020751953125, -1.523895263671875, -1.3975830078125, -1.271270751953125, -1.14495849609375, -1.018646240234375, -0.892333984375, -0.766021728515625, -0.63970947265625, -0.513397216796875, -0.3870849609375, -0.260772705078125, -0.13446044921875, -0.008148193359375, 0.1181640625, 0.244476318359375, 0.37078857421875, 0.497100830078125, 0.6234130859375, 0.749725341796875, 0.87603759765625, 1.002349853515625, 1.128662109375, 1.254974365234375, 1.38128662109375, 1.507598876953125, 1.6339111328125, 1.760223388671875, 1.88653564453125, 2.012847900390625, 2.13916015625, 2.265472412109375, 2.39178466796875, 2.518096923828125, 2.6444091796875, 2.770721435546875, 2.89703369140625, 3.023345947265625, 3.149658203125, 3.275970458984375, 3.40228271484375, 3.528594970703125, 3.6549072265625, 3.781219482421875, 3.90753173828125, 4.033843994140625, 4.16015625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 29.0, 26.0, 44.0, 62.0, 104.0, 164.0, 245.0, 330.0, 515.0, 672.0, 586.0, 454.0, 264.0, 186.0, 106.0, 84.0, 80.0, 28.0, 18.0, 12.0, 9.0, 11.0, 5.0, 5.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.383880615234375, -3.26580810546875, -3.147735595703125, -3.0296630859375, -2.911590576171875, -2.79351806640625, -2.675445556640625, -2.557373046875, -2.439300537109375, -2.32122802734375, -2.203155517578125, -2.0850830078125, -1.967010498046875, -1.84893798828125, -1.730865478515625, -1.61279296875, -1.494720458984375, -1.37664794921875, -1.258575439453125, -1.1405029296875, -1.022430419921875, -0.90435791015625, -0.786285400390625, -0.668212890625, -0.550140380859375, -0.43206787109375, -0.313995361328125, -0.1959228515625, -0.077850341796875, 0.04022216796875, 0.158294677734375, 0.2763671875, 0.394439697265625, 0.51251220703125, 0.630584716796875, 0.7486572265625, 0.866729736328125, 0.98480224609375, 1.102874755859375, 1.220947265625, 1.339019775390625, 1.45709228515625, 1.575164794921875, 1.6932373046875, 1.811309814453125, 1.92938232421875, 2.047454833984375, 2.16552734375, 2.283599853515625, 2.40167236328125, 2.519744873046875, 2.6378173828125, 2.755889892578125, 2.87396240234375, 2.992034912109375, 3.110107421875, 3.228179931640625, 3.34625244140625, 3.464324951171875, 3.5823974609375, 3.700469970703125, 3.81854248046875, 3.936614990234375, 4.0546875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 13.0, 14.0, 10.0, 18.0, 24.0, 37.0, 59.0, 88.0, 135.0, 256.0, 545.0, 1402.0, 4836.0, 33938.0, 994288.0, 3061739.0, 85045.0, 8340.0, 1943.0, 738.0, 323.0, 182.0, 100.0, 69.0, 44.0, 15.0, 19.0, 12.0, 11.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.144775390625, -5.93408203125, -5.723388671875, -5.5126953125, -5.302001953125, -5.09130859375, -4.880615234375, -4.669921875, -4.459228515625, -4.24853515625, -4.037841796875, -3.8271484375, -3.616455078125, -3.40576171875, -3.195068359375, -2.984375, -2.773681640625, -2.56298828125, -2.352294921875, -2.1416015625, -1.930908203125, -1.72021484375, -1.509521484375, -1.298828125, -1.088134765625, -0.87744140625, -0.666748046875, -0.4560546875, -0.245361328125, -0.03466796875, 0.176025390625, 0.38671875, 0.597412109375, 0.80810546875, 1.018798828125, 1.2294921875, 1.440185546875, 1.65087890625, 1.861572265625, 2.072265625, 2.282958984375, 2.49365234375, 2.704345703125, 2.9150390625, 3.125732421875, 3.33642578125, 3.547119140625, 3.7578125, 3.968505859375, 4.17919921875, 4.389892578125, 4.6005859375, 4.811279296875, 5.02197265625, 5.232666015625, 5.443359375, 5.654052734375, 5.86474609375, 6.075439453125, 6.2861328125, 6.496826171875, 6.70751953125, 6.918212890625, 7.12890625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 277.0, 667.0, 59.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.44068908691406, -171.28453063964844, -168.12835693359375, -164.97219848632812, -161.81602478027344, -158.6598663330078, -155.50369262695312, -152.3475341796875, -149.19137573242188, -146.03521728515625, -142.87904357910156, -139.72288513183594, -136.56671142578125, -133.41055297851562, -130.25439453125, -127.09822082519531, -123.94205474853516, -120.785888671875, -117.62972259521484, -114.47355651855469, -111.31739807128906, -108.1612319946289, -105.00506591796875, -101.8488998413086, -98.69273376464844, -95.53656768798828, -92.38040161132812, -89.2242431640625, -86.06807708740234, -82.91191101074219, -79.75574493408203, -76.59957885742188, -73.44342041015625, -70.2872543334961, -67.13108825683594, -63.97492599487305, -60.818763732910156, -57.66259765625, -54.506431579589844, -51.35026550292969, -48.19410705566406, -45.037940979003906, -41.881778717041016, -38.72561264038086, -35.56945037841797, -32.41328430175781, -29.257118225097656, -26.100954055786133, -22.944787979125977, -19.788623809814453, -16.632457733154297, -13.476293563842773, -10.32012939453125, -7.163965225219727, -4.00779914855957, -0.8516349792480469, 2.3045291900634766, 5.460693836212158, 8.61685848236084, 11.77302360534668, 14.929187774658203, 18.085351943969727, 21.241518020629883, 24.397682189941406, 27.55384635925293]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 7.0, 16.0, 15.0, 14.0, 28.0, 33.0, 51.0, 50.0, 50.0, 62.0, 85.0, 62.0, 74.0, 74.0, 59.0, 62.0, 50.0, 39.0, 34.0, 36.0, 19.0, 26.0, 17.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.838165283203125, -16.26803970336914, -15.697914123535156, -15.127788543701172, -14.557662963867188, -13.987537384033203, -13.417411804199219, -12.847286224365234, -12.27716064453125, -11.707035064697266, -11.136909484863281, -10.566783905029297, -9.996658325195312, -9.426532745361328, -8.856407165527344, -8.28628158569336, -7.716156959533691, -7.146031379699707, -6.575905799865723, -6.005780220031738, -5.435654640197754, -4.8655290603637695, -4.295403957366943, -3.725278377532959, -3.1551527976989746, -2.5850272178649902, -2.014901638031006, -1.4447762966156006, -0.8746507167816162, -0.30452513694763184, 0.26560020446777344, 0.8357257843017578, 1.4058513641357422, 1.9759769439697266, 2.546102523803711, 3.116227865219116, 3.6863534450531006, 4.256479263305664, 4.82660436630249, 5.396729946136475, 5.966855525970459, 6.536981105804443, 7.107106685638428, 7.677231788635254, 8.247357368469238, 8.817482948303223, 9.387608528137207, 9.957734107971191, 10.527859687805176, 11.09798526763916, 11.668110847473145, 12.238236427307129, 12.808362007141113, 13.378487586975098, 13.948612213134766, 14.51873779296875, 15.088863372802734, 15.658988952636719, 16.229114532470703, 16.799240112304688, 17.369365692138672, 17.939491271972656, 18.50961685180664, 19.079742431640625, 19.64986801147461]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 18.0, 13.0, 15.0, 21.0, 29.0, 26.0, 29.0, 29.0, 37.0, 35.0, 45.0, 34.0, 31.0, 34.0, 34.0, 42.0, 37.0, 39.0, 41.0, 27.0, 48.0, 39.0, 37.0, 32.0, 28.0, 31.0, 22.0, 13.0, 18.0, 12.0, 11.0, 13.0, 14.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.5654296875, -1.51898193359375, -1.4725341796875, -1.42608642578125, -1.379638671875, -1.33319091796875, -1.2867431640625, -1.24029541015625, -1.19384765625, -1.14739990234375, -1.1009521484375, -1.05450439453125, -1.008056640625, -0.96160888671875, -0.9151611328125, -0.86871337890625, -0.822265625, -0.77581787109375, -0.7293701171875, -0.68292236328125, -0.636474609375, -0.59002685546875, -0.5435791015625, -0.49713134765625, -0.45068359375, -0.40423583984375, -0.3577880859375, -0.31134033203125, -0.264892578125, -0.21844482421875, -0.1719970703125, -0.12554931640625, -0.0791015625, -0.03265380859375, 0.0137939453125, 0.06024169921875, 0.106689453125, 0.15313720703125, 0.1995849609375, 0.24603271484375, 0.29248046875, 0.33892822265625, 0.3853759765625, 0.43182373046875, 0.478271484375, 0.52471923828125, 0.5711669921875, 0.61761474609375, 0.6640625, 0.71051025390625, 0.7569580078125, 0.80340576171875, 0.849853515625, 0.89630126953125, 0.9427490234375, 0.98919677734375, 1.03564453125, 1.08209228515625, 1.1285400390625, 1.17498779296875, 1.221435546875, 1.26788330078125, 1.3143310546875, 1.36077880859375, 1.4072265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 11.0, 14.0, 28.0, 34.0, 62.0, 89.0, 158.0, 196.0, 328.0, 509.0, 805.0, 1235.0, 1863.0, 3020.0, 4692.0, 7090.0, 10958.0, 16804.0, 26018.0, 39258.0, 58269.0, 84562.0, 113186.0, 137796.0, 140782.0, 120319.0, 91368.0, 64257.0, 43468.0, 28485.0, 18669.0, 12182.0, 7760.0, 5107.0, 3216.0, 2127.0, 1346.0, 868.0, 558.0, 386.0, 220.0, 153.0, 92.0, 66.0, 43.0, 36.0, 23.0, 12.0, 8.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1658935546875, -0.16056251525878906, -0.15523147583007812, -0.1499004364013672, -0.14456939697265625, -0.1392383575439453, -0.13390731811523438, -0.12857627868652344, -0.1232452392578125, -0.11791419982910156, -0.11258316040039062, -0.10725212097167969, -0.10192108154296875, -0.09659004211425781, -0.09125900268554688, -0.08592796325683594, -0.080596923828125, -0.07526588439941406, -0.06993484497070312, -0.06460380554199219, -0.05927276611328125, -0.05394172668457031, -0.048610687255859375, -0.04327964782714844, -0.0379486083984375, -0.03261756896972656, -0.027286529541015625, -0.021955490112304688, -0.01662445068359375, -0.011293411254882812, -0.005962371826171875, -0.0006313323974609375, 0.00469970703125, 0.010030746459960938, 0.015361785888671875, 0.020692825317382812, 0.02602386474609375, 0.03135490417480469, 0.036685943603515625, 0.04201698303222656, 0.0473480224609375, 0.05267906188964844, 0.058010101318359375, 0.06334114074707031, 0.06867218017578125, 0.07400321960449219, 0.07933425903320312, 0.08466529846191406, 0.089996337890625, 0.09532737731933594, 0.10065841674804688, 0.10598945617675781, 0.11132049560546875, 0.11665153503417969, 0.12198257446289062, 0.12731361389160156, 0.1326446533203125, 0.13797569274902344, 0.14330673217773438, 0.1486377716064453, 0.15396881103515625, 0.1592998504638672, 0.16463088989257812, 0.16996192932128906, 0.17529296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 7.0, 7.0, 11.0, 13.0, 11.0, 8.0, 10.0, 24.0, 16.0, 20.0, 21.0, 23.0, 23.0, 31.0, 37.0, 31.0, 32.0, 24.0, 35.0, 39.0, 33.0, 1057.0, 35.0, 43.0, 46.0, 40.0, 41.0, 44.0, 33.0, 30.0, 21.0, 27.0, 22.0, 14.0, 23.0, 17.0, 11.0, 11.0, 12.0, 7.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9267578125, -0.8947296142578125, -0.862701416015625, -0.8306732177734375, -0.79864501953125, -0.7666168212890625, -0.734588623046875, -0.7025604248046875, -0.6705322265625, -0.6385040283203125, -0.606475830078125, -0.5744476318359375, -0.54241943359375, -0.5103912353515625, -0.478363037109375, -0.4463348388671875, -0.414306640625, -0.3822784423828125, -0.350250244140625, -0.3182220458984375, -0.28619384765625, -0.2541656494140625, -0.222137451171875, -0.1901092529296875, -0.1580810546875, -0.1260528564453125, -0.094024658203125, -0.0619964599609375, -0.02996826171875, 0.0020599365234375, 0.034088134765625, 0.0661163330078125, 0.09814453125, 0.1301727294921875, 0.162200927734375, 0.1942291259765625, 0.22625732421875, 0.2582855224609375, 0.290313720703125, 0.3223419189453125, 0.3543701171875, 0.3863983154296875, 0.418426513671875, 0.4504547119140625, 0.48248291015625, 0.5145111083984375, 0.546539306640625, 0.5785675048828125, 0.610595703125, 0.6426239013671875, 0.674652099609375, 0.7066802978515625, 0.73870849609375, 0.7707366943359375, 0.802764892578125, 0.8347930908203125, 0.8668212890625, 0.8988494873046875, 0.930877685546875, 0.9629058837890625, 0.99493408203125, 1.0269622802734375, 1.058990478515625, 1.0910186767578125, 1.123046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 12.0, 25.0, 19.0, 35.0, 55.0, 90.0, 132.0, 199.0, 308.0, 484.0, 722.0, 1218.0, 1800.0, 3005.0, 4722.0, 7521.0, 12135.0, 21398.0, 55846.0, 1219662.0, 664883.0, 50919.0, 20906.0, 11791.0, 7117.0, 4359.0, 2658.0, 1870.0, 1143.0, 735.0, 458.0, 338.0, 187.0, 123.0, 73.0, 40.0, 38.0, 30.0, 23.0, 9.0, 6.0, 7.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.40045166015625, -0.3883056640625, -0.37615966796875, -0.364013671875, -0.35186767578125, -0.3397216796875, -0.32757568359375, -0.3154296875, -0.30328369140625, -0.2911376953125, -0.27899169921875, -0.266845703125, -0.25469970703125, -0.2425537109375, -0.23040771484375, -0.21826171875, -0.20611572265625, -0.1939697265625, -0.18182373046875, -0.169677734375, -0.15753173828125, -0.1453857421875, -0.13323974609375, -0.12109375, -0.10894775390625, -0.0968017578125, -0.08465576171875, -0.072509765625, -0.06036376953125, -0.0482177734375, -0.03607177734375, -0.02392578125, -0.01177978515625, 0.0003662109375, 0.01251220703125, 0.024658203125, 0.03680419921875, 0.0489501953125, 0.06109619140625, 0.0732421875, 0.08538818359375, 0.0975341796875, 0.10968017578125, 0.121826171875, 0.13397216796875, 0.1461181640625, 0.15826416015625, 0.17041015625, 0.18255615234375, 0.1947021484375, 0.20684814453125, 0.218994140625, 0.23114013671875, 0.2432861328125, 0.25543212890625, 0.267578125, 0.27972412109375, 0.2918701171875, 0.30401611328125, 0.316162109375, 0.32830810546875, 0.3404541015625, 0.35260009765625, 0.36474609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 2.0, 7.0, 3.0, 7.0, 5.0, 20.0, 23.0, 29.0, 39.0, 40.0, 55.0, 66.0, 85.0, 71.0, 83.0, 96.0, 63.0, 62.0, 52.0, 40.0, 29.0, 25.0, 19.0, 19.0, 15.0, 11.0, 5.0, 3.0, 7.0, 7.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02166748046875, -0.020815372467041016, -0.01996326446533203, -0.019111156463623047, -0.018259048461914062, -0.017406940460205078, -0.016554832458496094, -0.01570272445678711, -0.014850616455078125, -0.01399850845336914, -0.013146400451660156, -0.012294292449951172, -0.011442184448242188, -0.010590076446533203, -0.009737968444824219, -0.008885860443115234, -0.00803375244140625, -0.007181644439697266, -0.006329536437988281, -0.005477428436279297, -0.0046253204345703125, -0.003773212432861328, -0.0029211044311523438, -0.0020689964294433594, -0.001216888427734375, -0.0003647804260253906, 0.00048732757568359375, 0.0013394355773925781, 0.0021915435791015625, 0.003043651580810547, 0.0038957595825195312, 0.004747867584228516, 0.0055999755859375, 0.006452083587646484, 0.007304191589355469, 0.008156299591064453, 0.009008407592773438, 0.009860515594482422, 0.010712623596191406, 0.01156473159790039, 0.012416839599609375, 0.01326894760131836, 0.014121055603027344, 0.014973163604736328, 0.015825271606445312, 0.016677379608154297, 0.01752948760986328, 0.018381595611572266, 0.01923370361328125, 0.020085811614990234, 0.02093791961669922, 0.021790027618408203, 0.022642135620117188, 0.023494243621826172, 0.024346351623535156, 0.02519845962524414, 0.026050567626953125, 0.02690267562866211, 0.027754783630371094, 0.028606891632080078, 0.029458999633789062, 0.030311107635498047, 0.03116321563720703, 0.032015323638916016, 0.032867431640625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 10.0, 23.0, 16.0, 27.0, 39.0, 45.0, 67.0, 101.0, 139.0, 189.0, 399.0, 897.0, 5459.0, 875027.0, 161761.0, 2780.0, 620.0, 299.0, 201.0, 114.0, 83.0, 73.0, 47.0, 23.0, 14.0, 13.0, 16.0, 16.0, 7.0, 4.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0], "bins": [-0.54931640625, -0.5355339050292969, -0.5217514038085938, -0.5079689025878906, -0.4941864013671875, -0.4804039001464844, -0.46662139892578125, -0.4528388977050781, -0.439056396484375, -0.4252738952636719, -0.41149139404296875, -0.3977088928222656, -0.3839263916015625, -0.3701438903808594, -0.35636138916015625, -0.3425788879394531, -0.32879638671875, -0.3150138854980469, -0.30123138427734375, -0.2874488830566406, -0.2736663818359375, -0.2598838806152344, -0.24610137939453125, -0.23231887817382812, -0.218536376953125, -0.20475387573242188, -0.19097137451171875, -0.17718887329101562, -0.1634063720703125, -0.14962387084960938, -0.13584136962890625, -0.12205886840820312, -0.1082763671875, -0.09449386596679688, -0.08071136474609375, -0.06692886352539062, -0.0531463623046875, -0.039363861083984375, -0.02558135986328125, -0.011798858642578125, 0.001983642578125, 0.015766143798828125, 0.02954864501953125, 0.043331146240234375, 0.0571136474609375, 0.07089614868164062, 0.08467864990234375, 0.09846115112304688, 0.11224365234375, 0.12602615356445312, 0.13980865478515625, 0.15359115600585938, 0.1673736572265625, 0.18115615844726562, 0.19493865966796875, 0.20872116088867188, 0.222503662109375, 0.23628616333007812, 0.25006866455078125, 0.2638511657714844, 0.2776336669921875, 0.2914161682128906, 0.30519866943359375, 0.3189811706542969, 0.332763671875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 20.0, 48.0, 93.0, 231.0, 281.0, 163.0, 85.0, 32.0, 20.0, 10.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.09890901297330856, -0.09705847501754761, -0.09520793706178665, -0.0933573916554451, -0.09150685369968414, -0.08965631574392319, -0.08780577778816223, -0.08595523238182068, -0.08410469442605972, -0.08225415647029877, -0.08040361851453781, -0.07855307310819626, -0.0767025351524353, -0.07485199719667435, -0.07300145924091339, -0.07115091383457184, -0.06930038332939148, -0.06744984537363052, -0.06559930741786957, -0.06374876201152802, -0.06189822405576706, -0.060047686100006104, -0.05819714814424515, -0.05634660646319389, -0.05449606478214264, -0.05264552682638168, -0.05079498514533043, -0.04894444718956947, -0.04709390550851822, -0.04524336755275726, -0.04339282959699631, -0.04154228791594505, -0.0396917499601841, -0.03784121200442314, -0.03599067032337189, -0.03414013236761093, -0.03228959068655968, -0.03043905273079872, -0.028588512912392616, -0.02673797309398651, -0.024887433275580406, -0.0230368934571743, -0.021186353638768196, -0.01933581382036209, -0.017485275864601135, -0.01563473418354988, -0.013784196227788925, -0.01193365640938282, -0.010083116590976715, -0.00823257677257061, -0.006382037419825792, -0.004531498067080975, -0.0026809582486748695, -0.0008304184302687645, 0.001020120456814766, 0.002870660275220871, 0.004721200093626976, 0.006571739912033081, 0.008422279730439186, 0.010272818617522717, 0.012123358435928822, 0.013973898254334927, 0.015824437141418457, 0.017674976959824562, 0.019525516778230667]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 2.0, 8.0, 9.0, 5.0, 8.0, 10.0, 14.0, 17.0, 17.0, 20.0, 18.0, 18.0, 26.0, 25.0, 36.0, 44.0, 34.0, 40.0, 41.0, 37.0, 41.0, 36.0, 47.0, 32.0, 37.0, 35.0, 34.0, 24.0, 34.0, 25.0, 25.0, 22.0, 25.0, 16.0, 24.0, 20.0, 15.0, 17.0, 14.0, 8.0, 8.0, 9.0, 7.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017521142959594727, -0.016970328986644745, -0.016419516876339912, -0.01586870476603508, -0.015317890793085098, -0.014767077751457691, -0.014216264709830284, -0.013665451668202877, -0.01311463862657547, -0.012563825584948063, -0.012013012543320656, -0.011462199501693249, -0.010911386460065842, -0.010360573418438435, -0.009809760376811028, -0.00925894733518362, -0.008708134293556213, -0.008157321251928806, -0.007606508210301399, -0.007055695168673992, -0.006504882127046585, -0.005954069085419178, -0.005403256043791771, -0.004852443002164364, -0.004301629960536957, -0.0037508169189095497, -0.0032000038772821426, -0.0026491908356547356, -0.0020983777940273285, -0.0015475647523999214, -0.0009967517107725143, -0.00044593866914510727, 0.0001048743724822998, 0.0006556874141097069, 0.001206500455737114, 0.001757313497364521, 0.002308126538991928, 0.002858939580619335, 0.0034097526222467422, 0.003960565663874149, 0.004511378705501556, 0.0050621917471289635, 0.0056130047887563705, 0.006163817830383778, 0.006714630872011185, 0.007265443913638592, 0.007816256955265999, 0.008367069996893406, 0.008917883038520813, 0.00946869608014822, 0.010019509121775627, 0.010570322163403034, 0.011121135205030441, 0.011671948246657848, 0.012222761288285255, 0.012773574329912663, 0.01332438737154007, 0.013875200413167477, 0.014426013454794884, 0.01497682649642229, 0.015527639538049698, 0.01607845351099968, 0.016629265621304512, 0.017180077731609344, 0.017730891704559326]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 8.0, 12.0, 10.0, 15.0, 15.0, 10.0, 19.0, 14.0, 26.0, 31.0, 20.0, 31.0, 42.0, 35.0, 27.0, 39.0, 42.0, 32.0, 29.0, 22.0, 43.0, 39.0, 34.0, 42.0, 29.0, 35.0, 40.0, 23.0, 23.0, 19.0, 17.0, 32.0, 10.0, 21.0, 16.0, 12.0, 12.0, 7.0, 8.0, 8.0, 10.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.34375, -1.302459716796875, -1.26116943359375, -1.219879150390625, -1.1785888671875, -1.137298583984375, -1.09600830078125, -1.054718017578125, -1.013427734375, -0.972137451171875, -0.93084716796875, -0.889556884765625, -0.8482666015625, -0.806976318359375, -0.76568603515625, -0.724395751953125, -0.68310546875, -0.641815185546875, -0.60052490234375, -0.559234619140625, -0.5179443359375, -0.476654052734375, -0.43536376953125, -0.394073486328125, -0.352783203125, -0.311492919921875, -0.27020263671875, -0.228912353515625, -0.1876220703125, -0.146331787109375, -0.10504150390625, -0.063751220703125, -0.0224609375, 0.018829345703125, 0.06011962890625, 0.101409912109375, 0.1427001953125, 0.183990478515625, 0.22528076171875, 0.266571044921875, 0.307861328125, 0.349151611328125, 0.39044189453125, 0.431732177734375, 0.4730224609375, 0.514312744140625, 0.55560302734375, 0.596893310546875, 0.63818359375, 0.679473876953125, 0.72076416015625, 0.762054443359375, 0.8033447265625, 0.844635009765625, 0.88592529296875, 0.927215576171875, 0.968505859375, 1.009796142578125, 1.05108642578125, 1.092376708984375, 1.1336669921875, 1.174957275390625, 1.21624755859375, 1.257537841796875, 1.298828125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 10.0, 4.0, 12.0, 9.0, 17.0, 25.0, 33.0, 52.0, 72.0, 76.0, 110.0, 158.0, 238.0, 363.0, 531.0, 873.0, 1471.0, 2584.0, 5193.0, 11319.0, 29042.0, 96421.0, 354947.0, 381468.0, 107520.0, 31365.0, 12149.0, 5406.0, 2818.0, 1540.0, 926.0, 643.0, 348.0, 233.0, 166.0, 100.0, 85.0, 50.0, 37.0, 36.0, 23.0, 21.0, 13.0, 9.0, 9.0, 8.0, 4.0, 4.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.708740234375, -1.65185546875, -1.594970703125, -1.5380859375, -1.481201171875, -1.42431640625, -1.367431640625, -1.310546875, -1.253662109375, -1.19677734375, -1.139892578125, -1.0830078125, -1.026123046875, -0.96923828125, -0.912353515625, -0.85546875, -0.798583984375, -0.74169921875, -0.684814453125, -0.6279296875, -0.571044921875, -0.51416015625, -0.457275390625, -0.400390625, -0.343505859375, -0.28662109375, -0.229736328125, -0.1728515625, -0.115966796875, -0.05908203125, -0.002197265625, 0.0546875, 0.111572265625, 0.16845703125, 0.225341796875, 0.2822265625, 0.339111328125, 0.39599609375, 0.452880859375, 0.509765625, 0.566650390625, 0.62353515625, 0.680419921875, 0.7373046875, 0.794189453125, 0.85107421875, 0.907958984375, 0.96484375, 1.021728515625, 1.07861328125, 1.135498046875, 1.1923828125, 1.249267578125, 1.30615234375, 1.363037109375, 1.419921875, 1.476806640625, 1.53369140625, 1.590576171875, 1.6474609375, 1.704345703125, 1.76123046875, 1.818115234375, 1.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 14.0, 26.0, 19.0, 37.0, 44.0, 49.0, 61.0, 71.0, 77.0, 164.0, 1506.0, 409.0, 165.0, 90.0, 61.0, 46.0, 37.0, 24.0, 25.0, 25.0, 13.0, 17.0, 6.0, 9.0, 9.0, 3.0, 6.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.43359375, -5.2685546875, -5.103515625, -4.9384765625, -4.7734375, -4.6083984375, -4.443359375, -4.2783203125, -4.11328125, -3.9482421875, -3.783203125, -3.6181640625, -3.453125, -3.2880859375, -3.123046875, -2.9580078125, -2.79296875, -2.6279296875, -2.462890625, -2.2978515625, -2.1328125, -1.9677734375, -1.802734375, -1.6376953125, -1.47265625, -1.3076171875, -1.142578125, -0.9775390625, -0.8125, -0.6474609375, -0.482421875, -0.3173828125, -0.15234375, 0.0126953125, 0.177734375, 0.3427734375, 0.5078125, 0.6728515625, 0.837890625, 1.0029296875, 1.16796875, 1.3330078125, 1.498046875, 1.6630859375, 1.828125, 1.9931640625, 2.158203125, 2.3232421875, 2.48828125, 2.6533203125, 2.818359375, 2.9833984375, 3.1484375, 3.3134765625, 3.478515625, 3.6435546875, 3.80859375, 3.9736328125, 4.138671875, 4.3037109375, 4.46875, 4.6337890625, 4.798828125, 4.9638671875, 5.12890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 6.0, 10.0, 14.0, 9.0, 13.0, 18.0, 25.0, 34.0, 50.0, 77.0, 81.0, 151.0, 197.0, 416.0, 1237.0, 11367.0, 3064622.0, 63747.0, 2163.0, 593.0, 310.0, 154.0, 104.0, 74.0, 68.0, 50.0, 34.0, 23.0, 9.0, 12.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.4375, -8.171142578125, -7.90478515625, -7.638427734375, -7.3720703125, -7.105712890625, -6.83935546875, -6.572998046875, -6.306640625, -6.040283203125, -5.77392578125, -5.507568359375, -5.2412109375, -4.974853515625, -4.70849609375, -4.442138671875, -4.17578125, -3.909423828125, -3.64306640625, -3.376708984375, -3.1103515625, -2.843994140625, -2.57763671875, -2.311279296875, -2.044921875, -1.778564453125, -1.51220703125, -1.245849609375, -0.9794921875, -0.713134765625, -0.44677734375, -0.180419921875, 0.0859375, 0.352294921875, 0.61865234375, 0.885009765625, 1.1513671875, 1.417724609375, 1.68408203125, 1.950439453125, 2.216796875, 2.483154296875, 2.74951171875, 3.015869140625, 3.2822265625, 3.548583984375, 3.81494140625, 4.081298828125, 4.34765625, 4.614013671875, 4.88037109375, 5.146728515625, 5.4130859375, 5.679443359375, 5.94580078125, 6.212158203125, 6.478515625, 6.744873046875, 7.01123046875, 7.277587890625, 7.5439453125, 7.810302734375, 8.07666015625, 8.343017578125, 8.609375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 530.0, 480.0], "bins": [-170.3904571533203, -167.68580627441406, -164.98114013671875, -162.2764892578125, -159.57183837890625, -156.86717224121094, -154.1625213623047, -151.45787048339844, -148.75320434570312, -146.04855346679688, -143.34388732910156, -140.6392364501953, -137.93458557128906, -135.22991943359375, -132.5252685546875, -129.82061767578125, -127.11595916748047, -124.41130065917969, -121.70664978027344, -119.00199127197266, -116.29733276367188, -113.59268188476562, -110.88802337646484, -108.18336486816406, -105.47871398925781, -102.77405548095703, -100.06940460205078, -97.36474609375, -94.66008758544922, -91.95542907714844, -89.25077819824219, -86.5461196899414, -83.8414535522461, -81.13679504394531, -78.43214416503906, -75.72748565673828, -73.0228271484375, -70.31817626953125, -67.61351776123047, -64.90885925292969, -62.20420455932617, -59.499549865722656, -56.794891357421875, -54.09023666381836, -51.385581970214844, -48.68092346191406, -45.97626876831055, -43.27161407470703, -40.56695556640625, -37.862300872802734, -35.15764236450195, -32.45298767089844, -29.74833106994629, -27.04367446899414, -24.339019775390625, -21.634363174438477, -18.929706573486328, -16.22504997253418, -13.520394325256348, -10.815738677978516, -8.111082077026367, -5.406425476074219, -2.701770782470703, 0.0028858184814453125, 2.7075419425964355]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 11.0, 14.0, 15.0, 18.0, 36.0, 28.0, 32.0, 44.0, 51.0, 44.0, 54.0, 46.0, 59.0, 66.0, 54.0, 67.0, 49.0, 52.0, 41.0, 40.0, 50.0, 19.0, 21.0, 19.0, 22.0, 6.0, 9.0, 4.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.213035583496094, -14.82083797454834, -14.42863941192627, -14.036441802978516, -13.644243240356445, -13.252045631408691, -12.859847068786621, -12.467649459838867, -12.075450897216797, -11.683253288269043, -11.291054725646973, -10.898857116699219, -10.506658554077148, -10.114460945129395, -9.722262382507324, -9.33006477355957, -8.9378662109375, -8.545668601989746, -8.153470039367676, -7.761271953582764, -7.369073867797852, -6.9768757820129395, -6.584677696228027, -6.192480087280273, -5.8002824783325195, -5.408084392547607, -5.015886306762695, -4.623688220977783, -4.231490135192871, -3.839292049407959, -3.447094202041626, -3.054896116256714, -2.6626977920532227, -2.2704997062683105, -1.8783016204833984, -1.4861036539077759, -1.0939055681228638, -0.7017074823379517, -0.3095095157623291, 0.08268857002258301, 0.4748866558074951, 0.8670847415924072, 1.2592828273773193, 1.651480793952942, 2.0436787605285645, 2.4358768463134766, 2.8280749320983887, 3.220273017883301, 3.612471103668213, 4.004669189453125, 4.396867275238037, 4.789065361022949, 5.181263446807861, 5.573461532592773, 5.965659141540527, 6.357857704162598, 6.750055313110352, 7.142253398895264, 7.534451484680176, 7.926649570465088, 8.31884765625, 8.711045265197754, 9.103243827819824, 9.495441436767578, 9.887639999389648]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 2.0, 8.0, 10.0, 9.0, 13.0, 16.0, 20.0, 25.0, 23.0, 33.0, 34.0, 31.0, 32.0, 37.0, 42.0, 42.0, 43.0, 41.0, 35.0, 35.0, 45.0, 42.0, 44.0, 47.0, 46.0, 31.0, 42.0, 28.0, 27.0, 20.0, 14.0, 20.0, 13.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.752838134765625, -1.69903564453125, -1.645233154296875, -1.5914306640625, -1.537628173828125, -1.48382568359375, -1.430023193359375, -1.376220703125, -1.322418212890625, -1.26861572265625, -1.214813232421875, -1.1610107421875, -1.107208251953125, -1.05340576171875, -0.999603271484375, -0.94580078125, -0.891998291015625, -0.83819580078125, -0.784393310546875, -0.7305908203125, -0.676788330078125, -0.62298583984375, -0.569183349609375, -0.515380859375, -0.461578369140625, -0.40777587890625, -0.353973388671875, -0.3001708984375, -0.246368408203125, -0.19256591796875, -0.138763427734375, -0.0849609375, -0.031158447265625, 0.02264404296875, 0.076446533203125, 0.1302490234375, 0.184051513671875, 0.23785400390625, 0.291656494140625, 0.345458984375, 0.399261474609375, 0.45306396484375, 0.506866455078125, 0.5606689453125, 0.614471435546875, 0.66827392578125, 0.722076416015625, 0.77587890625, 0.829681396484375, 0.88348388671875, 0.937286376953125, 0.9910888671875, 1.044891357421875, 1.09869384765625, 1.152496337890625, 1.206298828125, 1.260101318359375, 1.31390380859375, 1.367706298828125, 1.4215087890625, 1.475311279296875, 1.52911376953125, 1.582916259765625, 1.63671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 8.0, 9.0, 15.0, 24.0, 33.0, 45.0, 62.0, 91.0, 115.0, 175.0, 278.0, 388.0, 660.0, 1099.0, 2350.0, 6588.0, 27755.0, 328664.0, 3400779.0, 383013.0, 29708.0, 7011.0, 2345.0, 1183.0, 616.0, 423.0, 260.0, 163.0, 115.0, 85.0, 61.0, 47.0, 31.0, 23.0, 16.0, 11.0, 3.0, 5.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.94940185546875, -7.7191162109375, -7.48883056640625, -7.258544921875, -7.02825927734375, -6.7979736328125, -6.56768798828125, -6.33740234375, -6.10711669921875, -5.8768310546875, -5.64654541015625, -5.416259765625, -5.18597412109375, -4.9556884765625, -4.72540283203125, -4.4951171875, -4.26483154296875, -4.0345458984375, -3.80426025390625, -3.573974609375, -3.34368896484375, -3.1134033203125, -2.88311767578125, -2.65283203125, -2.42254638671875, -2.1922607421875, -1.96197509765625, -1.731689453125, -1.50140380859375, -1.2711181640625, -1.04083251953125, -0.810546875, -0.58026123046875, -0.3499755859375, -0.11968994140625, 0.110595703125, 0.34088134765625, 0.5711669921875, 0.80145263671875, 1.03173828125, 1.26202392578125, 1.4923095703125, 1.72259521484375, 1.952880859375, 2.18316650390625, 2.4134521484375, 2.64373779296875, 2.8740234375, 3.10430908203125, 3.3345947265625, 3.56488037109375, 3.795166015625, 4.02545166015625, 4.2557373046875, 4.48602294921875, 4.71630859375, 4.94659423828125, 5.1768798828125, 5.40716552734375, 5.637451171875, 5.86773681640625, 6.0980224609375, 6.32830810546875, 6.55859375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 19.0, 24.0, 40.0, 43.0, 91.0, 100.0, 184.0, 263.0, 381.0, 599.0, 600.0, 468.0, 407.0, 271.0, 197.0, 128.0, 86.0, 60.0, 32.0, 30.0, 15.0, 6.0, 8.0, 8.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.6680908203125, -3.543212890625, -3.4183349609375, -3.29345703125, -3.1685791015625, -3.043701171875, -2.9188232421875, -2.7939453125, -2.6690673828125, -2.544189453125, -2.4193115234375, -2.29443359375, -2.1695556640625, -2.044677734375, -1.9197998046875, -1.794921875, -1.6700439453125, -1.545166015625, -1.4202880859375, -1.29541015625, -1.1705322265625, -1.045654296875, -0.9207763671875, -0.7958984375, -0.6710205078125, -0.546142578125, -0.4212646484375, -0.29638671875, -0.1715087890625, -0.046630859375, 0.0782470703125, 0.203125, 0.3280029296875, 0.452880859375, 0.5777587890625, 0.70263671875, 0.8275146484375, 0.952392578125, 1.0772705078125, 1.2021484375, 1.3270263671875, 1.451904296875, 1.5767822265625, 1.70166015625, 1.8265380859375, 1.951416015625, 2.0762939453125, 2.201171875, 2.3260498046875, 2.450927734375, 2.5758056640625, 2.70068359375, 2.8255615234375, 2.950439453125, 3.0753173828125, 3.2001953125, 3.3250732421875, 3.449951171875, 3.5748291015625, 3.69970703125, 3.8245849609375, 3.949462890625, 4.0743408203125, 4.19921875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 7.0, 14.0, 32.0, 51.0, 129.0, 245.0, 597.0, 1556.0, 4099.0, 13643.0, 54366.0, 322248.0, 2344646.0, 1253447.0, 154655.0, 30975.0, 8753.0, 2828.0, 1077.0, 466.0, 204.0, 121.0, 42.0, 35.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.804779052734375, -2.68182373046875, -2.558868408203125, -2.4359130859375, -2.312957763671875, -2.19000244140625, -2.067047119140625, -1.944091796875, -1.821136474609375, -1.69818115234375, -1.575225830078125, -1.4522705078125, -1.329315185546875, -1.20635986328125, -1.083404541015625, -0.96044921875, -0.837493896484375, -0.71453857421875, -0.591583251953125, -0.4686279296875, -0.345672607421875, -0.22271728515625, -0.099761962890625, 0.023193359375, 0.146148681640625, 0.26910400390625, 0.392059326171875, 0.5150146484375, 0.637969970703125, 0.76092529296875, 0.883880615234375, 1.0068359375, 1.129791259765625, 1.25274658203125, 1.375701904296875, 1.4986572265625, 1.621612548828125, 1.74456787109375, 1.867523193359375, 1.990478515625, 2.113433837890625, 2.23638916015625, 2.359344482421875, 2.4822998046875, 2.605255126953125, 2.72821044921875, 2.851165771484375, 2.97412109375, 3.097076416015625, 3.22003173828125, 3.342987060546875, 3.4659423828125, 3.588897705078125, 3.71185302734375, 3.834808349609375, 3.957763671875, 4.080718994140625, 4.20367431640625, 4.326629638671875, 4.4495849609375, 4.572540283203125, 4.69549560546875, 4.818450927734375, 4.94140625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 16.0, 23.0, 27.0, 36.0, 34.0, 44.0, 60.0, 63.0, 61.0, 72.0, 57.0, 86.0, 59.0, 59.0, 58.0, 41.0, 26.0, 31.0, 35.0, 11.0, 20.0, 13.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.702457427978516, -19.16834259033203, -18.63422966003418, -18.100114822387695, -17.56599998474121, -17.03188705444336, -16.497772216796875, -15.96365737915039, -15.429543495178223, -14.895429611206055, -14.36131477355957, -13.827200889587402, -13.293087005615234, -12.75897216796875, -12.224858283996582, -11.690744400024414, -11.15662956237793, -10.622515678405762, -10.088400840759277, -9.55428695678711, -9.020172119140625, -8.486058235168457, -7.951944351196289, -7.417829990386963, -6.883715629577637, -6.3496012687683105, -5.815486907958984, -5.281373023986816, -4.74725866317749, -4.213144302368164, -3.679030179977417, -3.14491605758667, -2.6108016967773438, -2.0766873359680176, -1.5425732135772705, -1.0084589719772339, -0.47434473037719727, 0.059769630432128906, 0.593883752822876, 1.127997875213623, 1.6621122360229492, 2.1962265968322754, 2.7303407192230225, 3.2644548416137695, 3.7985692024230957, 4.332683563232422, 4.86679744720459, 5.400911808013916, 5.935026168823242, 6.469140529632568, 7.0032548904418945, 7.5373687744140625, 8.071483612060547, 8.605597496032715, 9.139711380004883, 9.673826217651367, 10.207940101623535, 10.742053985595703, 11.276168823242188, 11.810282707214355, 12.344396591186523, 12.878511428833008, 13.412625312805176, 13.946739196777344, 14.480854034423828]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 12.0, 6.0, 1.0, 9.0, 14.0, 13.0, 11.0, 15.0, 12.0, 20.0, 20.0, 23.0, 26.0, 40.0, 31.0, 32.0, 29.0, 31.0, 34.0, 42.0, 31.0, 41.0, 40.0, 41.0, 41.0, 27.0, 37.0, 33.0, 35.0, 39.0, 38.0, 26.0, 23.0, 24.0, 18.0, 16.0, 7.0, 10.0, 12.0, 8.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.171516418457031, -11.80154800415039, -11.431578636169434, -11.061610221862793, -10.691641807556152, -10.321672439575195, -9.951704025268555, -9.581735610961914, -9.211767196655273, -8.841798782348633, -8.471829414367676, -8.101861000061035, -7.7318925857543945, -7.361923694610596, -6.991954803466797, -6.621986389160156, -6.252017021179199, -5.8820481300354, -5.51207971572876, -5.142110824584961, -4.77214241027832, -4.4021735191345215, -4.032204627990723, -3.662235975265503, -3.292267322540283, -2.9222986698150635, -2.5523300170898438, -2.182361125946045, -1.8123924732208252, -1.4424238204956055, -1.0724549293518066, -0.7024862766265869, -0.3325166702270508, 0.03745204210281372, 0.4074207544326782, 0.7773895263671875, 1.1473581790924072, 1.517326831817627, 1.8872957229614258, 2.2572643756866455, 2.6272330284118652, 2.997201681137085, 3.3671703338623047, 3.7371392250061035, 4.107108116149902, 4.477076530456543, 4.847045421600342, 5.217014312744141, 5.586982727050781, 5.95695161819458, 6.326920032501221, 6.6968889236450195, 7.06685733795166, 7.436826229095459, 7.806795120239258, 8.176763534545898, 8.546731948852539, 8.91670036315918, 9.286669731140137, 9.656638145446777, 10.026606559753418, 10.396575927734375, 10.766544342041016, 11.136512756347656, 11.506482124328613]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 8.0, 6.0, 9.0, 16.0, 12.0, 20.0, 20.0, 22.0, 28.0, 43.0, 37.0, 28.0, 38.0, 49.0, 35.0, 44.0, 48.0, 43.0, 58.0, 38.0, 55.0, 41.0, 39.0, 33.0, 31.0, 22.0, 23.0, 27.0, 23.0, 18.0, 14.0, 10.0, 11.0, 5.0, 9.0, 4.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-31.015625, -30.175048828125, -29.33447265625, -28.493896484375, -27.6533203125, -26.812744140625, -25.97216796875, -25.131591796875, -24.291015625, -23.450439453125, -22.60986328125, -21.769287109375, -20.9287109375, -20.088134765625, -19.24755859375, -18.406982421875, -17.56640625, -16.725830078125, -15.88525390625, -15.044677734375, -14.2041015625, -13.363525390625, -12.52294921875, -11.682373046875, -10.841796875, -10.001220703125, -9.16064453125, -8.320068359375, -7.4794921875, -6.638916015625, -5.79833984375, -4.957763671875, -4.1171875, -3.276611328125, -2.43603515625, -1.595458984375, -0.7548828125, 0.085693359375, 0.92626953125, 1.766845703125, 2.607421875, 3.447998046875, 4.28857421875, 5.129150390625, 5.9697265625, 6.810302734375, 7.65087890625, 8.491455078125, 9.33203125, 10.172607421875, 11.01318359375, 11.853759765625, 12.6943359375, 13.534912109375, 14.37548828125, 15.216064453125, 16.056640625, 16.897216796875, 17.73779296875, 18.578369140625, 19.4189453125, 20.259521484375, 21.10009765625, 21.940673828125, 22.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 10.0, 9.0, 11.0, 12.0, 17.0, 41.0, 63.0, 72.0, 130.0, 177.0, 273.0, 407.0, 629.0, 930.0, 1510.0, 2234.0, 3338.0, 5154.0, 7985.0, 12388.0, 19069.0, 30234.0, 47968.0, 74778.0, 112496.0, 151490.0, 165353.0, 137808.0, 97445.0, 63699.0, 40724.0, 25538.0, 16386.0, 10447.0, 6756.0, 4403.0, 2902.0, 1867.0, 1242.0, 869.0, 586.0, 347.0, 240.0, 198.0, 119.0, 69.0, 53.0, 31.0, 17.0, 12.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.8369140625, -1.78338623046875, -1.7298583984375, -1.67633056640625, -1.622802734375, -1.56927490234375, -1.5157470703125, -1.46221923828125, -1.40869140625, -1.35516357421875, -1.3016357421875, -1.24810791015625, -1.194580078125, -1.14105224609375, -1.0875244140625, -1.03399658203125, -0.98046875, -0.92694091796875, -0.8734130859375, -0.81988525390625, -0.766357421875, -0.71282958984375, -0.6593017578125, -0.60577392578125, -0.55224609375, -0.49871826171875, -0.4451904296875, -0.39166259765625, -0.338134765625, -0.28460693359375, -0.2310791015625, -0.17755126953125, -0.1240234375, -0.07049560546875, -0.0169677734375, 0.03656005859375, 0.090087890625, 0.14361572265625, 0.1971435546875, 0.25067138671875, 0.30419921875, 0.35772705078125, 0.4112548828125, 0.46478271484375, 0.518310546875, 0.57183837890625, 0.6253662109375, 0.67889404296875, 0.732421875, 0.78594970703125, 0.8394775390625, 0.89300537109375, 0.946533203125, 1.00006103515625, 1.0535888671875, 1.10711669921875, 1.16064453125, 1.21417236328125, 1.2677001953125, 1.32122802734375, 1.374755859375, 1.42828369140625, 1.4818115234375, 1.53533935546875, 1.5888671875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 10.0, 9.0, 9.0, 8.0, 10.0, 16.0, 11.0, 30.0, 29.0, 18.0, 18.0, 36.0, 28.0, 26.0, 33.0, 40.0, 37.0, 24.0, 23.0, 36.0, 1065.0, 42.0, 39.0, 31.0, 35.0, 31.0, 32.0, 38.0, 30.0, 22.0, 33.0, 22.0, 18.0, 23.0, 17.0, 14.0, 12.0, 12.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-13.640625, -13.2186279296875, -12.796630859375, -12.3746337890625, -11.95263671875, -11.5306396484375, -11.108642578125, -10.6866455078125, -10.2646484375, -9.8426513671875, -9.420654296875, -8.9986572265625, -8.57666015625, -8.1546630859375, -7.732666015625, -7.3106689453125, -6.888671875, -6.4666748046875, -6.044677734375, -5.6226806640625, -5.20068359375, -4.7786865234375, -4.356689453125, -3.9346923828125, -3.5126953125, -3.0906982421875, -2.668701171875, -2.2467041015625, -1.82470703125, -1.4027099609375, -0.980712890625, -0.5587158203125, -0.13671875, 0.2852783203125, 0.707275390625, 1.1292724609375, 1.55126953125, 1.9732666015625, 2.395263671875, 2.8172607421875, 3.2392578125, 3.6612548828125, 4.083251953125, 4.5052490234375, 4.92724609375, 5.3492431640625, 5.771240234375, 6.1932373046875, 6.615234375, 7.0372314453125, 7.459228515625, 7.8812255859375, 8.30322265625, 8.7252197265625, 9.147216796875, 9.5692138671875, 9.9912109375, 10.4132080078125, 10.835205078125, 11.2572021484375, 11.67919921875, 12.1011962890625, 12.523193359375, 12.9451904296875, 13.3671875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 7.0, 6.0, 14.0, 20.0, 16.0, 29.0, 44.0, 69.0, 74.0, 138.0, 188.0, 270.0, 385.0, 653.0, 991.0, 1533.0, 2472.0, 3863.0, 6245.0, 10580.0, 18983.0, 45858.0, 314383.0, 1548948.0, 82211.0, 25604.0, 13085.0, 7601.0, 4680.0, 2909.0, 1818.0, 1140.0, 748.0, 480.0, 350.0, 207.0, 160.0, 116.0, 66.0, 36.0, 45.0, 32.0, 19.0, 9.0, 14.0, 4.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.58203125, -4.4302978515625, -4.278564453125, -4.1268310546875, -3.97509765625, -3.8233642578125, -3.671630859375, -3.5198974609375, -3.3681640625, -3.2164306640625, -3.064697265625, -2.9129638671875, -2.76123046875, -2.6094970703125, -2.457763671875, -2.3060302734375, -2.154296875, -2.0025634765625, -1.850830078125, -1.6990966796875, -1.54736328125, -1.3956298828125, -1.243896484375, -1.0921630859375, -0.9404296875, -0.7886962890625, -0.636962890625, -0.4852294921875, -0.33349609375, -0.1817626953125, -0.030029296875, 0.1217041015625, 0.2734375, 0.4251708984375, 0.576904296875, 0.7286376953125, 0.88037109375, 1.0321044921875, 1.183837890625, 1.3355712890625, 1.4873046875, 1.6390380859375, 1.790771484375, 1.9425048828125, 2.09423828125, 2.2459716796875, 2.397705078125, 2.5494384765625, 2.701171875, 2.8529052734375, 3.004638671875, 3.1563720703125, 3.30810546875, 3.4598388671875, 3.611572265625, 3.7633056640625, 3.9150390625, 4.0667724609375, 4.218505859375, 4.3702392578125, 4.52197265625, 4.6737060546875, 4.825439453125, 4.9771728515625, 5.12890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 10.0, 5.0, 4.0, 13.0, 9.0, 8.0, 9.0, 12.0, 17.0, 24.0, 34.0, 41.0, 39.0, 43.0, 48.0, 52.0, 47.0, 65.0, 66.0, 53.0, 42.0, 48.0, 42.0, 32.0, 26.0, 30.0, 31.0, 26.0, 19.0, 16.0, 22.0, 20.0, 4.0, 11.0, 5.0, 5.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08343219757080078, -0.08037757873535156, -0.07732295989990234, -0.07426834106445312, -0.0712137222290039, -0.06815910339355469, -0.06510448455810547, -0.06204986572265625, -0.05899524688720703, -0.05594062805175781, -0.052886009216308594, -0.049831390380859375, -0.046776771545410156, -0.04372215270996094, -0.04066753387451172, -0.0376129150390625, -0.03455829620361328, -0.03150367736816406, -0.028449058532714844, -0.025394439697265625, -0.022339820861816406, -0.019285202026367188, -0.01623058319091797, -0.01317596435546875, -0.010121345520019531, -0.0070667266845703125, -0.004012107849121094, -0.000957489013671875, 0.0020971298217773438, 0.0051517486572265625, 0.008206367492675781, 0.011260986328125, 0.014315605163574219, 0.017370223999023438, 0.020424842834472656, 0.023479461669921875, 0.026534080505371094, 0.029588699340820312, 0.03264331817626953, 0.03569793701171875, 0.03875255584716797, 0.04180717468261719, 0.044861793518066406, 0.047916412353515625, 0.050971031188964844, 0.05402565002441406, 0.05708026885986328, 0.0601348876953125, 0.06318950653076172, 0.06624412536621094, 0.06929874420166016, 0.07235336303710938, 0.0754079818725586, 0.07846260070800781, 0.08151721954345703, 0.08457183837890625, 0.08762645721435547, 0.09068107604980469, 0.0937356948852539, 0.09679031372070312, 0.09984493255615234, 0.10289955139160156, 0.10595417022705078, 0.1090087890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 9.0, 12.0, 10.0, 14.0, 24.0, 30.0, 53.0, 89.0, 113.0, 177.0, 262.0, 408.0, 684.0, 1125.0, 1955.0, 3639.0, 7301.0, 15691.0, 37372.0, 96569.0, 225756.0, 314631.0, 199950.0, 82753.0, 32128.0, 13594.0, 6390.0, 3280.0, 1743.0, 1012.0, 603.0, 400.0, 226.0, 182.0, 121.0, 75.0, 48.0, 35.0, 39.0, 20.0, 4.0, 10.0, 4.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4833984375, -0.46935272216796875, -0.4553070068359375, -0.44126129150390625, -0.427215576171875, -0.41316986083984375, -0.3991241455078125, -0.38507843017578125, -0.37103271484375, -0.35698699951171875, -0.3429412841796875, -0.32889556884765625, -0.314849853515625, -0.30080413818359375, -0.2867584228515625, -0.27271270751953125, -0.2586669921875, -0.24462127685546875, -0.2305755615234375, -0.21652984619140625, -0.202484130859375, -0.18843841552734375, -0.1743927001953125, -0.16034698486328125, -0.14630126953125, -0.13225555419921875, -0.1182098388671875, -0.10416412353515625, -0.090118408203125, -0.07607269287109375, -0.0620269775390625, -0.04798126220703125, -0.033935546875, -0.01988983154296875, -0.0058441162109375, 0.00820159912109375, 0.022247314453125, 0.03629302978515625, 0.0503387451171875, 0.06438446044921875, 0.07843017578125, 0.09247589111328125, 0.1065216064453125, 0.12056732177734375, 0.134613037109375, 0.14865875244140625, 0.1627044677734375, 0.17675018310546875, 0.1907958984375, 0.20484161376953125, 0.2188873291015625, 0.23293304443359375, 0.246978759765625, 0.26102447509765625, 0.2750701904296875, 0.28911590576171875, 0.30316162109375, 0.31720733642578125, 0.3312530517578125, 0.34529876708984375, 0.359344482421875, 0.37339019775390625, 0.3874359130859375, 0.40148162841796875, 0.41552734375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 3.0, 10.0, 13.0, 30.0, 22.0, 27.0, 52.0, 37.0, 62.0, 69.0, 67.0, 70.0, 71.0, 85.0, 71.0, 63.0, 50.0, 39.0, 37.0, 25.0, 13.0, 17.0, 15.0, 8.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11321540921926498, -0.10929177701473236, -0.10536813735961914, -0.10144450515508652, -0.0975208654999733, -0.09359723329544067, -0.08967359364032745, -0.08574996143579483, -0.08182632923126221, -0.07790269702672958, -0.07397905737161636, -0.07005542516708374, -0.06613178551197052, -0.0622081533074379, -0.058284517377614975, -0.05436088144779205, -0.05043724179267883, -0.04651360586285591, -0.04258996993303299, -0.038666337728500366, -0.034742698073387146, -0.030819064006209373, -0.0268954299390316, -0.02297179400920868, -0.019048158079385757, -0.015124522149562836, -0.011200887151062489, -0.007277252152562141, -0.0033536162227392197, 0.0005700197070837021, 0.004493653774261475, 0.008417289704084396, 0.012340933084487915, 0.016264569014310837, 0.02018820494413376, 0.02411183901131153, 0.028035474941134453, 0.031959109008312225, 0.03588274493813515, 0.03980638086795807, 0.04373001679778099, 0.04765365272760391, 0.051577288657426834, 0.055500924587249756, 0.05942455679178238, 0.0633481964468956, 0.06727182865142822, 0.07119546830654144, 0.07511910051107407, 0.07904273271560669, 0.08296637237071991, 0.08689000457525253, 0.09081364423036575, 0.09473727643489838, 0.0986609160900116, 0.10258454829454422, 0.10650818049907684, 0.11043181270360947, 0.11435545235872269, 0.11827908456325531, 0.12220272421836853, 0.12612636387348175, 0.13004998862743378, 0.133973628282547, 0.13789726793766022]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 10.0, 9.0, 18.0, 18.0, 26.0, 28.0, 20.0, 23.0, 24.0, 30.0, 39.0, 45.0, 50.0, 43.0, 48.0, 49.0, 48.0, 35.0, 30.0, 49.0, 40.0, 37.0, 29.0, 31.0, 31.0, 28.0, 20.0, 24.0, 18.0, 11.0, 19.0, 13.0, 6.0, 4.0, 9.0, 3.0, 1.0, 2.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08047318458557129, -0.07789602130651474, -0.07531885802745819, -0.07274169474840164, -0.07016453146934509, -0.06758736819028854, -0.065010204911232, -0.062433041632175446, -0.059855878353118896, -0.05727871507406235, -0.0547015517950058, -0.05212438851594925, -0.0495472252368927, -0.04697006195783615, -0.0443928986787796, -0.04181573539972305, -0.039238572120666504, -0.036661408841609955, -0.034084245562553406, -0.03150708228349686, -0.028929919004440308, -0.02635275572538376, -0.02377559244632721, -0.02119842916727066, -0.01862126588821411, -0.016044102609157562, -0.013466939330101013, -0.010889776051044464, -0.008312612771987915, -0.005735449492931366, -0.003158286213874817, -0.0005811229348182678, 0.0019960403442382812, 0.00457320362329483, 0.007150366902351379, 0.009727530181407928, 0.012304693460464478, 0.014881856739521027, 0.017459020018577576, 0.020036183297634125, 0.022613346576690674, 0.025190509855747223, 0.027767673134803772, 0.03034483641386032, 0.03292199969291687, 0.03549916297197342, 0.03807632625102997, 0.04065348953008652, 0.043230652809143066, 0.045807816088199615, 0.048384979367256165, 0.050962142646312714, 0.05353930592536926, 0.05611646920442581, 0.05869363248348236, 0.06127079576253891, 0.06384795904159546, 0.06642512232065201, 0.06900228559970856, 0.0715794488787651, 0.07415661215782166, 0.0767337754368782, 0.07931093871593475, 0.0818881019949913, 0.08446526527404785]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 12.0, 8.0, 7.0, 5.0, 20.0, 13.0, 20.0, 19.0, 23.0, 20.0, 29.0, 26.0, 24.0, 33.0, 34.0, 35.0, 47.0, 40.0, 48.0, 45.0, 34.0, 44.0, 47.0, 38.0, 36.0, 30.0, 27.0, 36.0, 18.0, 24.0, 30.0, 8.0, 24.0, 17.0, 10.0, 13.0, 6.0, 10.0, 11.0, 2.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.359375, -22.6142578125, -21.869140625, -21.1240234375, -20.37890625, -19.6337890625, -18.888671875, -18.1435546875, -17.3984375, -16.6533203125, -15.908203125, -15.1630859375, -14.41796875, -13.6728515625, -12.927734375, -12.1826171875, -11.4375, -10.6923828125, -9.947265625, -9.2021484375, -8.45703125, -7.7119140625, -6.966796875, -6.2216796875, -5.4765625, -4.7314453125, -3.986328125, -3.2412109375, -2.49609375, -1.7509765625, -1.005859375, -0.2607421875, 0.484375, 1.2294921875, 1.974609375, 2.7197265625, 3.46484375, 4.2099609375, 4.955078125, 5.7001953125, 6.4453125, 7.1904296875, 7.935546875, 8.6806640625, 9.42578125, 10.1708984375, 10.916015625, 11.6611328125, 12.40625, 13.1513671875, 13.896484375, 14.6416015625, 15.38671875, 16.1318359375, 16.876953125, 17.6220703125, 18.3671875, 19.1123046875, 19.857421875, 20.6025390625, 21.34765625, 22.0927734375, 22.837890625, 23.5830078125, 24.328125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 13.0, 9.0, 5.0, 13.0, 14.0, 21.0, 22.0, 21.0, 31.0, 26.0, 51.0, 90.0, 215.0, 533.0, 1847.0, 7481.0, 45061.0, 391356.0, 520457.0, 67634.0, 10045.0, 2255.0, 665.0, 265.0, 100.0, 55.0, 32.0, 29.0, 35.0, 20.0, 16.0, 15.0, 14.0, 18.0, 8.0, 10.0, 7.0, 10.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.35546875, -5.1885986328125, -5.021728515625, -4.8548583984375, -4.68798828125, -4.5211181640625, -4.354248046875, -4.1873779296875, -4.0205078125, -3.8536376953125, -3.686767578125, -3.5198974609375, -3.35302734375, -3.1861572265625, -3.019287109375, -2.8524169921875, -2.685546875, -2.5186767578125, -2.351806640625, -2.1849365234375, -2.01806640625, -1.8511962890625, -1.684326171875, -1.5174560546875, -1.3505859375, -1.1837158203125, -1.016845703125, -0.8499755859375, -0.68310546875, -0.5162353515625, -0.349365234375, -0.1824951171875, -0.015625, 0.1512451171875, 0.318115234375, 0.4849853515625, 0.65185546875, 0.8187255859375, 0.985595703125, 1.1524658203125, 1.3193359375, 1.4862060546875, 1.653076171875, 1.8199462890625, 1.98681640625, 2.1536865234375, 2.320556640625, 2.4874267578125, 2.654296875, 2.8211669921875, 2.988037109375, 3.1549072265625, 3.32177734375, 3.4886474609375, 3.655517578125, 3.8223876953125, 3.9892578125, 4.1561279296875, 4.322998046875, 4.4898681640625, 4.65673828125, 4.8236083984375, 4.990478515625, 5.1573486328125, 5.32421875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 10.0, 10.0, 19.0, 18.0, 31.0, 31.0, 35.0, 37.0, 58.0, 63.0, 84.0, 69.0, 2115.0, 68.0, 70.0, 47.0, 51.0, 42.0, 39.0, 40.0, 21.0, 23.0, 15.0, 10.0, 13.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.0, -47.52734375, -46.0546875, -44.58203125, -43.109375, -41.63671875, -40.1640625, -38.69140625, -37.21875, -35.74609375, -34.2734375, -32.80078125, -31.328125, -29.85546875, -28.3828125, -26.91015625, -25.4375, -23.96484375, -22.4921875, -21.01953125, -19.546875, -18.07421875, -16.6015625, -15.12890625, -13.65625, -12.18359375, -10.7109375, -9.23828125, -7.765625, -6.29296875, -4.8203125, -3.34765625, -1.875, -0.40234375, 1.0703125, 2.54296875, 4.015625, 5.48828125, 6.9609375, 8.43359375, 9.90625, 11.37890625, 12.8515625, 14.32421875, 15.796875, 17.26953125, 18.7421875, 20.21484375, 21.6875, 23.16015625, 24.6328125, 26.10546875, 27.578125, 29.05078125, 30.5234375, 31.99609375, 33.46875, 34.94140625, 36.4140625, 37.88671875, 39.359375, 40.83203125, 42.3046875, 43.77734375, 45.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 12.0, 15.0, 14.0, 20.0, 37.0, 48.0, 79.0, 127.0, 175.0, 241.0, 444.0, 822.0, 1618.0, 3763.0, 11599.0, 46541.0, 224188.0, 2600945.0, 196565.0, 41198.0, 10249.0, 3536.0, 1507.0, 775.0, 438.0, 243.0, 162.0, 101.0, 67.0, 54.0, 28.0, 16.0, 25.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.1640625, -3.072235107421875, -2.98040771484375, -2.888580322265625, -2.7967529296875, -2.704925537109375, -2.61309814453125, -2.521270751953125, -2.429443359375, -2.337615966796875, -2.24578857421875, -2.153961181640625, -2.0621337890625, -1.970306396484375, -1.87847900390625, -1.786651611328125, -1.69482421875, -1.602996826171875, -1.51116943359375, -1.419342041015625, -1.3275146484375, -1.235687255859375, -1.14385986328125, -1.052032470703125, -0.960205078125, -0.868377685546875, -0.77655029296875, -0.684722900390625, -0.5928955078125, -0.501068115234375, -0.40924072265625, -0.317413330078125, -0.2255859375, -0.133758544921875, -0.04193115234375, 0.049896240234375, 0.1417236328125, 0.233551025390625, 0.32537841796875, 0.417205810546875, 0.509033203125, 0.600860595703125, 0.69268798828125, 0.784515380859375, 0.8763427734375, 0.968170166015625, 1.05999755859375, 1.151824951171875, 1.24365234375, 1.335479736328125, 1.42730712890625, 1.519134521484375, 1.6109619140625, 1.702789306640625, 1.79461669921875, 1.886444091796875, 1.978271484375, 2.070098876953125, 2.16192626953125, 2.253753662109375, 2.3455810546875, 2.437408447265625, 2.52923583984375, 2.621063232421875, 2.712890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 7.0, 9.0, 20.0, 30.0, 51.0, 72.0, 110.0, 182.0, 145.0, 119.0, 75.0, 56.0, 40.0, 24.0, 13.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.18195343017578, -45.56523132324219, -43.948509216308594, -42.331787109375, -40.715065002441406, -39.09834289550781, -37.48162078857422, -35.864898681640625, -34.24817657470703, -32.63145446777344, -31.014732360839844, -29.39801025390625, -27.781288146972656, -26.164566040039062, -24.54784393310547, -22.931121826171875, -21.314401626586914, -19.69767951965332, -18.080957412719727, -16.464235305786133, -14.847513198852539, -13.230792045593262, -11.614069938659668, -9.997347831726074, -8.38062572479248, -6.763903617858887, -5.147181510925293, -3.5304598808288574, -1.9137377738952637, -0.2970161437988281, 1.3197059631347656, 2.9364280700683594, 4.553150177001953, 6.169872283935547, 7.786594390869141, 9.403316497802734, 11.020038604736328, 12.636759757995605, 14.2534818649292, 15.870203971862793, 17.486927032470703, 19.103649139404297, 20.72037124633789, 22.337093353271484, 23.953815460205078, 25.570537567138672, 27.187259674072266, 28.80398178100586, 30.42070198059082, 32.03742218017578, 33.654144287109375, 35.27086639404297, 36.88758850097656, 38.504310607910156, 40.12103271484375, 41.737754821777344, 43.35447692871094, 44.97119903564453, 46.587921142578125, 48.20464324951172, 49.82136535644531, 51.438087463378906, 53.0548095703125, 54.671531677246094, 56.28825378417969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 9.0, 6.0, 5.0, 10.0, 13.0, 16.0, 18.0, 15.0, 24.0, 23.0, 36.0, 24.0, 33.0, 31.0, 34.0, 44.0, 35.0, 44.0, 34.0, 47.0, 48.0, 45.0, 39.0, 45.0, 40.0, 25.0, 35.0, 38.0, 18.0, 23.0, 24.0, 15.0, 23.0, 12.0, 20.0, 12.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.71887969970703, -41.32689666748047, -39.934913635253906, -38.542930603027344, -37.15094757080078, -35.758968353271484, -34.36698532104492, -32.97500228881836, -31.583019256591797, -30.191036224365234, -28.799053192138672, -27.407072067260742, -26.01508903503418, -24.623106002807617, -23.231124877929688, -21.839141845703125, -20.447158813476562, -19.05517578125, -17.663192749023438, -16.271211624145508, -14.879228591918945, -13.487245559692383, -12.095263481140137, -10.70328140258789, -9.311298370361328, -7.919315814971924, -6.5273332595825195, -5.135350704193115, -3.743368148803711, -2.3513855934143066, -0.9594030380249023, 0.43257904052734375, 1.8245620727539062, 3.2165446281433105, 4.608527183532715, 6.000509738922119, 7.392492294311523, 8.784475326538086, 10.176457405090332, 11.568439483642578, 12.96042251586914, 14.352405548095703, 15.74438762664795, 17.136369705200195, 18.528352737426758, 19.92033576965332, 21.31231689453125, 22.704299926757812, 24.096282958984375, 25.488265991210938, 26.8802490234375, 28.27223014831543, 29.664213180541992, 31.056196212768555, 32.448177337646484, 33.84016036987305, 35.23214340209961, 36.62412643432617, 38.016109466552734, 39.4080924987793, 40.800071716308594, 42.192054748535156, 43.58403778076172, 44.97602081298828, 46.368003845214844]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 7.0, 11.0, 9.0, 20.0, 30.0, 38.0, 57.0, 61.0, 114.0, 114.0, 211.0, 383.0, 683.0, 1435.0, 3201.0, 8722.0, 1025654.0, 4072.0, 1749.0, 819.0, 387.0, 221.0, 164.0, 94.0, 72.0, 53.0, 30.0, 21.0, 12.0, 16.0, 19.0, 16.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.935699462890625, -15.388357162475586, -14.841014862060547, -14.293672561645508, -13.746330261230469, -13.19898796081543, -12.65164566040039, -12.104303359985352, -11.556961059570312, -11.009618759155273, -10.462276458740234, -9.914934158325195, -9.367591857910156, -8.820249557495117, -8.272907257080078, -7.725565433502197, -7.178223609924316, -6.630881309509277, -6.083539009094238, -5.536196708679199, -4.98885440826416, -4.441512107849121, -3.8941702842712402, -3.346827983856201, -2.799485683441162, -2.252143383026123, -1.7048012018203735, -1.157459020614624, -0.610116720199585, -0.0627744197845459, 0.48456764221191406, 1.0319099426269531, 1.5792522430419922, 2.1265945434570312, 2.6739368438720703, 3.2212789058685303, 3.7686212062835693, 4.3159637451171875, 4.863305568695068, 5.410647869110107, 5.9579901695251465, 6.5053324699401855, 7.052674770355225, 7.6000165939331055, 8.147358894348145, 8.694701194763184, 9.242043495178223, 9.789385795593262, 10.3367280960083, 10.88407039642334, 11.431412696838379, 11.978754997253418, 12.526097297668457, 13.073439598083496, 13.620780944824219, 14.168123245239258, 14.715465545654297, 15.262807846069336, 15.810150146484375, 16.357492446899414, 16.904834747314453, 17.452177047729492, 17.99951934814453, 18.54686164855957, 19.09420394897461]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 12.0, 4.0, 10.0, 45.0, 649.0, 51460040.0, 2251.0, 106.0, 15.0, 6.0, 10.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-693.6778564453125, -675.2608642578125, -656.8438720703125, -638.4268798828125, -620.0098876953125, -601.5928955078125, -583.1759033203125, -564.7589111328125, -546.3419189453125, -527.9249267578125, -509.5079345703125, -491.0909423828125, -472.6739501953125, -454.2569580078125, -435.8399963378906, -417.4230041503906, -399.00604248046875, -380.58905029296875, -362.17205810546875, -343.75506591796875, -325.33807373046875, -306.92108154296875, -288.5041198730469, -270.0871276855469, -251.67013549804688, -233.25314331054688, -214.83615112304688, -196.41917419433594, -178.00218200683594, -159.58518981933594, -141.168212890625, -122.751220703125, -104.33425903320312, -85.91726684570312, -67.50028228759766, -49.08329391479492, -30.666305541992188, -12.249313354492188, 6.167671203613281, 24.58465576171875, 43.00164794921875, 61.418636322021484, 79.83562469482422, 98.25260925292969, 116.66960144042969, 135.0865936279297, 153.50357055664062, 171.92056274414062, 190.33755493164062, 208.75454711914062, 227.17153930664062, 245.58851623535156, 264.0054931640625, 282.4224853515625, 300.8394775390625, 319.2564697265625, 337.6734619140625, 356.0904541015625, 374.5074462890625, 392.9244384765625, 411.3414306640625, 429.7584228515625, 448.1753845214844, 466.5923767089844, 485.0093688964844]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 13.0, 13.0, 22.0, 34.0, 36.0, 45.0, 59.0, 68.0, 82.0, 104.0, 114.0, 90.0, 65.0, 54.0, 36.0, 30.0, 25.0, 14.0, 18.0, 6.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.240867614746094, -43.900184631347656, -42.559505462646484, -41.21882247924805, -39.878143310546875, -38.53746032714844, -37.19677734375, -35.85609817504883, -34.51541519165039, -33.17473220825195, -31.83405303955078, -30.493370056152344, -29.15268898010254, -27.812007904052734, -26.47132682800293, -25.130645751953125, -23.78996467590332, -22.449283599853516, -21.10860252380371, -19.767921447753906, -18.42723846435547, -17.086557388305664, -15.74587631225586, -14.405194282531738, -13.064513206481934, -11.723832130432129, -10.383150100708008, -9.042469024658203, -7.70178747177124, -6.361105918884277, -5.020424842834473, -3.6797428131103516, -2.339061737060547, -0.9983803033828735, 0.3423011302947998, 1.6829824447631836, 3.0236639976501465, 4.364345550537109, 5.705026626586914, 7.045708656311035, 8.38638973236084, 9.727070808410645, 11.067752838134766, 12.40843391418457, 13.749114990234375, 15.089797019958496, 16.430477142333984, 17.771160125732422, 19.111841201782227, 20.45252227783203, 21.793203353881836, 23.13388442993164, 24.474567413330078, 25.815248489379883, 27.155929565429688, 28.496612548828125, 29.837291717529297, 31.1779727935791, 32.518653869628906, 33.859336853027344, 35.200016021728516, 36.54069900512695, 37.881378173828125, 39.22206115722656, 40.562744140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 15.0, 9.0, 9.0, 15.0, 12.0, 30.0, 15.0, 25.0, 30.0, 38.0, 35.0, 32.0, 33.0, 35.0, 36.0, 31.0, 56.0, 34.0, 51.0, 39.0, 41.0, 35.0, 46.0, 28.0, 37.0, 25.0, 21.0, 22.0, 18.0, 23.0, 20.0, 12.0, 5.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.677288055419922, -27.8645076751709, -27.051727294921875, -26.238948822021484, -25.42616844177246, -24.613388061523438, -23.800607681274414, -22.98782730102539, -22.175048828125, -21.362268447875977, -20.549488067626953, -19.736709594726562, -18.92392921447754, -18.111148834228516, -17.298368453979492, -16.48558807373047, -15.672807693481445, -14.860027313232422, -14.047247886657715, -13.234467506408691, -12.421688079833984, -11.608907699584961, -10.796127319335938, -9.983346939086914, -9.170567512512207, -8.357787132263184, -7.545007705688477, -6.732227325439453, -5.919447422027588, -5.106667518615723, -4.293887138366699, -3.481107234954834, -2.6683292388916016, -1.8555492162704468, -1.042769193649292, -0.22998905181884766, 0.5827908515930176, 1.3955707550048828, 2.2083511352539062, 3.0211310386657715, 3.8339109420776367, 4.646690845489502, 5.459470748901367, 6.272251129150391, 7.085031032562256, 7.897810935974121, 8.710591316223145, 9.523370742797852, 10.336151123046875, 11.148931503295898, 11.961710929870605, 12.774491310119629, 13.587270736694336, 14.40005111694336, 15.212831497192383, 16.025611877441406, 16.838390350341797, 17.65117073059082, 18.463951110839844, 19.276729583740234, 20.089509963989258, 20.90229034423828, 21.715070724487305, 22.527851104736328, 23.34063148498535]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 9.0, 6.0, 15.0, 18.0, 27.0, 31.0, 54.0, 87.0, 112.0, 211.0, 306.0, 496.0, 815.0, 1403.0, 2568.0, 4939.0, 10453.0, 25256.0, 92052.0, 3099234.0, 851509.0, 69149.0, 19663.0, 7784.0, 3661.0, 1851.0, 997.0, 605.0, 365.0, 213.0, 122.0, 63.0, 73.0, 38.0, 32.0, 22.0, 15.0, 5.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.513092041015625, -1.46075439453125, -1.408416748046875, -1.3560791015625, -1.303741455078125, -1.25140380859375, -1.199066162109375, -1.146728515625, -1.094390869140625, -1.04205322265625, -0.989715576171875, -0.9373779296875, -0.885040283203125, -0.83270263671875, -0.780364990234375, -0.72802734375, -0.675689697265625, -0.62335205078125, -0.571014404296875, -0.5186767578125, -0.466339111328125, -0.41400146484375, -0.361663818359375, -0.309326171875, -0.256988525390625, -0.20465087890625, -0.152313232421875, -0.0999755859375, -0.047637939453125, 0.00469970703125, 0.057037353515625, 0.109375, 0.161712646484375, 0.21405029296875, 0.266387939453125, 0.3187255859375, 0.371063232421875, 0.42340087890625, 0.475738525390625, 0.528076171875, 0.580413818359375, 0.63275146484375, 0.685089111328125, 0.7374267578125, 0.789764404296875, 0.84210205078125, 0.894439697265625, 0.94677734375, 0.999114990234375, 1.05145263671875, 1.103790283203125, 1.1561279296875, 1.208465576171875, 1.26080322265625, 1.313140869140625, 1.365478515625, 1.417816162109375, 1.47015380859375, 1.522491455078125, 1.5748291015625, 1.627166748046875, 1.67950439453125, 1.731842041015625, 1.7841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 14.0, 13.0, 18.0, 19.0, 43.0, 71.0, 113.0, 153.0, 150.0, 138.0, 91.0, 50.0, 21.0, 19.0, 12.0, 11.0, 6.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2433013916015625, -0.236114501953125, -0.2289276123046875, -0.22174072265625, -0.2145538330078125, -0.207366943359375, -0.2001800537109375, -0.1929931640625, -0.1858062744140625, -0.178619384765625, -0.1714324951171875, -0.16424560546875, -0.1570587158203125, -0.149871826171875, -0.1426849365234375, -0.135498046875, -0.1283111572265625, -0.121124267578125, -0.1139373779296875, -0.10675048828125, -0.0995635986328125, -0.092376708984375, -0.0851898193359375, -0.0780029296875, -0.0708160400390625, -0.063629150390625, -0.0564422607421875, -0.04925537109375, -0.0420684814453125, -0.034881591796875, -0.0276947021484375, -0.0205078125, -0.0133209228515625, -0.006134033203125, 0.0010528564453125, 0.00823974609375, 0.0154266357421875, 0.022613525390625, 0.0298004150390625, 0.0369873046875, 0.0441741943359375, 0.051361083984375, 0.0585479736328125, 0.06573486328125, 0.0729217529296875, 0.080108642578125, 0.0872955322265625, 0.094482421875, 0.1016693115234375, 0.108856201171875, 0.1160430908203125, 0.12322998046875, 0.1304168701171875, 0.137603759765625, 0.1447906494140625, 0.1519775390625, 0.1591644287109375, 0.166351318359375, 0.1735382080078125, 0.18072509765625, 0.1879119873046875, 0.195098876953125, 0.2022857666015625, 0.20947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 13.0, 7.0, 5.0, 12.0, 20.0, 25.0, 53.0, 84.0, 107.0, 144.0, 246.0, 372.0, 523.0, 848.0, 1436.0, 2447.0, 4232.0, 8276.0, 16801.0, 38302.0, 102800.0, 376937.0, 2878066.0, 542047.0, 131524.0, 47248.0, 19899.0, 9627.0, 4963.0, 2810.0, 1625.0, 976.0, 614.0, 383.0, 261.0, 171.0, 129.0, 71.0, 66.0, 35.0, 22.0, 20.0, 15.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0602264404296875, -1.021820068359375, -0.9834136962890625, -0.94500732421875, -0.9066009521484375, -0.868194580078125, -0.8297882080078125, -0.7913818359375, -0.7529754638671875, -0.714569091796875, -0.6761627197265625, -0.63775634765625, -0.5993499755859375, -0.560943603515625, -0.5225372314453125, -0.484130859375, -0.4457244873046875, -0.407318115234375, -0.3689117431640625, -0.33050537109375, -0.2920989990234375, -0.253692626953125, -0.2152862548828125, -0.1768798828125, -0.1384735107421875, -0.100067138671875, -0.0616607666015625, -0.02325439453125, 0.0151519775390625, 0.053558349609375, 0.0919647216796875, 0.13037109375, 0.1687774658203125, 0.207183837890625, 0.2455902099609375, 0.28399658203125, 0.3224029541015625, 0.360809326171875, 0.3992156982421875, 0.4376220703125, 0.4760284423828125, 0.514434814453125, 0.5528411865234375, 0.59124755859375, 0.6296539306640625, 0.668060302734375, 0.7064666748046875, 0.744873046875, 0.7832794189453125, 0.821685791015625, 0.8600921630859375, 0.89849853515625, 0.9369049072265625, 0.975311279296875, 1.0137176513671875, 1.0521240234375, 1.0905303955078125, 1.128936767578125, 1.1673431396484375, 1.20574951171875, 1.2441558837890625, 1.282562255859375, 1.3209686279296875, 1.359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 15.0, 17.0, 24.0, 29.0, 51.0, 48.0, 62.0, 83.0, 118.0, 148.0, 257.0, 384.0, 1020.0, 676.0, 328.0, 198.0, 131.0, 95.0, 73.0, 68.0, 46.0, 50.0, 28.0, 16.0, 22.0, 13.0, 10.0, 3.0, 8.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2673225402832031, -0.25656890869140625, -0.24581527709960938, -0.2350616455078125, -0.22430801391601562, -0.21355438232421875, -0.20280075073242188, -0.192047119140625, -0.18129348754882812, -0.17053985595703125, -0.15978622436523438, -0.1490325927734375, -0.13827896118164062, -0.12752532958984375, -0.11677169799804688, -0.10601806640625, -0.09526443481445312, -0.08451080322265625, -0.07375717163085938, -0.0630035400390625, -0.052249908447265625, -0.04149627685546875, -0.030742645263671875, -0.019989013671875, -0.009235382080078125, 0.00151824951171875, 0.012271881103515625, 0.0230255126953125, 0.033779144287109375, 0.04453277587890625, 0.055286407470703125, 0.0660400390625, 0.07679367065429688, 0.08754730224609375, 0.09830093383789062, 0.1090545654296875, 0.11980819702148438, 0.13056182861328125, 0.14131546020507812, 0.152069091796875, 0.16282272338867188, 0.17357635498046875, 0.18432998657226562, 0.1950836181640625, 0.20583724975585938, 0.21659088134765625, 0.22734451293945312, 0.23809814453125, 0.24885177612304688, 0.25960540771484375, 0.2703590393066406, 0.2811126708984375, 0.2918663024902344, 0.30261993408203125, 0.3133735656738281, 0.324127197265625, 0.3348808288574219, 0.34563446044921875, 0.3563880920410156, 0.3671417236328125, 0.3778953552246094, 0.38864898681640625, 0.3994026184082031, 0.41015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 7.0, 6.0, 14.0, 12.0, 33.0, 43.0, 79.0, 113.0, 178.0, 169.0, 120.0, 69.0, 66.0, 26.0, 21.0, 9.0, 12.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6453351974487305, -3.504408836364746, -3.3634824752807617, -3.2225561141967773, -3.081629753112793, -2.9407033920288086, -2.799777030944824, -2.65885066986084, -2.5179243087768555, -2.376997947692871, -2.2360715866088867, -2.0951452255249023, -1.954218864440918, -1.8132925033569336, -1.6723662614822388, -1.5314399003982544, -1.3905136585235596, -1.2495872974395752, -1.1086609363555908, -0.9677346348762512, -0.8268082737922668, -0.6858819127082825, -0.5449556112289429, -0.4040292501449585, -0.2631028890609741, -0.12217654287815094, 0.01874980330467224, 0.15967613458633423, 0.3006024956703186, 0.441528856754303, 0.5824551582336426, 0.723381519317627, 0.8643078804016113, 1.0052342414855957, 1.14616060256958, 1.2870869636535645, 1.4280133247375488, 1.5689396858215332, 1.709865927696228, 1.8507922887802124, 1.9917186498641968, 2.1326448917388916, 2.273571252822876, 2.4144976139068604, 2.5554239749908447, 2.696350336074829, 2.8372766971588135, 2.978203058242798, 3.1191294193267822, 3.2600557804107666, 3.400982141494751, 3.5419085025787354, 3.6828348636627197, 3.823761224746704, 3.9646873474121094, 4.105613708496094, 4.246540069580078, 4.3874664306640625, 4.528392791748047, 4.669319152832031, 4.810245513916016, 4.951171875, 5.092098236083984, 5.233024597167969, 5.373950958251953]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 12.0, 9.0, 13.0, 16.0, 13.0, 23.0, 23.0, 23.0, 31.0, 33.0, 50.0, 39.0, 47.0, 50.0, 50.0, 53.0, 42.0, 43.0, 56.0, 38.0, 44.0, 38.0, 34.0, 32.0, 29.0, 20.0, 18.0, 11.0, 14.0, 13.0, 12.0, 8.0, 9.0, 2.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.381821870803833, -1.3363724946975708, -1.2909231185913086, -1.2454737424850464, -1.2000243663787842, -1.154574990272522, -1.1091256141662598, -1.063676118850708, -1.0182268619537354, -0.9727774858474731, -0.9273281097412109, -0.8818787336349487, -0.8364293575286865, -0.7909799814224243, -0.7455305457115173, -0.7000811696052551, -0.6546317338943481, -0.6091823577880859, -0.5637329816818237, -0.5182836055755615, -0.47283419966697693, -0.4273848235607147, -0.3819354176521301, -0.3364860415458679, -0.2910366654396057, -0.2455872893333435, -0.2001378983259201, -0.1546885073184967, -0.1092391312122345, -0.06378975510597229, -0.018340349197387695, 0.02710902690887451, 0.07255840301513672, 0.11800778657197952, 0.16345717012882233, 0.20890656113624573, 0.25435593724250793, 0.29980531334877014, 0.34525471925735474, 0.39070409536361694, 0.43615347146987915, 0.48160284757614136, 0.5270522236824036, 0.5725016593933105, 0.6179510354995728, 0.663400411605835, 0.7088497877120972, 0.7542991638183594, 0.7997485399246216, 0.8451979160308838, 0.890647292137146, 0.9360966682434082, 0.9815460443496704, 1.0269954204559326, 1.0724449157714844, 1.117894172668457, 1.1633436679840088, 1.208793044090271, 1.2542424201965332, 1.2996917963027954, 1.3451411724090576, 1.3905905485153198, 1.436039924621582, 1.4814894199371338, 1.5269386768341064]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 19.0, 19.0, 26.0, 33.0, 42.0, 71.0, 115.0, 152.0, 279.0, 385.0, 584.0, 954.0, 1606.0, 2561.0, 4395.0, 7627.0, 14201.0, 32527.0, 100604.0, 372430.0, 354090.0, 93001.0, 30859.0, 13772.0, 7141.0, 4212.0, 2552.0, 1596.0, 952.0, 612.0, 385.0, 243.0, 150.0, 117.0, 75.0, 50.0, 26.0, 26.0, 22.0, 12.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9428558349609375, -0.909149169921875, -0.8754425048828125, -0.84173583984375, -0.8080291748046875, -0.774322509765625, -0.7406158447265625, -0.7069091796875, -0.6732025146484375, -0.639495849609375, -0.6057891845703125, -0.57208251953125, -0.5383758544921875, -0.504669189453125, -0.4709625244140625, -0.437255859375, -0.4035491943359375, -0.369842529296875, -0.3361358642578125, -0.30242919921875, -0.2687225341796875, -0.235015869140625, -0.2013092041015625, -0.1676025390625, -0.1338958740234375, -0.100189208984375, -0.0664825439453125, -0.03277587890625, 0.0009307861328125, 0.034637451171875, 0.0683441162109375, 0.10205078125, 0.1357574462890625, 0.169464111328125, 0.2031707763671875, 0.23687744140625, 0.2705841064453125, 0.304290771484375, 0.3379974365234375, 0.3717041015625, 0.4054107666015625, 0.439117431640625, 0.4728240966796875, 0.50653076171875, 0.5402374267578125, 0.573944091796875, 0.6076507568359375, 0.641357421875, 0.6750640869140625, 0.708770751953125, 0.7424774169921875, 0.77618408203125, 0.8098907470703125, 0.843597412109375, 0.8773040771484375, 0.9110107421875, 0.9447174072265625, 0.978424072265625, 1.0121307373046875, 1.04583740234375, 1.0795440673828125, 1.113250732421875, 1.1469573974609375, 1.1806640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 10.0, 3.0, 9.0, 9.0, 11.0, 20.0, 44.0, 56.0, 85.0, 151.0, 145.0, 138.0, 113.0, 66.0, 39.0, 21.0, 19.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.297607421875, -0.2900409698486328, -0.2824745178222656, -0.27490806579589844, -0.26734161376953125, -0.25977516174316406, -0.2522087097167969, -0.2446422576904297, -0.2370758056640625, -0.2295093536376953, -0.22194290161132812, -0.21437644958496094, -0.20680999755859375, -0.19924354553222656, -0.19167709350585938, -0.1841106414794922, -0.176544189453125, -0.1689777374267578, -0.16141128540039062, -0.15384483337402344, -0.14627838134765625, -0.13871192932128906, -0.13114547729492188, -0.12357902526855469, -0.1160125732421875, -0.10844612121582031, -0.10087966918945312, -0.09331321716308594, -0.08574676513671875, -0.07818031311035156, -0.07061386108398438, -0.06304740905761719, -0.05548095703125, -0.04791450500488281, -0.040348052978515625, -0.03278160095214844, -0.02521514892578125, -0.017648696899414062, -0.010082244873046875, -0.0025157928466796875, 0.0050506591796875, 0.012617111206054688, 0.020183563232421875, 0.027750015258789062, 0.03531646728515625, 0.04288291931152344, 0.050449371337890625, 0.05801582336425781, 0.065582275390625, 0.07314872741699219, 0.08071517944335938, 0.08828163146972656, 0.09584808349609375, 0.10341453552246094, 0.11098098754882812, 0.11854743957519531, 0.1261138916015625, 0.1336803436279297, 0.14124679565429688, 0.14881324768066406, 0.15637969970703125, 0.16394615173339844, 0.17151260375976562, 0.1790790557861328, 0.1866455078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 8.0, 10.0, 13.0, 15.0, 25.0, 45.0, 71.0, 103.0, 167.0, 240.0, 384.0, 596.0, 941.0, 1519.0, 2678.0, 4476.0, 8166.0, 15942.0, 31912.0, 69580.0, 157375.0, 300588.0, 241203.0, 111686.0, 49610.0, 23859.0, 12021.0, 6353.0, 3506.0, 2006.0, 1258.0, 832.0, 460.0, 296.0, 224.0, 138.0, 78.0, 57.0, 32.0, 30.0, 25.0, 10.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8852386474609375, -0.857391357421875, -0.8295440673828125, -0.80169677734375, -0.7738494873046875, -0.746002197265625, -0.7181549072265625, -0.6903076171875, -0.6624603271484375, -0.634613037109375, -0.6067657470703125, -0.57891845703125, -0.5510711669921875, -0.523223876953125, -0.4953765869140625, -0.467529296875, -0.4396820068359375, -0.411834716796875, -0.3839874267578125, -0.35614013671875, -0.3282928466796875, -0.300445556640625, -0.2725982666015625, -0.2447509765625, -0.2169036865234375, -0.189056396484375, -0.1612091064453125, -0.13336181640625, -0.1055145263671875, -0.077667236328125, -0.0498199462890625, -0.02197265625, 0.0058746337890625, 0.033721923828125, 0.0615692138671875, 0.08941650390625, 0.1172637939453125, 0.145111083984375, 0.1729583740234375, 0.2008056640625, 0.2286529541015625, 0.256500244140625, 0.2843475341796875, 0.31219482421875, 0.3400421142578125, 0.367889404296875, 0.3957366943359375, 0.423583984375, 0.4514312744140625, 0.479278564453125, 0.5071258544921875, 0.53497314453125, 0.5628204345703125, 0.590667724609375, 0.6185150146484375, 0.6463623046875, 0.6742095947265625, 0.702056884765625, 0.7299041748046875, 0.75775146484375, 0.7855987548828125, 0.813446044921875, 0.8412933349609375, 0.869140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 3.0, 15.0, 14.0, 17.0, 17.0, 18.0, 38.0, 32.0, 33.0, 29.0, 37.0, 34.0, 45.0, 33.0, 43.0, 43.0, 68.0, 45.0, 33.0, 35.0, 39.0, 39.0, 34.0, 19.0, 27.0, 19.0, 23.0, 18.0, 13.0, 13.0, 14.0, 13.0, 10.0, 9.0, 6.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.8369140625, -0.810455322265625, -0.78399658203125, -0.757537841796875, -0.7310791015625, -0.704620361328125, -0.67816162109375, -0.651702880859375, -0.625244140625, -0.598785400390625, -0.57232666015625, -0.545867919921875, -0.5194091796875, -0.492950439453125, -0.46649169921875, -0.440032958984375, -0.41357421875, -0.387115478515625, -0.36065673828125, -0.334197998046875, -0.3077392578125, -0.281280517578125, -0.25482177734375, -0.228363037109375, -0.201904296875, -0.175445556640625, -0.14898681640625, -0.122528076171875, -0.0960693359375, -0.069610595703125, -0.04315185546875, -0.016693115234375, 0.009765625, 0.036224365234375, 0.06268310546875, 0.089141845703125, 0.1156005859375, 0.142059326171875, 0.16851806640625, 0.194976806640625, 0.221435546875, 0.247894287109375, 0.27435302734375, 0.300811767578125, 0.3272705078125, 0.353729248046875, 0.38018798828125, 0.406646728515625, 0.43310546875, 0.459564208984375, 0.48602294921875, 0.512481689453125, 0.5389404296875, 0.565399169921875, 0.59185791015625, 0.618316650390625, 0.644775390625, 0.671234130859375, 0.69769287109375, 0.724151611328125, 0.7506103515625, 0.777069091796875, 0.80352783203125, 0.829986572265625, 0.8564453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 9.0, 10.0, 17.0, 10.0, 28.0, 46.0, 66.0, 87.0, 159.0, 283.0, 542.0, 1112.0, 2483.0, 6578.0, 22727.0, 144994.0, 721116.0, 117769.0, 19863.0, 5956.0, 2394.0, 1048.0, 517.0, 290.0, 166.0, 97.0, 63.0, 42.0, 30.0, 19.0, 9.0, 7.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.97930908203125, -2.8902587890625, -2.80120849609375, -2.712158203125, -2.62310791015625, -2.5340576171875, -2.44500732421875, -2.35595703125, -2.26690673828125, -2.1778564453125, -2.08880615234375, -1.999755859375, -1.91070556640625, -1.8216552734375, -1.73260498046875, -1.6435546875, -1.55450439453125, -1.4654541015625, -1.37640380859375, -1.287353515625, -1.19830322265625, -1.1092529296875, -1.02020263671875, -0.93115234375, -0.84210205078125, -0.7530517578125, -0.66400146484375, -0.574951171875, -0.48590087890625, -0.3968505859375, -0.30780029296875, -0.21875, -0.12969970703125, -0.0406494140625, 0.04840087890625, 0.137451171875, 0.22650146484375, 0.3155517578125, 0.40460205078125, 0.49365234375, 0.58270263671875, 0.6717529296875, 0.76080322265625, 0.849853515625, 0.93890380859375, 1.0279541015625, 1.11700439453125, 1.2060546875, 1.29510498046875, 1.3841552734375, 1.47320556640625, 1.562255859375, 1.65130615234375, 1.7403564453125, 1.82940673828125, 1.91845703125, 2.00750732421875, 2.0965576171875, 2.18560791015625, 2.274658203125, 2.36370849609375, 2.4527587890625, 2.54180908203125, 2.630859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 10.0, 12.0, 30.0, 16.0, 34.0, 29.0, 26.0, 45.0, 58.0, 60.0, 62.0, 71.0, 62.0, 75.0, 61.0, 58.0, 34.0, 38.0, 30.0, 32.0, 24.0, 28.0, 12.0, 9.0, 13.0, 2.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00022840499877929688, -0.00022223219275474548, -0.0002160593867301941, -0.0002098865807056427, -0.0002037137746810913, -0.00019754096865653992, -0.00019136816263198853, -0.00018519535660743713, -0.00017902255058288574, -0.00017284974455833435, -0.00016667693853378296, -0.00016050413250923157, -0.00015433132648468018, -0.00014815852046012878, -0.0001419857144355774, -0.000135812908411026, -0.0001296401023864746, -0.00012346729636192322, -0.00011729449033737183, -0.00011112168431282043, -0.00010494887828826904, -9.877607226371765e-05, -9.260326623916626e-05, -8.643046021461487e-05, -8.025765419006348e-05, -7.408484816551208e-05, -6.79120421409607e-05, -6.17392361164093e-05, -5.556643009185791e-05, -4.939362406730652e-05, -4.322081804275513e-05, -3.7048012018203735e-05, -3.0875205993652344e-05, -2.4702399969100952e-05, -1.852959394454956e-05, -1.2356787919998169e-05, -6.183981895446777e-06, -1.1175870895385742e-08, 6.161630153656006e-06, 1.2334436178207397e-05, 1.850724220275879e-05, 2.468004822731018e-05, 3.085285425186157e-05, 3.7025660276412964e-05, 4.3198466300964355e-05, 4.937127232551575e-05, 5.554407835006714e-05, 6.171688437461853e-05, 6.788969039916992e-05, 7.406249642372131e-05, 8.02353024482727e-05, 8.64081084728241e-05, 9.258091449737549e-05, 9.875372052192688e-05, 0.00010492652654647827, 0.00011109933257102966, 0.00011727213859558105, 0.00012344494462013245, 0.00012961775064468384, 0.00013579055666923523, 0.00014196336269378662, 0.000148136168718338, 0.0001543089747428894, 0.0001604817807674408, 0.0001666545867919922]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 6.0, 5.0, 14.0, 21.0, 24.0, 45.0, 62.0, 72.0, 170.0, 263.0, 514.0, 1024.0, 2108.0, 4673.0, 11779.0, 35738.0, 154226.0, 552093.0, 215150.0, 45627.0, 14399.0, 5527.0, 2434.0, 1146.0, 623.0, 297.0, 180.0, 122.0, 64.0, 41.0, 30.0, 22.0, 16.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3706817626953125, -1.324371337890625, -1.2780609130859375, -1.23175048828125, -1.1854400634765625, -1.139129638671875, -1.0928192138671875, -1.0465087890625, -1.0001983642578125, -0.953887939453125, -0.9075775146484375, -0.86126708984375, -0.8149566650390625, -0.768646240234375, -0.7223358154296875, -0.676025390625, -0.6297149658203125, -0.583404541015625, -0.5370941162109375, -0.49078369140625, -0.4444732666015625, -0.398162841796875, -0.3518524169921875, -0.3055419921875, -0.2592315673828125, -0.212921142578125, -0.1666107177734375, -0.12030029296875, -0.0739898681640625, -0.027679443359375, 0.0186309814453125, 0.06494140625, 0.1112518310546875, 0.157562255859375, 0.2038726806640625, 0.25018310546875, 0.2964935302734375, 0.342803955078125, 0.3891143798828125, 0.4354248046875, 0.4817352294921875, 0.528045654296875, 0.5743560791015625, 0.62066650390625, 0.6669769287109375, 0.713287353515625, 0.7595977783203125, 0.805908203125, 0.8522186279296875, 0.898529052734375, 0.9448394775390625, 0.99114990234375, 1.0374603271484375, 1.083770751953125, 1.1300811767578125, 1.1763916015625, 1.2227020263671875, 1.269012451171875, 1.3153228759765625, 1.36163330078125, 1.4079437255859375, 1.454254150390625, 1.5005645751953125, 1.546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 6.0, 13.0, 14.0, 22.0, 40.0, 23.0, 66.0, 77.0, 67.0, 104.0, 114.0, 108.0, 102.0, 70.0, 45.0, 44.0, 27.0, 23.0, 11.0, 10.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0078125, -0.9669952392578125, -0.926177978515625, -0.8853607177734375, -0.84454345703125, -0.8037261962890625, -0.762908935546875, -0.7220916748046875, -0.6812744140625, -0.6404571533203125, -0.599639892578125, -0.5588226318359375, -0.51800537109375, -0.4771881103515625, -0.436370849609375, -0.3955535888671875, -0.354736328125, -0.3139190673828125, -0.273101806640625, -0.2322845458984375, -0.19146728515625, -0.1506500244140625, -0.109832763671875, -0.0690155029296875, -0.0281982421875, 0.0126190185546875, 0.053436279296875, 0.0942535400390625, 0.13507080078125, 0.1758880615234375, 0.216705322265625, 0.2575225830078125, 0.29833984375, 0.3391571044921875, 0.379974365234375, 0.4207916259765625, 0.46160888671875, 0.5024261474609375, 0.543243408203125, 0.5840606689453125, 0.6248779296875, 0.6656951904296875, 0.706512451171875, 0.7473297119140625, 0.78814697265625, 0.8289642333984375, 0.869781494140625, 0.9105987548828125, 0.951416015625, 0.9922332763671875, 1.033050537109375, 1.0738677978515625, 1.11468505859375, 1.1555023193359375, 1.196319580078125, 1.2371368408203125, 1.2779541015625, 1.3187713623046875, 1.359588623046875, 1.4004058837890625, 1.44122314453125, 1.4820404052734375, 1.522857666015625, 1.5636749267578125, 1.6044921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 15.0, 19.0, 32.0, 62.0, 86.0, 130.0, 194.0, 179.0, 111.0, 55.0, 34.0, 27.0, 10.0, 8.0, 12.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.016237258911133, -24.386547088623047, -23.75685691833496, -23.127168655395508, -22.497478485107422, -21.867788314819336, -21.23809814453125, -20.608409881591797, -19.97871971130371, -19.349029541015625, -18.71933937072754, -18.089651107788086, -17.4599609375, -16.830270767211914, -16.200580596923828, -15.570891380310059, -14.941201210021973, -14.311511039733887, -13.681821823120117, -13.052131652832031, -12.422442436218262, -11.792752265930176, -11.163063049316406, -10.53337287902832, -9.903682708740234, -9.273992538452148, -8.644303321838379, -8.014613151550293, -7.384923934936523, -6.7552337646484375, -6.12554407119751, -5.495854377746582, -4.866164207458496, -4.236474514007568, -3.6067848205566406, -2.977094888687134, -2.347405195236206, -1.7177155017852783, -1.0880255699157715, -0.45833587646484375, 0.17135381698608398, 0.8010435700416565, 1.430733323097229, 2.0604231357574463, 2.690112829208374, 3.3198025226593018, 3.9494924545288086, 4.579182147979736, 5.208871841430664, 5.838561534881592, 6.4682512283325195, 7.0979413986206055, 7.727630615234375, 8.357320785522461, 8.987010955810547, 9.616700172424316, 10.246389389038086, 10.876079559326172, 11.505768775939941, 12.135458946228027, 12.765148162841797, 13.394838333129883, 14.024528503417969, 14.654217720031738, 15.283907890319824]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 17.0, 13.0, 26.0, 89.0, 142.0, 180.0, 176.0, 135.0, 67.0, 39.0, 33.0, 19.0, 14.0, 9.0, 4.0, 7.0, 2.0, 0.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.70224952697754, -15.984796524047852, -15.267342567443848, -14.549888610839844, -13.832435607910156, -13.114982604980469, -12.397528648376465, -11.680074691772461, -10.962621688842773, -10.245168685913086, -9.527714729309082, -8.810260772705078, -8.09280776977539, -7.375354290008545, -6.657900810241699, -5.9404473304748535, -5.222993850708008, -4.505540370941162, -3.7880868911743164, -3.0706334114074707, -2.353179931640625, -1.6357264518737793, -0.9182729721069336, -0.2008194923400879, 0.5166339874267578, 1.2340874671936035, 1.9515409469604492, 2.668994426727295, 3.3864479064941406, 4.103901386260986, 4.821354866027832, 5.538808345794678, 6.256259918212891, 6.973713397979736, 7.691166877746582, 8.408620834350586, 9.126073837280273, 9.843526840209961, 10.560980796813965, 11.278434753417969, 11.995887756347656, 12.713340759277344, 13.430794715881348, 14.148248672485352, 14.865701675415039, 15.583154678344727, 16.300609588623047, 17.018062591552734, 17.735515594482422, 18.45296859741211, 19.170421600341797, 19.887876510620117, 20.605329513549805, 21.322782516479492, 22.040237426757812, 22.7576904296875, 23.475143432617188, 24.192596435546875, 24.910049438476562, 25.627504348754883, 26.34495735168457, 27.062410354614258, 27.779865264892578, 28.497318267822266, 29.214771270751953]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 8.0, 11.0, 13.0, 21.0, 34.0, 70.0, 80.0, 133.0, 244.0, 470.0, 862.0, 1772.0, 4346.0, 13133.0, 63436.0, 3699084.0, 362857.0, 32721.0, 8552.0, 3266.0, 1472.0, 710.0, 368.0, 187.0, 133.0, 87.0, 57.0, 38.0, 32.0, 16.0, 10.0, 15.0, 3.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7109375, -2.616851806640625, -2.52276611328125, -2.428680419921875, -2.3345947265625, -2.240509033203125, -2.14642333984375, -2.052337646484375, -1.958251953125, -1.864166259765625, -1.77008056640625, -1.675994873046875, -1.5819091796875, -1.487823486328125, -1.39373779296875, -1.299652099609375, -1.20556640625, -1.111480712890625, -1.01739501953125, -0.923309326171875, -0.8292236328125, -0.735137939453125, -0.64105224609375, -0.546966552734375, -0.452880859375, -0.358795166015625, -0.26470947265625, -0.170623779296875, -0.0765380859375, 0.017547607421875, 0.11163330078125, 0.205718994140625, 0.2998046875, 0.393890380859375, 0.48797607421875, 0.582061767578125, 0.6761474609375, 0.770233154296875, 0.86431884765625, 0.958404541015625, 1.052490234375, 1.146575927734375, 1.24066162109375, 1.334747314453125, 1.4288330078125, 1.522918701171875, 1.61700439453125, 1.711090087890625, 1.80517578125, 1.899261474609375, 1.99334716796875, 2.087432861328125, 2.1815185546875, 2.275604248046875, 2.36968994140625, 2.463775634765625, 2.557861328125, 2.651947021484375, 2.74603271484375, 2.840118408203125, 2.9342041015625, 3.028289794921875, 3.12237548828125, 3.216461181640625, 3.310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 9.0, 10.0, 15.0, 17.0, 20.0, 50.0, 51.0, 80.0, 107.0, 121.0, 108.0, 95.0, 79.0, 63.0, 42.0, 30.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2236328125, -0.21726036071777344, -0.21088790893554688, -0.2045154571533203, -0.19814300537109375, -0.1917705535888672, -0.18539810180664062, -0.17902565002441406, -0.1726531982421875, -0.16628074645996094, -0.15990829467773438, -0.1535358428955078, -0.14716339111328125, -0.1407909393310547, -0.13441848754882812, -0.12804603576660156, -0.121673583984375, -0.11530113220214844, -0.10892868041992188, -0.10255622863769531, -0.09618377685546875, -0.08981132507324219, -0.08343887329101562, -0.07706642150878906, -0.0706939697265625, -0.06432151794433594, -0.057949066162109375, -0.05157661437988281, -0.04520416259765625, -0.03883171081542969, -0.032459259033203125, -0.026086807250976562, -0.01971435546875, -0.013341903686523438, -0.006969451904296875, -0.0005970001220703125, 0.00577545166015625, 0.012147903442382812, 0.018520355224609375, 0.024892807006835938, 0.0312652587890625, 0.03763771057128906, 0.044010162353515625, 0.05038261413574219, 0.05675506591796875, 0.06312751770019531, 0.06949996948242188, 0.07587242126464844, 0.082244873046875, 0.08861732482910156, 0.09498977661132812, 0.10136222839355469, 0.10773468017578125, 0.11410713195800781, 0.12047958374023438, 0.12685203552246094, 0.1332244873046875, 0.13959693908691406, 0.14596939086914062, 0.1523418426513672, 0.15871429443359375, 0.1650867462158203, 0.17145919799804688, 0.17783164978027344, 0.1842041015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 22.0, 30.0, 60.0, 61.0, 105.0, 148.0, 221.0, 349.0, 538.0, 884.0, 1496.0, 2677.0, 5025.0, 10376.0, 23179.0, 58548.0, 199921.0, 2850101.0, 830002.0, 131316.0, 43004.0, 18029.0, 8378.0, 4243.0, 2170.0, 1276.0, 779.0, 434.0, 289.0, 180.0, 122.0, 77.0, 62.0, 44.0, 28.0, 17.0, 15.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6639862060546875, -1.608245849609375, -1.5525054931640625, -1.49676513671875, -1.4410247802734375, -1.385284423828125, -1.3295440673828125, -1.2738037109375, -1.2180633544921875, -1.162322998046875, -1.1065826416015625, -1.05084228515625, -0.9951019287109375, -0.939361572265625, -0.8836212158203125, -0.827880859375, -0.7721405029296875, -0.716400146484375, -0.6606597900390625, -0.60491943359375, -0.5491790771484375, -0.493438720703125, -0.4376983642578125, -0.3819580078125, -0.3262176513671875, -0.270477294921875, -0.2147369384765625, -0.15899658203125, -0.1032562255859375, -0.047515869140625, 0.0082244873046875, 0.06396484375, 0.1197052001953125, 0.175445556640625, 0.2311859130859375, 0.28692626953125, 0.3426666259765625, 0.398406982421875, 0.4541473388671875, 0.5098876953125, 0.5656280517578125, 0.621368408203125, 0.6771087646484375, 0.73284912109375, 0.7885894775390625, 0.844329833984375, 0.9000701904296875, 0.955810546875, 1.0115509033203125, 1.067291259765625, 1.1230316162109375, 1.17877197265625, 1.2345123291015625, 1.290252685546875, 1.3459930419921875, 1.4017333984375, 1.4574737548828125, 1.513214111328125, 1.5689544677734375, 1.62469482421875, 1.6804351806640625, 1.736175537109375, 1.7919158935546875, 1.84765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 23.0, 17.0, 32.0, 37.0, 37.0, 75.0, 118.0, 157.0, 300.0, 922.0, 1577.0, 285.0, 178.0, 98.0, 52.0, 41.0, 25.0, 25.0, 16.0, 10.0, 7.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.43161964416503906, -0.4208564758300781, -0.4100933074951172, -0.39933013916015625, -0.3885669708251953, -0.3778038024902344, -0.36704063415527344, -0.3562774658203125, -0.34551429748535156, -0.3347511291503906, -0.3239879608154297, -0.31322479248046875, -0.3024616241455078, -0.2916984558105469, -0.28093528747558594, -0.270172119140625, -0.25940895080566406, -0.24864578247070312, -0.2378826141357422, -0.22711944580078125, -0.2163562774658203, -0.20559310913085938, -0.19482994079589844, -0.1840667724609375, -0.17330360412597656, -0.16254043579101562, -0.1517772674560547, -0.14101409912109375, -0.1302509307861328, -0.11948776245117188, -0.10872459411621094, -0.09796142578125, -0.08719825744628906, -0.07643508911132812, -0.06567192077636719, -0.05490875244140625, -0.04414558410644531, -0.033382415771484375, -0.022619247436523438, -0.0118560791015625, -0.0010929107666015625, 0.009670257568359375, 0.020433425903320312, 0.03119659423828125, 0.04195976257324219, 0.052722930908203125, 0.06348609924316406, 0.074249267578125, 0.08501243591308594, 0.09577560424804688, 0.10653877258300781, 0.11730194091796875, 0.1280651092529297, 0.13882827758789062, 0.14959144592285156, 0.1603546142578125, 0.17111778259277344, 0.18188095092773438, 0.1926441192626953, 0.20340728759765625, 0.2141704559326172, 0.22493362426757812, 0.23569679260253906, 0.2464599609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 8.0, 13.0, 20.0, 50.0, 62.0, 95.0, 138.0, 167.0, 177.0, 97.0, 82.0, 36.0, 25.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0077247619628906, -2.92850923538208, -2.8492939472198486, -2.770078659057617, -2.6908631324768066, -2.611647605895996, -2.5324323177337646, -2.453217029571533, -2.3740015029907227, -2.294785976409912, -2.2155706882476807, -2.136355400085449, -2.0571398735046387, -1.9779244661331177, -1.8987090587615967, -1.8194936513900757, -1.7402782440185547, -1.6610628366470337, -1.5818474292755127, -1.5026320219039917, -1.4234166145324707, -1.3442012071609497, -1.2649857997894287, -1.1857703924179077, -1.1065549850463867, -1.0273395776748657, -0.9481241703033447, -0.8689087629318237, -0.7896933555603027, -0.7104779481887817, -0.6312625408172607, -0.5520471334457397, -0.47283172607421875, -0.39361631870269775, -0.31440091133117676, -0.23518550395965576, -0.15597009658813477, -0.07675468921661377, 0.0024607181549072266, 0.08167612552642822, 0.16089153289794922, 0.24010694026947021, 0.3193223476409912, 0.3985377550125122, 0.4777531623840332, 0.5569685697555542, 0.6361839771270752, 0.7153993844985962, 0.7946147918701172, 0.8738301992416382, 0.9530456066131592, 1.0322610139846802, 1.1114764213562012, 1.1906918287277222, 1.2699072360992432, 1.3491226434707642, 1.4283380508422852, 1.5075534582138062, 1.5867688655853271, 1.6659842729568481, 1.7451996803283691, 1.8244150876998901, 1.9036304950714111, 1.9828459024429321, 2.062061309814453]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 6.0, 5.0, 11.0, 16.0, 15.0, 24.0, 19.0, 36.0, 36.0, 38.0, 51.0, 48.0, 58.0, 71.0, 47.0, 59.0, 53.0, 45.0, 52.0, 44.0, 44.0, 32.0, 38.0, 22.0, 29.0, 13.0, 15.0, 8.0, 17.0, 5.0, 4.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1543371677398682, -1.1169861555099487, -1.0796351432800293, -1.0422840118408203, -1.0049329996109009, -0.9675819873809814, -0.9302309155464172, -0.892879843711853, -0.8555288314819336, -0.8181778192520142, -0.78082674741745, -0.7434756755828857, -0.7061246633529663, -0.6687736511230469, -0.6314225792884827, -0.5940715074539185, -0.556720495223999, -0.5193694829940796, -0.4820184111595154, -0.44466736912727356, -0.40731632709503174, -0.3699652850627899, -0.3326142430305481, -0.2952632009983063, -0.25791215896606445, -0.22056111693382263, -0.1832100749015808, -0.145859032869339, -0.10850799083709717, -0.07115694880485535, -0.033805906772613525, 0.003545135259628296, 0.040896058082580566, 0.07824710011482239, 0.11559814214706421, 0.15294918417930603, 0.19030022621154785, 0.22765126824378967, 0.2650023102760315, 0.3023533523082733, 0.33970439434051514, 0.37705543637275696, 0.4144064784049988, 0.4517575204372406, 0.4891085624694824, 0.5264595746994019, 0.5638106465339661, 0.6011617183685303, 0.6385127305984497, 0.6758637428283691, 0.7132148146629333, 0.7505658864974976, 0.787916898727417, 0.8252679109573364, 0.8626189827919006, 0.8999700546264648, 0.9373210668563843, 0.9746720790863037, 1.0120232105255127, 1.0493742227554321, 1.0867252349853516, 1.124076247215271, 1.1614272594451904, 1.1987783908843994, 1.2361294031143188]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 12.0, 23.0, 26.0, 42.0, 65.0, 89.0, 111.0, 184.0, 292.0, 458.0, 836.0, 1430.0, 2553.0, 4835.0, 9489.0, 20818.0, 50557.0, 142291.0, 340486.0, 291306.0, 109212.0, 39293.0, 16816.0, 7924.0, 3937.0, 2183.0, 1264.0, 691.0, 471.0, 292.0, 176.0, 122.0, 74.0, 49.0, 37.0, 27.0, 20.0, 14.0, 11.0, 5.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0939483642578125, -1.056060791015625, -1.0181732177734375, -0.98028564453125, -0.9423980712890625, -0.904510498046875, -0.8666229248046875, -0.8287353515625, -0.7908477783203125, -0.752960205078125, -0.7150726318359375, -0.67718505859375, -0.6392974853515625, -0.601409912109375, -0.5635223388671875, -0.525634765625, -0.4877471923828125, -0.449859619140625, -0.4119720458984375, -0.37408447265625, -0.3361968994140625, -0.298309326171875, -0.2604217529296875, -0.2225341796875, -0.1846466064453125, -0.146759033203125, -0.1088714599609375, -0.07098388671875, -0.0330963134765625, 0.004791259765625, 0.0426788330078125, 0.08056640625, 0.1184539794921875, 0.156341552734375, 0.1942291259765625, 0.23211669921875, 0.2700042724609375, 0.307891845703125, 0.3457794189453125, 0.3836669921875, 0.4215545654296875, 0.459442138671875, 0.4973297119140625, 0.53521728515625, 0.5731048583984375, 0.610992431640625, 0.6488800048828125, 0.686767578125, 0.7246551513671875, 0.762542724609375, 0.8004302978515625, 0.83831787109375, 0.8762054443359375, 0.914093017578125, 0.9519805908203125, 0.9898681640625, 1.0277557373046875, 1.065643310546875, 1.1035308837890625, 1.14141845703125, 1.1793060302734375, 1.217193603515625, 1.2550811767578125, 1.29296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 8.0, 31.0, 34.0, 49.0, 64.0, 92.0, 92.0, 109.0, 104.0, 83.0, 60.0, 52.0, 57.0, 29.0, 23.0, 9.0, 16.0, 8.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2281494140625, -0.22223663330078125, -0.2163238525390625, -0.21041107177734375, -0.204498291015625, -0.19858551025390625, -0.1926727294921875, -0.18675994873046875, -0.18084716796875, -0.17493438720703125, -0.1690216064453125, -0.16310882568359375, -0.157196044921875, -0.15128326416015625, -0.1453704833984375, -0.13945770263671875, -0.133544921875, -0.12763214111328125, -0.1217193603515625, -0.11580657958984375, -0.109893798828125, -0.10398101806640625, -0.0980682373046875, -0.09215545654296875, -0.08624267578125, -0.08032989501953125, -0.0744171142578125, -0.06850433349609375, -0.062591552734375, -0.05667877197265625, -0.0507659912109375, -0.04485321044921875, -0.0389404296875, -0.03302764892578125, -0.0271148681640625, -0.02120208740234375, -0.015289306640625, -0.00937652587890625, -0.0034637451171875, 0.00244903564453125, 0.00836181640625, 0.01427459716796875, 0.0201873779296875, 0.02610015869140625, 0.032012939453125, 0.03792572021484375, 0.0438385009765625, 0.04975128173828125, 0.0556640625, 0.06157684326171875, 0.0674896240234375, 0.07340240478515625, 0.079315185546875, 0.08522796630859375, 0.0911407470703125, 0.09705352783203125, 0.10296630859375, 0.10887908935546875, 0.1147918701171875, 0.12070465087890625, 0.126617431640625, 0.13253021240234375, 0.1384429931640625, 0.14435577392578125, 0.1502685546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 22.0, 18.0, 42.0, 61.0, 82.0, 131.0, 206.0, 313.0, 575.0, 813.0, 1450.0, 2490.0, 4326.0, 7764.0, 14812.0, 29618.0, 60416.0, 121799.0, 215829.0, 251743.0, 166475.0, 84690.0, 40642.0, 20190.0, 10496.0, 5613.0, 3133.0, 1818.0, 1101.0, 641.0, 448.0, 262.0, 168.0, 114.0, 66.0, 41.0, 30.0, 40.0, 16.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.622650146484375, -0.59979248046875, -0.576934814453125, -0.5540771484375, -0.531219482421875, -0.50836181640625, -0.485504150390625, -0.462646484375, -0.439788818359375, -0.41693115234375, -0.394073486328125, -0.3712158203125, -0.348358154296875, -0.32550048828125, -0.302642822265625, -0.27978515625, -0.256927490234375, -0.23406982421875, -0.211212158203125, -0.1883544921875, -0.165496826171875, -0.14263916015625, -0.119781494140625, -0.096923828125, -0.074066162109375, -0.05120849609375, -0.028350830078125, -0.0054931640625, 0.017364501953125, 0.04022216796875, 0.063079833984375, 0.0859375, 0.108795166015625, 0.13165283203125, 0.154510498046875, 0.1773681640625, 0.200225830078125, 0.22308349609375, 0.245941162109375, 0.268798828125, 0.291656494140625, 0.31451416015625, 0.337371826171875, 0.3602294921875, 0.383087158203125, 0.40594482421875, 0.428802490234375, 0.45166015625, 0.474517822265625, 0.49737548828125, 0.520233154296875, 0.5430908203125, 0.565948486328125, 0.58880615234375, 0.611663818359375, 0.634521484375, 0.657379150390625, 0.68023681640625, 0.703094482421875, 0.7259521484375, 0.748809814453125, 0.77166748046875, 0.794525146484375, 0.8173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 14.0, 6.0, 11.0, 14.0, 10.0, 15.0, 17.0, 21.0, 29.0, 43.0, 36.0, 43.0, 39.0, 37.0, 40.0, 47.0, 64.0, 52.0, 48.0, 48.0, 53.0, 38.0, 39.0, 48.0, 37.0, 28.0, 32.0, 20.0, 18.0, 15.0, 12.0, 3.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.57342529296875, -0.5516357421875, -0.52984619140625, -0.508056640625, -0.48626708984375, -0.4644775390625, -0.44268798828125, -0.4208984375, -0.39910888671875, -0.3773193359375, -0.35552978515625, -0.333740234375, -0.31195068359375, -0.2901611328125, -0.26837158203125, -0.24658203125, -0.22479248046875, -0.2030029296875, -0.18121337890625, -0.159423828125, -0.13763427734375, -0.1158447265625, -0.09405517578125, -0.072265625, -0.05047607421875, -0.0286865234375, -0.00689697265625, 0.014892578125, 0.03668212890625, 0.0584716796875, 0.08026123046875, 0.10205078125, 0.12384033203125, 0.1456298828125, 0.16741943359375, 0.189208984375, 0.21099853515625, 0.2327880859375, 0.25457763671875, 0.2763671875, 0.29815673828125, 0.3199462890625, 0.34173583984375, 0.363525390625, 0.38531494140625, 0.4071044921875, 0.42889404296875, 0.45068359375, 0.47247314453125, 0.4942626953125, 0.51605224609375, 0.537841796875, 0.55963134765625, 0.5814208984375, 0.60321044921875, 0.625, 0.64678955078125, 0.6685791015625, 0.69036865234375, 0.712158203125, 0.73394775390625, 0.7557373046875, 0.77752685546875, 0.79931640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 15.0, 21.0, 32.0, 31.0, 42.0, 62.0, 87.0, 169.0, 215.0, 342.0, 608.0, 1082.0, 2316.0, 4904.0, 12765.0, 42012.0, 188267.0, 534420.0, 194420.0, 43301.0, 13204.0, 5002.0, 2353.0, 1174.0, 646.0, 332.0, 246.0, 145.0, 97.0, 69.0, 35.0, 43.0, 16.0, 20.0, 14.0, 5.0, 6.0, 2.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7614593505859375, -1.699676513671875, -1.6378936767578125, -1.57611083984375, -1.5143280029296875, -1.452545166015625, -1.3907623291015625, -1.3289794921875, -1.2671966552734375, -1.205413818359375, -1.1436309814453125, -1.08184814453125, -1.0200653076171875, -0.958282470703125, -0.8964996337890625, -0.834716796875, -0.7729339599609375, -0.711151123046875, -0.6493682861328125, -0.58758544921875, -0.5258026123046875, -0.464019775390625, -0.4022369384765625, -0.3404541015625, -0.2786712646484375, -0.216888427734375, -0.1551055908203125, -0.09332275390625, -0.0315399169921875, 0.030242919921875, 0.0920257568359375, 0.15380859375, 0.2155914306640625, 0.277374267578125, 0.3391571044921875, 0.40093994140625, 0.4627227783203125, 0.524505615234375, 0.5862884521484375, 0.6480712890625, 0.7098541259765625, 0.771636962890625, 0.8334197998046875, 0.89520263671875, 0.9569854736328125, 1.018768310546875, 1.0805511474609375, 1.142333984375, 1.2041168212890625, 1.265899658203125, 1.3276824951171875, 1.38946533203125, 1.4512481689453125, 1.513031005859375, 1.5748138427734375, 1.6365966796875, 1.6983795166015625, 1.760162353515625, 1.8219451904296875, 1.88372802734375, 1.9455108642578125, 2.007293701171875, 2.0690765380859375, 2.130859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 10.0, 23.0, 12.0, 35.0, 46.0, 75.0, 92.0, 96.0, 139.0, 113.0, 114.0, 64.0, 62.0, 28.0, 34.0, 22.0, 13.0, 12.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003039836883544922, -0.0002952590584754944, -0.0002865344285964966, -0.0002778097987174988, -0.000269085168838501, -0.0002603605389595032, -0.00025163590908050537, -0.00024291127920150757, -0.00023418664932250977, -0.00022546201944351196, -0.00021673738956451416, -0.00020801275968551636, -0.00019928812980651855, -0.00019056349992752075, -0.00018183887004852295, -0.00017311424016952515, -0.00016438961029052734, -0.00015566498041152954, -0.00014694035053253174, -0.00013821572065353394, -0.00012949109077453613, -0.00012076646089553833, -0.00011204183101654053, -0.00010331720113754272, -9.459257125854492e-05, -8.586794137954712e-05, -7.714331150054932e-05, -6.841868162155151e-05, -5.969405174255371e-05, -5.096942186355591e-05, -4.2244791984558105e-05, -3.35201621055603e-05, -2.47955322265625e-05, -1.6070902347564697e-05, -7.3462724685668945e-06, 1.3783574104309082e-06, 1.0102987289428711e-05, 1.8827617168426514e-05, 2.7552247047424316e-05, 3.627687692642212e-05, 4.500150680541992e-05, 5.3726136684417725e-05, 6.245076656341553e-05, 7.117539644241333e-05, 7.990002632141113e-05, 8.862465620040894e-05, 9.734928607940674e-05, 0.00010607391595840454, 0.00011479854583740234, 0.00012352317571640015, 0.00013224780559539795, 0.00014097243547439575, 0.00014969706535339355, 0.00015842169523239136, 0.00016714632511138916, 0.00017587095499038696, 0.00018459558486938477, 0.00019332021474838257, 0.00020204484462738037, 0.00021076947450637817, 0.00021949410438537598, 0.00022821873426437378, 0.00023694336414337158, 0.0002456679940223694, 0.0002543926239013672]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 10.0, 15.0, 11.0, 23.0, 27.0, 51.0, 68.0, 96.0, 162.0, 228.0, 406.0, 587.0, 976.0, 1801.0, 3465.0, 6727.0, 14791.0, 35825.0, 102464.0, 286168.0, 355432.0, 149761.0, 50495.0, 19989.0, 8859.0, 4342.0, 2364.0, 1322.0, 730.0, 475.0, 316.0, 186.0, 121.0, 92.0, 47.0, 40.0, 17.0, 21.0, 18.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.030120849609375, -0.99481201171875, -0.959503173828125, -0.9241943359375, -0.888885498046875, -0.85357666015625, -0.818267822265625, -0.782958984375, -0.747650146484375, -0.71234130859375, -0.677032470703125, -0.6417236328125, -0.606414794921875, -0.57110595703125, -0.535797119140625, -0.50048828125, -0.465179443359375, -0.42987060546875, -0.394561767578125, -0.3592529296875, -0.323944091796875, -0.28863525390625, -0.253326416015625, -0.218017578125, -0.182708740234375, -0.14739990234375, -0.112091064453125, -0.0767822265625, -0.041473388671875, -0.00616455078125, 0.029144287109375, 0.064453125, 0.099761962890625, 0.13507080078125, 0.170379638671875, 0.2056884765625, 0.240997314453125, 0.27630615234375, 0.311614990234375, 0.346923828125, 0.382232666015625, 0.41754150390625, 0.452850341796875, 0.4881591796875, 0.523468017578125, 0.55877685546875, 0.594085693359375, 0.62939453125, 0.664703369140625, 0.70001220703125, 0.735321044921875, 0.7706298828125, 0.805938720703125, 0.84124755859375, 0.876556396484375, 0.911865234375, 0.947174072265625, 0.98248291015625, 1.017791748046875, 1.0531005859375, 1.088409423828125, 1.12371826171875, 1.159027099609375, 1.1943359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 7.0, 16.0, 13.0, 14.0, 13.0, 37.0, 43.0, 44.0, 47.0, 45.0, 66.0, 58.0, 48.0, 66.0, 64.0, 54.0, 48.0, 41.0, 34.0, 35.0, 40.0, 30.0, 19.0, 20.0, 18.0, 11.0, 8.0, 6.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5383148193359375, -0.519500732421875, -0.5006866455078125, -0.48187255859375, -0.4630584716796875, -0.444244384765625, -0.4254302978515625, -0.4066162109375, -0.3878021240234375, -0.368988037109375, -0.3501739501953125, -0.33135986328125, -0.3125457763671875, -0.293731689453125, -0.2749176025390625, -0.256103515625, -0.2372894287109375, -0.218475341796875, -0.1996612548828125, -0.18084716796875, -0.1620330810546875, -0.143218994140625, -0.1244049072265625, -0.1055908203125, -0.0867767333984375, -0.067962646484375, -0.0491485595703125, -0.03033447265625, -0.0115203857421875, 0.007293701171875, 0.0261077880859375, 0.044921875, 0.0637359619140625, 0.082550048828125, 0.1013641357421875, 0.12017822265625, 0.1389923095703125, 0.157806396484375, 0.1766204833984375, 0.1954345703125, 0.2142486572265625, 0.233062744140625, 0.2518768310546875, 0.27069091796875, 0.2895050048828125, 0.308319091796875, 0.3271331787109375, 0.345947265625, 0.3647613525390625, 0.383575439453125, 0.4023895263671875, 0.42120361328125, 0.4400177001953125, 0.458831787109375, 0.4776458740234375, 0.4964599609375, 0.5152740478515625, 0.534088134765625, 0.5529022216796875, 0.57171630859375, 0.5905303955078125, 0.609344482421875, 0.6281585693359375, 0.64697265625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 16.0, 48.0, 141.0, 275.0, 249.0, 146.0, 56.0, 26.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.348570823669434, -14.780890464782715, -14.213211059570312, -13.645530700683594, -13.077851295471191, -12.510170936584473, -11.94249153137207, -11.374811172485352, -10.807130813598633, -10.239450454711914, -9.671771049499512, -9.104090690612793, -8.53641128540039, -7.968730926513672, -7.401051044464111, -6.833371162414551, -6.265691757202148, -5.698011875152588, -5.130331993103027, -4.562651634216309, -3.994971990585327, -3.4272921085357666, -2.859611988067627, -2.2919321060180664, -1.7242522239685059, -1.1565723419189453, -0.5888923406600952, -0.021212339401245117, 0.5464675426483154, 1.114147424697876, 1.6818275451660156, 2.249507427215576, 2.817188262939453, 3.3848681449890137, 3.952548027038574, 4.520228385925293, 5.087907791137695, 5.655588150024414, 6.223268032073975, 6.790947914123535, 7.358627796173096, 7.926307678222656, 8.493988037109375, 9.061667442321777, 9.629347801208496, 10.197027206420898, 10.764707565307617, 11.332387924194336, 11.900067329406738, 12.467747688293457, 13.03542709350586, 13.603107452392578, 14.17078685760498, 14.7384672164917, 15.306146621704102, 15.87382698059082, 16.44150733947754, 17.009187698364258, 17.576868057250977, 18.144546508789062, 18.71222686767578, 19.2799072265625, 19.84758758544922, 20.415267944335938, 20.982946395874023]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 5.0, 5.0, 13.0, 14.0, 20.0, 26.0, 33.0, 50.0, 65.0, 64.0, 80.0, 97.0, 94.0, 74.0, 90.0, 62.0, 53.0, 37.0, 34.0, 16.0, 19.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.967996120452881, -7.727425575256348, -7.486854553222656, -7.246284008026123, -7.00571346282959, -6.765142440795898, -6.524571895599365, -6.284001350402832, -6.043430328369141, -5.802859783172607, -5.562288761138916, -5.321718215942383, -5.08114767074585, -4.840577125549316, -4.600006103515625, -4.359435558319092, -4.118865013122559, -3.8782942295074463, -3.637723684310913, -3.397152900695801, -3.1565823554992676, -2.9160115718841553, -2.675440788269043, -2.4348702430725098, -2.1942994594573975, -1.9537287950515747, -1.713158130645752, -1.4725873470306396, -1.232016682624817, -0.9914460182189941, -0.7508752346038818, -0.5103045701980591, -0.2697334289550781, -0.029162734746932983, 0.21140795946121216, 0.4519786834716797, 0.6925493478775024, 0.9331200122833252, 1.1736907958984375, 1.4142614603042603, 1.654832124710083, 1.8954027891159058, 2.1359734535217285, 2.376544237136841, 2.617115020751953, 2.8576855659484863, 3.0982563495635986, 3.338827133178711, 3.579397678375244, 3.8199684619903564, 4.060539245605469, 4.301109790802002, 4.541680335998535, 4.782251358032227, 5.02282190322876, 5.263392448425293, 5.503963470458984, 5.744534015655518, 5.985105037689209, 6.225675582885742, 6.466246128082275, 6.706816673278809, 6.9473876953125, 7.187958240509033, 7.428528785705566]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 33.0, 35.0, 58.0, 103.0, 154.0, 265.0, 470.0, 977.0, 2041.0, 5219.0, 17439.0, 93870.0, 3687606.0, 336086.0, 35126.0, 8715.0, 3115.0, 1362.0, 698.0, 345.0, 171.0, 111.0, 82.0, 55.0, 23.0, 20.0, 11.0, 14.0, 15.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.664031982421875, -2.56439208984375, -2.464752197265625, -2.3651123046875, -2.265472412109375, -2.16583251953125, -2.066192626953125, -1.966552734375, -1.866912841796875, -1.76727294921875, -1.667633056640625, -1.5679931640625, -1.468353271484375, -1.36871337890625, -1.269073486328125, -1.16943359375, -1.069793701171875, -0.97015380859375, -0.870513916015625, -0.7708740234375, -0.671234130859375, -0.57159423828125, -0.471954345703125, -0.372314453125, -0.272674560546875, -0.17303466796875, -0.073394775390625, 0.0262451171875, 0.125885009765625, 0.22552490234375, 0.325164794921875, 0.4248046875, 0.524444580078125, 0.62408447265625, 0.723724365234375, 0.8233642578125, 0.923004150390625, 1.02264404296875, 1.122283935546875, 1.221923828125, 1.321563720703125, 1.42120361328125, 1.520843505859375, 1.6204833984375, 1.720123291015625, 1.81976318359375, 1.919403076171875, 2.01904296875, 2.118682861328125, 2.21832275390625, 2.317962646484375, 2.4176025390625, 2.517242431640625, 2.61688232421875, 2.716522216796875, 2.816162109375, 2.915802001953125, 3.01544189453125, 3.115081787109375, 3.2147216796875, 3.314361572265625, 3.41400146484375, 3.513641357421875, 3.61328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 10.0, 14.0, 27.0, 43.0, 63.0, 69.0, 89.0, 105.0, 114.0, 98.0, 86.0, 75.0, 51.0, 45.0, 23.0, 11.0, 17.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2812824249267578, -0.2744789123535156, -0.26767539978027344, -0.26087188720703125, -0.25406837463378906, -0.24726486206054688, -0.2404613494873047, -0.2336578369140625, -0.2268543243408203, -0.22005081176757812, -0.21324729919433594, -0.20644378662109375, -0.19964027404785156, -0.19283676147460938, -0.1860332489013672, -0.179229736328125, -0.1724262237548828, -0.16562271118164062, -0.15881919860839844, -0.15201568603515625, -0.14521217346191406, -0.13840866088867188, -0.1316051483154297, -0.1248016357421875, -0.11799812316894531, -0.11119461059570312, -0.10439109802246094, -0.09758758544921875, -0.09078407287597656, -0.08398056030273438, -0.07717704772949219, -0.07037353515625, -0.06357002258300781, -0.056766510009765625, -0.04996299743652344, -0.04315948486328125, -0.03635597229003906, -0.029552459716796875, -0.022748947143554688, -0.0159454345703125, -0.009141921997070312, -0.002338409423828125, 0.0044651031494140625, 0.01126861572265625, 0.018072128295898438, 0.024875640869140625, 0.03167915344238281, 0.038482666015625, 0.04528617858886719, 0.052089691162109375, 0.05889320373535156, 0.06569671630859375, 0.07250022888183594, 0.07930374145507812, 0.08610725402832031, 0.0929107666015625, 0.09971427917480469, 0.10651779174804688, 0.11332130432128906, 0.12012481689453125, 0.12692832946777344, 0.13373184204101562, 0.1405353546142578, 0.1473388671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 12.0, 9.0, 17.0, 38.0, 50.0, 82.0, 182.0, 376.0, 990.0, 2679.0, 9141.0, 38751.0, 308880.0, 3593187.0, 198950.0, 29438.0, 7610.0, 2347.0, 812.0, 344.0, 140.0, 88.0, 54.0, 29.0, 23.0, 20.0, 7.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.786834716796875, -2.67718505859375, -2.567535400390625, -2.4578857421875, -2.348236083984375, -2.23858642578125, -2.128936767578125, -2.019287109375, -1.909637451171875, -1.79998779296875, -1.690338134765625, -1.5806884765625, -1.471038818359375, -1.36138916015625, -1.251739501953125, -1.14208984375, -1.032440185546875, -0.92279052734375, -0.813140869140625, -0.7034912109375, -0.593841552734375, -0.48419189453125, -0.374542236328125, -0.264892578125, -0.155242919921875, -0.04559326171875, 0.064056396484375, 0.1737060546875, 0.283355712890625, 0.39300537109375, 0.502655029296875, 0.6123046875, 0.721954345703125, 0.83160400390625, 0.941253662109375, 1.0509033203125, 1.160552978515625, 1.27020263671875, 1.379852294921875, 1.489501953125, 1.599151611328125, 1.70880126953125, 1.818450927734375, 1.9281005859375, 2.037750244140625, 2.14739990234375, 2.257049560546875, 2.36669921875, 2.476348876953125, 2.58599853515625, 2.695648193359375, 2.8052978515625, 2.914947509765625, 3.02459716796875, 3.134246826171875, 3.243896484375, 3.353546142578125, 3.46319580078125, 3.572845458984375, 3.6824951171875, 3.792144775390625, 3.90179443359375, 4.011444091796875, 4.12109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 3.0, 4.0, 15.0, 15.0, 25.0, 22.0, 35.0, 49.0, 79.0, 117.0, 209.0, 340.0, 809.0, 1414.0, 375.0, 153.0, 125.0, 85.0, 60.0, 42.0, 21.0, 14.0, 15.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.438232421875, -0.426422119140625, -0.41461181640625, -0.402801513671875, -0.3909912109375, -0.379180908203125, -0.36737060546875, -0.355560302734375, -0.34375, -0.331939697265625, -0.32012939453125, -0.308319091796875, -0.2965087890625, -0.284698486328125, -0.27288818359375, -0.261077880859375, -0.249267578125, -0.237457275390625, -0.22564697265625, -0.213836669921875, -0.2020263671875, -0.190216064453125, -0.17840576171875, -0.166595458984375, -0.15478515625, -0.142974853515625, -0.13116455078125, -0.119354248046875, -0.1075439453125, -0.095733642578125, -0.08392333984375, -0.072113037109375, -0.060302734375, -0.048492431640625, -0.03668212890625, -0.024871826171875, -0.0130615234375, -0.001251220703125, 0.01055908203125, 0.022369384765625, 0.0341796875, 0.045989990234375, 0.05780029296875, 0.069610595703125, 0.0814208984375, 0.093231201171875, 0.10504150390625, 0.116851806640625, 0.128662109375, 0.140472412109375, 0.15228271484375, 0.164093017578125, 0.1759033203125, 0.187713623046875, 0.19952392578125, 0.211334228515625, 0.22314453125, 0.234954833984375, 0.24676513671875, 0.258575439453125, 0.2703857421875, 0.282196044921875, 0.29400634765625, 0.305816650390625, 0.317626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 17.0, 24.0, 35.0, 70.0, 122.0, 158.0, 186.0, 140.0, 103.0, 56.0, 29.0, 26.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874171495437622, -3.7760050296783447, -3.6778385639190674, -3.57967209815979, -3.4815056324005127, -3.3833391666412354, -3.285172939300537, -3.1870064735412598, -3.0888400077819824, -2.990673542022705, -2.8925070762634277, -2.7943406105041504, -2.696174144744873, -2.5980076789855957, -2.4998412132263184, -2.401674747467041, -2.3035082817077637, -2.2053418159484863, -2.107175350189209, -2.0090088844299316, -1.9108424186706543, -1.812675952911377, -1.7145096063613892, -1.6163431406021118, -1.5181766748428345, -1.4200102090835571, -1.3218437433242798, -1.223677396774292, -1.1255109310150146, -1.0273444652557373, -0.92917799949646, -0.8310115337371826, -0.7328448295593262, -0.6346783638000488, -0.5365118980407715, -0.4383454918861389, -0.3401790261268616, -0.24201256036758423, -0.14384615421295166, -0.045679688453674316, 0.05248677730560303, 0.15065322816371918, 0.24881967902183533, 0.3469861149787903, 0.4451525807380676, 0.543319046497345, 0.6414854526519775, 0.7396519184112549, 0.8378183841705322, 0.9359848499298096, 1.034151315689087, 1.1323177814483643, 1.2304842472076416, 1.328650712966919, 1.4268170595169067, 1.524983525276184, 1.6231499910354614, 1.7213164567947388, 1.8194829225540161, 1.917649269104004, 2.0158157348632812, 2.1139822006225586, 2.212148666381836, 2.3103151321411133, 2.4084815979003906]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 1.0, 6.0, 2.0, 12.0, 10.0, 13.0, 13.0, 21.0, 24.0, 27.0, 37.0, 32.0, 26.0, 49.0, 50.0, 46.0, 57.0, 63.0, 56.0, 53.0, 43.0, 41.0, 38.0, 40.0, 35.0, 40.0, 31.0, 23.0, 19.0, 13.0, 17.0, 12.0, 8.0, 5.0, 8.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.244240164756775, -1.2038975954055786, -1.1635550260543823, -1.123212456703186, -1.0828698873519897, -1.0425273180007935, -1.0021847486495972, -0.9618421196937561, -0.9214995503425598, -0.8811569809913635, -0.8408144116401672, -0.800471842288971, -0.7601292133331299, -0.7197866439819336, -0.6794440746307373, -0.639101505279541, -0.5987589359283447, -0.5584163665771484, -0.5180737972259521, -0.47773119807243347, -0.4373886287212372, -0.3970460593700409, -0.3567034602165222, -0.3163608908653259, -0.27601832151412964, -0.23567575216293335, -0.19533316791057587, -0.15499058365821838, -0.1146480143070221, -0.0743054449558258, -0.03396286070346832, 0.00637972354888916, 0.0467221736907959, 0.08706475049257278, 0.12740732729434967, 0.16774991154670715, 0.20809248089790344, 0.24843505024909973, 0.2887776494026184, 0.3291202187538147, 0.369462788105011, 0.4098053574562073, 0.45014792680740356, 0.49049052596092224, 0.5308331251144409, 0.5711756944656372, 0.6115182638168335, 0.6518608331680298, 0.6922034025192261, 0.7325459718704224, 0.7728885412216187, 0.8132311105728149, 0.8535736799240112, 0.8939162492752075, 0.9342588782310486, 0.9746014475822449, 1.014944076538086, 1.0552866458892822, 1.0956292152404785, 1.1359717845916748, 1.176314353942871, 1.2166569232940674, 1.2569994926452637, 1.29734206199646, 1.3376846313476562]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 10.0, 17.0, 19.0, 21.0, 53.0, 67.0, 101.0, 190.0, 361.0, 668.0, 1462.0, 3100.0, 8025.0, 24809.0, 90365.0, 315545.0, 407902.0, 139827.0, 36771.0, 11261.0, 4186.0, 1835.0, 881.0, 431.0, 249.0, 129.0, 81.0, 60.0, 33.0, 19.0, 19.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.687225341796875, -1.63128662109375, -1.575347900390625, -1.5194091796875, -1.463470458984375, -1.40753173828125, -1.351593017578125, -1.295654296875, -1.239715576171875, -1.18377685546875, -1.127838134765625, -1.0718994140625, -1.015960693359375, -0.96002197265625, -0.904083251953125, -0.84814453125, -0.792205810546875, -0.73626708984375, -0.680328369140625, -0.6243896484375, -0.568450927734375, -0.51251220703125, -0.456573486328125, -0.400634765625, -0.344696044921875, -0.28875732421875, -0.232818603515625, -0.1768798828125, -0.120941162109375, -0.06500244140625, -0.009063720703125, 0.046875, 0.102813720703125, 0.15875244140625, 0.214691162109375, 0.2706298828125, 0.326568603515625, 0.38250732421875, 0.438446044921875, 0.494384765625, 0.550323486328125, 0.60626220703125, 0.662200927734375, 0.7181396484375, 0.774078369140625, 0.83001708984375, 0.885955810546875, 0.94189453125, 0.997833251953125, 1.05377197265625, 1.109710693359375, 1.1656494140625, 1.221588134765625, 1.27752685546875, 1.333465576171875, 1.389404296875, 1.445343017578125, 1.50128173828125, 1.557220458984375, 1.6131591796875, 1.669097900390625, 1.72503662109375, 1.780975341796875, 1.8369140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 8.0, 2.0, 11.0, 16.0, 24.0, 34.0, 52.0, 60.0, 93.0, 86.0, 116.0, 98.0, 106.0, 81.0, 63.0, 45.0, 42.0, 23.0, 15.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.314453125, -0.30727577209472656, -0.3000984191894531, -0.2929210662841797, -0.28574371337890625, -0.2785663604736328, -0.2713890075683594, -0.26421165466308594, -0.2570343017578125, -0.24985694885253906, -0.24267959594726562, -0.2355022430419922, -0.22832489013671875, -0.2211475372314453, -0.21397018432617188, -0.20679283142089844, -0.199615478515625, -0.19243812561035156, -0.18526077270507812, -0.1780834197998047, -0.17090606689453125, -0.1637287139892578, -0.15655136108398438, -0.14937400817871094, -0.1421966552734375, -0.13501930236816406, -0.12784194946289062, -0.12066459655761719, -0.11348724365234375, -0.10630989074707031, -0.09913253784179688, -0.09195518493652344, -0.08477783203125, -0.07760047912597656, -0.07042312622070312, -0.06324577331542969, -0.05606842041015625, -0.04889106750488281, -0.041713714599609375, -0.03453636169433594, -0.0273590087890625, -0.020181655883789062, -0.013004302978515625, -0.0058269500732421875, 0.00135040283203125, 0.008527755737304688, 0.015705108642578125, 0.022882461547851562, 0.030059814453125, 0.03723716735839844, 0.044414520263671875, 0.05159187316894531, 0.05876922607421875, 0.06594657897949219, 0.07312393188476562, 0.08030128479003906, 0.0874786376953125, 0.09465599060058594, 0.10183334350585938, 0.10901069641113281, 0.11618804931640625, 0.12336540222167969, 0.13054275512695312, 0.13772010803222656, 0.1448974609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 17.0, 24.0, 20.0, 31.0, 43.0, 63.0, 85.0, 110.0, 179.0, 232.0, 352.0, 487.0, 825.0, 1179.0, 1966.0, 3233.0, 6128.0, 12271.0, 26091.0, 56896.0, 120543.0, 217341.0, 257275.0, 174331.0, 88369.0, 40903.0, 18921.0, 8970.0, 4624.0, 2582.0, 1444.0, 943.0, 599.0, 445.0, 326.0, 200.0, 146.0, 94.0, 69.0, 50.0, 36.0, 36.0, 17.0, 18.0, 8.0, 6.0, 4.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.017578125, -0.983978271484375, -0.95037841796875, -0.916778564453125, -0.8831787109375, -0.849578857421875, -0.81597900390625, -0.782379150390625, -0.748779296875, -0.715179443359375, -0.68157958984375, -0.647979736328125, -0.6143798828125, -0.580780029296875, -0.54718017578125, -0.513580322265625, -0.47998046875, -0.446380615234375, -0.41278076171875, -0.379180908203125, -0.3455810546875, -0.311981201171875, -0.27838134765625, -0.244781494140625, -0.211181640625, -0.177581787109375, -0.14398193359375, -0.110382080078125, -0.0767822265625, -0.043182373046875, -0.00958251953125, 0.024017333984375, 0.0576171875, 0.091217041015625, 0.12481689453125, 0.158416748046875, 0.1920166015625, 0.225616455078125, 0.25921630859375, 0.292816162109375, 0.326416015625, 0.360015869140625, 0.39361572265625, 0.427215576171875, 0.4608154296875, 0.494415283203125, 0.52801513671875, 0.561614990234375, 0.59521484375, 0.628814697265625, 0.66241455078125, 0.696014404296875, 0.7296142578125, 0.763214111328125, 0.79681396484375, 0.830413818359375, 0.864013671875, 0.897613525390625, 0.93121337890625, 0.964813232421875, 0.9984130859375, 1.032012939453125, 1.06561279296875, 1.099212646484375, 1.1328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 10.0, 13.0, 21.0, 12.0, 14.0, 24.0, 30.0, 29.0, 45.0, 29.0, 34.0, 46.0, 46.0, 50.0, 51.0, 50.0, 47.0, 49.0, 49.0, 57.0, 56.0, 32.0, 34.0, 27.0, 20.0, 26.0, 17.0, 13.0, 11.0, 12.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8062210083007812, -0.7769927978515625, -0.7477645874023438, -0.718536376953125, -0.6893081665039062, -0.6600799560546875, -0.6308517456054688, -0.60162353515625, -0.5723953247070312, -0.5431671142578125, -0.5139389038085938, -0.484710693359375, -0.45548248291015625, -0.4262542724609375, -0.39702606201171875, -0.3677978515625, -0.33856964111328125, -0.3093414306640625, -0.28011322021484375, -0.250885009765625, -0.22165679931640625, -0.1924285888671875, -0.16320037841796875, -0.13397216796875, -0.10474395751953125, -0.0755157470703125, -0.04628753662109375, -0.017059326171875, 0.01216888427734375, 0.0413970947265625, 0.07062530517578125, 0.099853515625, 0.12908172607421875, 0.1583099365234375, 0.18753814697265625, 0.216766357421875, 0.24599456787109375, 0.2752227783203125, 0.30445098876953125, 0.33367919921875, 0.36290740966796875, 0.3921356201171875, 0.42136383056640625, 0.450592041015625, 0.47982025146484375, 0.5090484619140625, 0.5382766723632812, 0.5675048828125, 0.5967330932617188, 0.6259613037109375, 0.6551895141601562, 0.684417724609375, 0.7136459350585938, 0.7428741455078125, 0.7721023559570312, 0.80133056640625, 0.8305587768554688, 0.8597869873046875, 0.8890151977539062, 0.918243408203125, 0.9474716186523438, 0.9766998291015625, 1.0059280395507812, 1.03515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 7.0, 7.0, 18.0, 11.0, 20.0, 42.0, 60.0, 82.0, 137.0, 228.0, 414.0, 757.0, 1356.0, 2935.0, 6442.0, 15799.0, 41630.0, 115697.0, 274811.0, 326209.0, 163329.0, 60066.0, 22086.0, 8710.0, 3772.0, 1871.0, 864.0, 467.0, 283.0, 148.0, 105.0, 73.0, 35.0, 24.0, 18.0, 9.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9150390625, -0.8856887817382812, -0.8563385009765625, -0.8269882202148438, -0.797637939453125, -0.7682876586914062, -0.7389373779296875, -0.7095870971679688, -0.68023681640625, -0.6508865356445312, -0.6215362548828125, -0.5921859741210938, -0.562835693359375, -0.5334854125976562, -0.5041351318359375, -0.47478485107421875, -0.4454345703125, -0.41608428955078125, -0.3867340087890625, -0.35738372802734375, -0.328033447265625, -0.29868316650390625, -0.2693328857421875, -0.23998260498046875, -0.21063232421875, -0.18128204345703125, -0.1519317626953125, -0.12258148193359375, -0.093231201171875, -0.06388092041015625, -0.0345306396484375, -0.00518035888671875, 0.024169921875, 0.05352020263671875, 0.0828704833984375, 0.11222076416015625, 0.141571044921875, 0.17092132568359375, 0.2002716064453125, 0.22962188720703125, 0.25897216796875, 0.28832244873046875, 0.3176727294921875, 0.34702301025390625, 0.376373291015625, 0.40572357177734375, 0.4350738525390625, 0.46442413330078125, 0.4937744140625, 0.5231246948242188, 0.5524749755859375, 0.5818252563476562, 0.611175537109375, 0.6405258178710938, 0.6698760986328125, 0.6992263793945312, 0.72857666015625, 0.7579269409179688, 0.7872772216796875, 0.8166275024414062, 0.845977783203125, 0.8753280639648438, 0.9046783447265625, 0.9340286254882812, 0.96337890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 2.0, 9.0, 5.0, 12.0, 9.0, 33.0, 31.0, 25.0, 37.0, 34.0, 41.0, 50.0, 66.0, 61.0, 59.0, 66.0, 68.0, 52.0, 65.0, 48.0, 40.0, 32.0, 29.0, 30.0, 21.0, 16.0, 8.0, 15.0, 11.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000148773193359375, -0.00014415383338928223, -0.00013953447341918945, -0.00013491511344909668, -0.0001302957534790039, -0.00012567639350891113, -0.00012105703353881836, -0.00011643767356872559, -0.00011181831359863281, -0.00010719895362854004, -0.00010257959365844727, -9.796023368835449e-05, -9.334087371826172e-05, -8.872151374816895e-05, -8.410215377807617e-05, -7.94827938079834e-05, -7.486343383789062e-05, -7.024407386779785e-05, -6.562471389770508e-05, -6.1005353927612305e-05, -5.638599395751953e-05, -5.176663398742676e-05, -4.7147274017333984e-05, -4.252791404724121e-05, -3.790855407714844e-05, -3.3289194107055664e-05, -2.866983413696289e-05, -2.4050474166870117e-05, -1.9431114196777344e-05, -1.481175422668457e-05, -1.0192394256591797e-05, -5.5730342864990234e-06, -9.5367431640625e-07, 3.6656856536865234e-06, 8.285045623779297e-06, 1.290440559387207e-05, 1.7523765563964844e-05, 2.2143125534057617e-05, 2.676248550415039e-05, 3.1381845474243164e-05, 3.600120544433594e-05, 4.062056541442871e-05, 4.5239925384521484e-05, 4.985928535461426e-05, 5.447864532470703e-05, 5.9098005294799805e-05, 6.371736526489258e-05, 6.833672523498535e-05, 7.295608520507812e-05, 7.75754451751709e-05, 8.219480514526367e-05, 8.681416511535645e-05, 9.143352508544922e-05, 9.605288505554199e-05, 0.00010067224502563477, 0.00010529160499572754, 0.00010991096496582031, 0.00011453032493591309, 0.00011914968490600586, 0.00012376904487609863, 0.0001283884048461914, 0.00013300776481628418, 0.00013762712478637695, 0.00014224648475646973, 0.0001468658447265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 8.0, 7.0, 11.0, 21.0, 26.0, 33.0, 48.0, 86.0, 139.0, 222.0, 285.0, 501.0, 827.0, 1456.0, 2917.0, 6072.0, 14643.0, 39042.0, 120363.0, 350517.0, 335747.0, 112734.0, 36969.0, 13965.0, 5855.0, 2632.0, 1368.0, 771.0, 422.0, 283.0, 185.0, 127.0, 68.0, 58.0, 45.0, 23.0, 19.0, 13.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.30078125, -1.264617919921875, -1.22845458984375, -1.192291259765625, -1.1561279296875, -1.119964599609375, -1.08380126953125, -1.047637939453125, -1.011474609375, -0.975311279296875, -0.93914794921875, -0.902984619140625, -0.8668212890625, -0.830657958984375, -0.79449462890625, -0.758331298828125, -0.72216796875, -0.686004638671875, -0.64984130859375, -0.613677978515625, -0.5775146484375, -0.541351318359375, -0.50518798828125, -0.469024658203125, -0.432861328125, -0.396697998046875, -0.36053466796875, -0.324371337890625, -0.2882080078125, -0.252044677734375, -0.21588134765625, -0.179718017578125, -0.1435546875, -0.107391357421875, -0.07122802734375, -0.035064697265625, 0.0010986328125, 0.037261962890625, 0.07342529296875, 0.109588623046875, 0.145751953125, 0.181915283203125, 0.21807861328125, 0.254241943359375, 0.2904052734375, 0.326568603515625, 0.36273193359375, 0.398895263671875, 0.43505859375, 0.471221923828125, 0.50738525390625, 0.543548583984375, 0.5797119140625, 0.615875244140625, 0.65203857421875, 0.688201904296875, 0.724365234375, 0.760528564453125, 0.79669189453125, 0.832855224609375, 0.8690185546875, 0.905181884765625, 0.94134521484375, 0.977508544921875, 1.013671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 3.0, 7.0, 9.0, 17.0, 15.0, 19.0, 26.0, 31.0, 29.0, 25.0, 28.0, 37.0, 47.0, 50.0, 46.0, 61.0, 56.0, 55.0, 45.0, 54.0, 50.0, 46.0, 39.0, 29.0, 36.0, 21.0, 26.0, 15.0, 11.0, 9.0, 10.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.62646484375, -0.6099624633789062, -0.5934600830078125, -0.5769577026367188, -0.560455322265625, -0.5439529418945312, -0.5274505615234375, -0.5109481811523438, -0.49444580078125, -0.47794342041015625, -0.4614410400390625, -0.44493865966796875, -0.428436279296875, -0.41193389892578125, -0.3954315185546875, -0.37892913818359375, -0.3624267578125, -0.34592437744140625, -0.3294219970703125, -0.31291961669921875, -0.296417236328125, -0.27991485595703125, -0.2634124755859375, -0.24691009521484375, -0.23040771484375, -0.21390533447265625, -0.1974029541015625, -0.18090057373046875, -0.164398193359375, -0.14789581298828125, -0.1313934326171875, -0.11489105224609375, -0.098388671875, -0.08188629150390625, -0.0653839111328125, -0.04888153076171875, -0.032379150390625, -0.01587677001953125, 0.0006256103515625, 0.01712799072265625, 0.03363037109375, 0.05013275146484375, 0.0666351318359375, 0.08313751220703125, 0.099639892578125, 0.11614227294921875, 0.1326446533203125, 0.14914703369140625, 0.1656494140625, 0.18215179443359375, 0.1986541748046875, 0.21515655517578125, 0.231658935546875, 0.24816131591796875, 0.2646636962890625, 0.28116607666015625, 0.29766845703125, 0.31417083740234375, 0.3306732177734375, 0.34717559814453125, 0.363677978515625, 0.38018035888671875, 0.3966827392578125, 0.41318511962890625, 0.4296875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 12.0, 12.0, 27.0, 38.0, 63.0, 78.0, 103.0, 117.0, 133.0, 112.0, 85.0, 66.0, 45.0, 33.0, 22.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.11367416381836, -9.795899391174316, -9.478123664855957, -9.160348892211914, -8.842574119567871, -8.524798393249512, -8.207023620605469, -7.889248371124268, -7.571473121643066, -7.253697872161865, -6.935923099517822, -6.618147850036621, -6.30037260055542, -5.982597351074219, -5.664822578430176, -5.347047328948975, -5.029272556304932, -4.7114973068237305, -4.3937225341796875, -4.075947284698486, -3.758172035217285, -3.440397024154663, -3.122622013092041, -2.80484676361084, -2.4870717525482178, -2.1692967414855957, -1.8515214920043945, -1.5337464809417725, -1.2159713506698608, -0.8981962203979492, -0.5804212093353271, -0.262645959854126, 0.055129051208496094, 0.3729041516780853, 0.6906792521476746, 1.0084543228149414, 1.326229453086853, 1.6440045833587646, 1.9617795944213867, 2.279554843902588, 2.59732985496521, 2.915104866027832, 3.232880115509033, 3.5506551265716553, 3.8684301376342773, 4.1862053871154785, 4.50398063659668, 4.821755409240723, 5.139530658721924, 5.457305908203125, 5.775080680847168, 6.092855930328369, 6.41063117980957, 6.728405952453613, 7.0461812019348145, 7.363956451416016, 7.681731224060059, 7.99950647354126, 8.317281723022461, 8.635056495666504, 8.952831268310547, 9.270606994628906, 9.58838176727295, 9.906156539916992, 10.223932266235352]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 12.0, 14.0, 28.0, 20.0, 33.0, 38.0, 52.0, 45.0, 55.0, 59.0, 74.0, 75.0, 75.0, 55.0, 66.0, 73.0, 37.0, 47.0, 31.0, 18.0, 31.0, 22.0, 14.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21395206451416, -8.920344352722168, -8.62673568725586, -8.333127975463867, -8.039520263671875, -7.745912551879883, -7.452304363250732, -7.158696174621582, -6.86508846282959, -6.571480751037598, -6.277872562408447, -5.984264373779297, -5.690656661987305, -5.3970489501953125, -5.103440761566162, -4.809832572937012, -4.5162248611450195, -4.222617149353027, -3.929008960723877, -3.6354010105133057, -3.3417930603027344, -3.048185110092163, -2.754577159881592, -2.4609692096710205, -2.167361259460449, -1.873753309249878, -1.5801453590393066, -1.2865374088287354, -0.9929294586181641, -0.6993215084075928, -0.4057135581970215, -0.1121056079864502, 0.1815013885498047, 0.475109338760376, 0.7687172889709473, 1.0623252391815186, 1.3559331893920898, 1.6495411396026611, 1.9431490898132324, 2.2367570400238037, 2.530364990234375, 2.8239729404449463, 3.1175808906555176, 3.411188840866089, 3.70479679107666, 3.9984047412872314, 4.292012691497803, 4.585620880126953, 4.879228591918945, 5.1728363037109375, 5.466444492340088, 5.760052680969238, 6.0536603927612305, 6.347268104553223, 6.640876293182373, 6.934484481811523, 7.228092193603516, 7.521699905395508, 7.815308094024658, 8.108916282653809, 8.4025239944458, 8.696131706237793, 8.989740371704102, 9.283348083496094, 9.576955795288086]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 16.0, 17.0, 34.0, 59.0, 87.0, 194.0, 419.0, 1161.0, 4756.0, 43750.0, 3960593.0, 170305.0, 9949.0, 1874.0, 578.0, 232.0, 115.0, 56.0, 23.0, 17.0, 12.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.92431640625, -5.7822265625, -5.64013671875, -5.498046875, -5.35595703125, -5.2138671875, -5.07177734375, -4.9296875, -4.78759765625, -4.6455078125, -4.50341796875, -4.361328125, -4.21923828125, -4.0771484375, -3.93505859375, -3.79296875, -3.65087890625, -3.5087890625, -3.36669921875, -3.224609375, -3.08251953125, -2.9404296875, -2.79833984375, -2.65625, -2.51416015625, -2.3720703125, -2.22998046875, -2.087890625, -1.94580078125, -1.8037109375, -1.66162109375, -1.51953125, -1.37744140625, -1.2353515625, -1.09326171875, -0.951171875, -0.80908203125, -0.6669921875, -0.52490234375, -0.3828125, -0.24072265625, -0.0986328125, 0.04345703125, 0.185546875, 0.32763671875, 0.4697265625, 0.61181640625, 0.75390625, 0.89599609375, 1.0380859375, 1.18017578125, 1.322265625, 1.46435546875, 1.6064453125, 1.74853515625, 1.890625, 2.03271484375, 2.1748046875, 2.31689453125, 2.458984375, 2.60107421875, 2.7431640625, 2.88525390625, 3.02734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 8.0, 11.0, 31.0, 33.0, 57.0, 63.0, 93.0, 82.0, 104.0, 113.0, 107.0, 92.0, 64.0, 40.0, 38.0, 18.0, 16.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.457763671875, -0.4475383758544922, -0.4373130798339844, -0.42708778381347656, -0.41686248779296875, -0.40663719177246094, -0.3964118957519531, -0.3861865997314453, -0.3759613037109375, -0.3657360076904297, -0.3555107116699219, -0.34528541564941406, -0.33506011962890625, -0.32483482360839844, -0.3146095275878906, -0.3043842315673828, -0.294158935546875, -0.2839336395263672, -0.2737083435058594, -0.26348304748535156, -0.25325775146484375, -0.24303245544433594, -0.23280715942382812, -0.2225818634033203, -0.2123565673828125, -0.2021312713623047, -0.19190597534179688, -0.18168067932128906, -0.17145538330078125, -0.16123008728027344, -0.15100479125976562, -0.1407794952392578, -0.13055419921875, -0.12032890319824219, -0.11010360717773438, -0.09987831115722656, -0.08965301513671875, -0.07942771911621094, -0.06920242309570312, -0.05897712707519531, -0.0487518310546875, -0.03852653503417969, -0.028301239013671875, -0.018075942993164062, -0.00785064697265625, 0.0023746490478515625, 0.012599945068359375, 0.022825241088867188, 0.033050537109375, 0.04327583312988281, 0.053501129150390625, 0.06372642517089844, 0.07395172119140625, 0.08417701721191406, 0.09440231323242188, 0.10462760925292969, 0.1148529052734375, 0.1250782012939453, 0.13530349731445312, 0.14552879333496094, 0.15575408935546875, 0.16597938537597656, 0.17620468139648438, 0.1864299774169922, 0.1966552734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 12.0, 8.0, 24.0, 40.0, 45.0, 106.0, 184.0, 323.0, 767.0, 1828.0, 4728.0, 14167.0, 52838.0, 323812.0, 3399951.0, 319968.0, 52397.0, 14289.0, 4883.0, 1956.0, 886.0, 441.0, 246.0, 146.0, 96.0, 53.0, 31.0, 15.0, 12.0, 6.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.28143310546875, -2.2171630859375, -2.15289306640625, -2.088623046875, -2.02435302734375, -1.9600830078125, -1.89581298828125, -1.83154296875, -1.76727294921875, -1.7030029296875, -1.63873291015625, -1.574462890625, -1.51019287109375, -1.4459228515625, -1.38165283203125, -1.3173828125, -1.25311279296875, -1.1888427734375, -1.12457275390625, -1.060302734375, -0.99603271484375, -0.9317626953125, -0.86749267578125, -0.80322265625, -0.73895263671875, -0.6746826171875, -0.61041259765625, -0.546142578125, -0.48187255859375, -0.4176025390625, -0.35333251953125, -0.2890625, -0.22479248046875, -0.1605224609375, -0.09625244140625, -0.031982421875, 0.03228759765625, 0.0965576171875, 0.16082763671875, 0.22509765625, 0.28936767578125, 0.3536376953125, 0.41790771484375, 0.482177734375, 0.54644775390625, 0.6107177734375, 0.67498779296875, 0.7392578125, 0.80352783203125, 0.8677978515625, 0.93206787109375, 0.996337890625, 1.06060791015625, 1.1248779296875, 1.18914794921875, 1.25341796875, 1.31768798828125, 1.3819580078125, 1.44622802734375, 1.510498046875, 1.57476806640625, 1.6390380859375, 1.70330810546875, 1.767578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 23.0, 18.0, 27.0, 50.0, 49.0, 93.0, 138.0, 205.0, 367.0, 1341.0, 821.0, 317.0, 171.0, 123.0, 92.0, 57.0, 36.0, 21.0, 26.0, 15.0, 11.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2578125, -0.24703216552734375, -0.2362518310546875, -0.22547149658203125, -0.214691162109375, -0.20391082763671875, -0.1931304931640625, -0.18235015869140625, -0.17156982421875, -0.16078948974609375, -0.1500091552734375, -0.13922882080078125, -0.128448486328125, -0.11766815185546875, -0.1068878173828125, -0.09610748291015625, -0.0853271484375, -0.07454681396484375, -0.0637664794921875, -0.05298614501953125, -0.042205810546875, -0.03142547607421875, -0.0206451416015625, -0.00986480712890625, 0.00091552734375, 0.01169586181640625, 0.0224761962890625, 0.03325653076171875, 0.044036865234375, 0.05481719970703125, 0.0655975341796875, 0.07637786865234375, 0.087158203125, 0.09793853759765625, 0.1087188720703125, 0.11949920654296875, 0.130279541015625, 0.14105987548828125, 0.1518402099609375, 0.16262054443359375, 0.17340087890625, 0.18418121337890625, 0.1949615478515625, 0.20574188232421875, 0.216522216796875, 0.22730255126953125, 0.2380828857421875, 0.24886322021484375, 0.2596435546875, 0.27042388916015625, 0.2812042236328125, 0.29198455810546875, 0.302764892578125, 0.31354522705078125, 0.3243255615234375, 0.33510589599609375, 0.34588623046875, 0.35666656494140625, 0.3674468994140625, 0.37822723388671875, 0.389007568359375, 0.39978790283203125, 0.4105682373046875, 0.42134857177734375, 0.43212890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 15.0, 31.0, 71.0, 122.0, 153.0, 175.0, 148.0, 121.0, 70.0, 42.0, 21.0, 12.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.760511875152588, -1.6604740619659424, -1.5604362487792969, -1.4603984355926514, -1.3603606224060059, -1.2603228092193604, -1.1602851152420044, -1.0602473020553589, -0.9602094888687134, -0.8601716756820679, -0.7601338624954224, -0.6600961089134216, -0.5600582957267761, -0.4600204825401306, -0.3599827289581299, -0.2599449157714844, -0.15990710258483887, -0.05986930429935455, 0.04016849398612976, 0.14020627737045288, 0.2402440905570984, 0.3402819037437439, 0.44031965732574463, 0.5403574705123901, 0.6403952836990356, 0.7404330968856812, 0.8404709100723267, 0.9405086636543274, 1.0405464172363281, 1.1405842304229736, 1.2406220436096191, 1.3406598567962646, 1.4406976699829102, 1.5407354831695557, 1.6407732963562012, 1.7408111095428467, 1.8408489227294922, 1.9408867359161377, 2.040924549102783, 2.1409621238708496, 2.241000175476074, 2.3410379886627197, 2.4410758018493652, 2.5411136150360107, 2.6411514282226562, 2.7411892414093018, 2.8412270545959473, 2.9412646293640137, 3.041302442550659, 3.1413402557373047, 3.24137806892395, 3.3414158821105957, 3.441453695297241, 3.5414915084838867, 3.641529083251953, 3.7415671348571777, 3.841604709625244, 3.9416425228118896, 4.041680335998535, 4.141717910766602, 4.241755962371826, 4.341793537139893, 4.441831588745117, 4.541869163513184, 4.641907215118408]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 14.0, 12.0, 16.0, 19.0, 19.0, 22.0, 23.0, 23.0, 35.0, 27.0, 34.0, 44.0, 42.0, 51.0, 46.0, 32.0, 43.0, 45.0, 48.0, 37.0, 42.0, 30.0, 33.0, 41.0, 19.0, 19.0, 25.0, 24.0, 12.0, 16.0, 18.0, 11.0, 10.0, 14.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0349489450454712, -0.9999313950538635, -0.9649138450622559, -0.929896354675293, -0.8948788046836853, -0.8598612546920776, -0.82484370470047, -0.7898261547088623, -0.7548086643218994, -0.7197911143302917, -0.6847735643386841, -0.6497560739517212, -0.6147385239601135, -0.5797209739685059, -0.5447034239768982, -0.5096858739852905, -0.47466832399368286, -0.4396507740020752, -0.4046332538127899, -0.36961570382118225, -0.334598183631897, -0.2995806336402893, -0.26456308364868164, -0.22954554855823517, -0.1945280134677887, -0.15951047837734222, -0.12449293583631516, -0.08947539329528809, -0.054457858204841614, -0.01944032311439514, 0.015577226877212524, 0.050594761967659, 0.08561229705810547, 0.12062983214855194, 0.1556473672389984, 0.19066491723060608, 0.22568245232105255, 0.260699987411499, 0.2957175374031067, 0.33073508739471436, 0.36575260758399963, 0.4007701575756073, 0.4357876777648926, 0.47080522775650024, 0.5058227777481079, 0.5408402681350708, 0.5758578777313232, 0.6108753681182861, 0.6458929181098938, 0.6809104681015015, 0.7159280180931091, 0.7509455680847168, 0.7859630584716797, 0.8209806084632874, 0.855998158454895, 0.8910157084465027, 0.9260332584381104, 0.961050808429718, 0.9960683584213257, 1.0310858488082886, 1.066103458404541, 1.101120948791504, 1.1361384391784668, 1.1711560487747192, 1.2061735391616821]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 11.0, 9.0, 6.0, 21.0, 23.0, 55.0, 94.0, 184.0, 303.0, 749.0, 1811.0, 5218.0, 20265.0, 93451.0, 357751.0, 410528.0, 121821.0, 26005.0, 6487.0, 2121.0, 840.0, 367.0, 176.0, 91.0, 56.0, 40.0, 24.0, 13.0, 8.0, 7.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.07781982421875, -2.0130615234375, -1.94830322265625, -1.883544921875, -1.81878662109375, -1.7540283203125, -1.68927001953125, -1.62451171875, -1.55975341796875, -1.4949951171875, -1.43023681640625, -1.365478515625, -1.30072021484375, -1.2359619140625, -1.17120361328125, -1.1064453125, -1.04168701171875, -0.9769287109375, -0.91217041015625, -0.847412109375, -0.78265380859375, -0.7178955078125, -0.65313720703125, -0.58837890625, -0.52362060546875, -0.4588623046875, -0.39410400390625, -0.329345703125, -0.26458740234375, -0.1998291015625, -0.13507080078125, -0.0703125, -0.00555419921875, 0.0592041015625, 0.12396240234375, 0.188720703125, 0.25347900390625, 0.3182373046875, 0.38299560546875, 0.44775390625, 0.51251220703125, 0.5772705078125, 0.64202880859375, 0.706787109375, 0.77154541015625, 0.8363037109375, 0.90106201171875, 0.9658203125, 1.03057861328125, 1.0953369140625, 1.16009521484375, 1.224853515625, 1.28961181640625, 1.3543701171875, 1.41912841796875, 1.48388671875, 1.54864501953125, 1.6134033203125, 1.67816162109375, 1.742919921875, 1.80767822265625, 1.8724365234375, 1.93719482421875, 2.001953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 6.0, 14.0, 11.0, 24.0, 40.0, 59.0, 66.0, 83.0, 90.0, 116.0, 107.0, 94.0, 78.0, 64.0, 43.0, 28.0, 25.0, 24.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.435791015625, -0.4258403778076172, -0.4158897399902344, -0.40593910217285156, -0.39598846435546875, -0.38603782653808594, -0.3760871887207031, -0.3661365509033203, -0.3561859130859375, -0.3462352752685547, -0.3362846374511719, -0.32633399963378906, -0.31638336181640625, -0.30643272399902344, -0.2964820861816406, -0.2865314483642578, -0.276580810546875, -0.2666301727294922, -0.2566795349121094, -0.24672889709472656, -0.23677825927734375, -0.22682762145996094, -0.21687698364257812, -0.2069263458251953, -0.1969757080078125, -0.1870250701904297, -0.17707443237304688, -0.16712379455566406, -0.15717315673828125, -0.14722251892089844, -0.13727188110351562, -0.1273212432861328, -0.11737060546875, -0.10741996765136719, -0.09746932983398438, -0.08751869201660156, -0.07756805419921875, -0.06761741638183594, -0.057666778564453125, -0.04771614074707031, -0.0377655029296875, -0.027814865112304688, -0.017864227294921875, -0.007913589477539062, 0.00203704833984375, 0.011987686157226562, 0.021938323974609375, 0.03188896179199219, 0.041839599609375, 0.05179023742675781, 0.061740875244140625, 0.07169151306152344, 0.08164215087890625, 0.09159278869628906, 0.10154342651367188, 0.11149406433105469, 0.1214447021484375, 0.1313953399658203, 0.14134597778320312, 0.15129661560058594, 0.16124725341796875, 0.17119789123535156, 0.18114852905273438, 0.1910991668701172, 0.2010498046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 8.0, 10.0, 7.0, 12.0, 20.0, 28.0, 40.0, 54.0, 96.0, 128.0, 203.0, 286.0, 412.0, 561.0, 951.0, 1574.0, 3130.0, 6770.0, 17370.0, 48660.0, 129516.0, 265548.0, 297694.0, 167942.0, 65808.0, 23699.0, 8974.0, 3942.0, 1959.0, 1083.0, 721.0, 464.0, 275.0, 198.0, 132.0, 82.0, 59.0, 51.0, 34.0, 17.0, 12.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4658203125, -1.4241180419921875, -1.382415771484375, -1.3407135009765625, -1.29901123046875, -1.2573089599609375, -1.215606689453125, -1.1739044189453125, -1.1322021484375, -1.0904998779296875, -1.048797607421875, -1.0070953369140625, -0.96539306640625, -0.9236907958984375, -0.881988525390625, -0.8402862548828125, -0.798583984375, -0.7568817138671875, -0.715179443359375, -0.6734771728515625, -0.63177490234375, -0.5900726318359375, -0.548370361328125, -0.5066680908203125, -0.4649658203125, -0.4232635498046875, -0.381561279296875, -0.3398590087890625, -0.29815673828125, -0.2564544677734375, -0.214752197265625, -0.1730499267578125, -0.13134765625, -0.0896453857421875, -0.047943115234375, -0.0062408447265625, 0.03546142578125, 0.0771636962890625, 0.118865966796875, 0.1605682373046875, 0.2022705078125, 0.2439727783203125, 0.285675048828125, 0.3273773193359375, 0.36907958984375, 0.4107818603515625, 0.452484130859375, 0.4941864013671875, 0.535888671875, 0.5775909423828125, 0.619293212890625, 0.6609954833984375, 0.70269775390625, 0.7444000244140625, 0.786102294921875, 0.8278045654296875, 0.8695068359375, 0.9112091064453125, 0.952911376953125, 0.9946136474609375, 1.03631591796875, 1.0780181884765625, 1.119720458984375, 1.1614227294921875, 1.203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 14.0, 9.0, 12.0, 17.0, 22.0, 25.0, 31.0, 37.0, 39.0, 46.0, 46.0, 41.0, 46.0, 50.0, 57.0, 55.0, 44.0, 50.0, 52.0, 46.0, 36.0, 26.0, 32.0, 18.0, 27.0, 23.0, 20.0, 20.0, 14.0, 7.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.3271484375, -1.2929306030273438, -1.2587127685546875, -1.2244949340820312, -1.190277099609375, -1.1560592651367188, -1.1218414306640625, -1.0876235961914062, -1.05340576171875, -1.0191879272460938, -0.9849700927734375, -0.9507522583007812, -0.916534423828125, -0.8823165893554688, -0.8480987548828125, -0.8138809204101562, -0.7796630859375, -0.7454452514648438, -0.7112274169921875, -0.6770095825195312, -0.642791748046875, -0.6085739135742188, -0.5743560791015625, -0.5401382446289062, -0.50592041015625, -0.47170257568359375, -0.4374847412109375, -0.40326690673828125, -0.369049072265625, -0.33483123779296875, -0.3006134033203125, -0.26639556884765625, -0.232177734375, -0.19795989990234375, -0.1637420654296875, -0.12952423095703125, -0.095306396484375, -0.06108856201171875, -0.0268707275390625, 0.00734710693359375, 0.04156494140625, 0.07578277587890625, 0.1100006103515625, 0.14421844482421875, 0.178436279296875, 0.21265411376953125, 0.2468719482421875, 0.28108978271484375, 0.3153076171875, 0.34952545166015625, 0.3837432861328125, 0.41796112060546875, 0.452178955078125, 0.48639678955078125, 0.5206146240234375, 0.5548324584960938, 0.58905029296875, 0.6232681274414062, 0.6574859619140625, 0.6917037963867188, 0.725921630859375, 0.7601394653320312, 0.7943572998046875, 0.8285751342773438, 0.86279296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 9.0, 11.0, 15.0, 23.0, 38.0, 43.0, 59.0, 112.0, 156.0, 245.0, 392.0, 698.0, 1072.0, 1954.0, 3777.0, 7566.0, 16516.0, 38159.0, 91580.0, 200262.0, 296294.0, 212989.0, 99317.0, 42200.0, 17895.0, 8259.0, 4067.0, 1977.0, 1116.0, 619.0, 353.0, 260.0, 169.0, 93.0, 69.0, 63.0, 34.0, 25.0, 20.0, 13.0, 13.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6826400756835938, -0.6616668701171875, -0.6406936645507812, -0.619720458984375, -0.5987472534179688, -0.5777740478515625, -0.5568008422851562, -0.53582763671875, -0.5148544311523438, -0.4938812255859375, -0.47290802001953125, -0.451934814453125, -0.43096160888671875, -0.4099884033203125, -0.38901519775390625, -0.3680419921875, -0.34706878662109375, -0.3260955810546875, -0.30512237548828125, -0.284149169921875, -0.26317596435546875, -0.2422027587890625, -0.22122955322265625, -0.20025634765625, -0.17928314208984375, -0.1583099365234375, -0.13733673095703125, -0.116363525390625, -0.09539031982421875, -0.0744171142578125, -0.05344390869140625, -0.032470703125, -0.01149749755859375, 0.0094757080078125, 0.03044891357421875, 0.051422119140625, 0.07239532470703125, 0.0933685302734375, 0.11434173583984375, 0.13531494140625, 0.15628814697265625, 0.1772613525390625, 0.19823455810546875, 0.219207763671875, 0.24018096923828125, 0.2611541748046875, 0.28212738037109375, 0.3031005859375, 0.32407379150390625, 0.3450469970703125, 0.36602020263671875, 0.386993408203125, 0.40796661376953125, 0.4289398193359375, 0.44991302490234375, 0.47088623046875, 0.49185943603515625, 0.5128326416015625, 0.5338058471679688, 0.554779052734375, 0.5757522583007812, 0.5967254638671875, 0.6176986694335938, 0.638671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 16.0, 12.0, 24.0, 19.0, 22.0, 30.0, 45.0, 42.0, 42.0, 59.0, 57.0, 57.0, 83.0, 67.0, 49.0, 48.0, 49.0, 47.0, 35.0, 26.0, 22.0, 28.0, 17.0, 21.0, 10.0, 12.0, 9.0, 8.0, 2.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011900998651981354, -0.0001145191490650177, -0.00011002831161022186, -0.00010553747415542603, -0.00010104663670063019, -9.655579924583435e-05, -9.206496179103851e-05, -8.757412433624268e-05, -8.308328688144684e-05, -7.8592449426651e-05, -7.410161197185516e-05, -6.961077451705933e-05, -6.511993706226349e-05, -6.062909960746765e-05, -5.6138262152671814e-05, -5.1647424697875977e-05, -4.715658724308014e-05, -4.26657497882843e-05, -3.8174912333488464e-05, -3.368407487869263e-05, -2.919323742389679e-05, -2.4702399969100952e-05, -2.0211562514305115e-05, -1.5720725059509277e-05, -1.122988760471344e-05, -6.7390501499176025e-06, -2.248212695121765e-06, 2.2426247596740723e-06, 6.73346221446991e-06, 1.1224299669265747e-05, 1.5715137124061584e-05, 2.0205974578857422e-05, 2.469681203365326e-05, 2.9187649488449097e-05, 3.3678486943244934e-05, 3.816932439804077e-05, 4.266016185283661e-05, 4.7150999307632446e-05, 5.1641836762428284e-05, 5.613267421722412e-05, 6.062351167201996e-05, 6.51143491268158e-05, 6.960518658161163e-05, 7.409602403640747e-05, 7.858686149120331e-05, 8.307769894599915e-05, 8.756853640079498e-05, 9.205937385559082e-05, 9.655021131038666e-05, 0.0001010410487651825, 0.00010553188621997833, 0.00011002272367477417, 0.00011451356112957001, 0.00011900439858436584, 0.00012349523603916168, 0.00012798607349395752, 0.00013247691094875336, 0.0001369677484035492, 0.00014145858585834503, 0.00014594942331314087, 0.0001504402607679367, 0.00015493109822273254, 0.00015942193567752838, 0.00016391277313232422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 8.0, 3.0, 7.0, 4.0, 15.0, 11.0, 32.0, 35.0, 41.0, 73.0, 94.0, 155.0, 230.0, 359.0, 636.0, 1132.0, 2144.0, 4708.0, 11740.0, 33587.0, 107760.0, 317593.0, 364760.0, 136279.0, 41614.0, 14253.0, 5552.0, 2507.0, 1296.0, 712.0, 423.0, 258.0, 178.0, 118.0, 67.0, 51.0, 30.0, 23.0, 18.0, 13.0, 10.0, 6.0, 10.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88134765625, -0.8538894653320312, -0.8264312744140625, -0.7989730834960938, -0.771514892578125, -0.7440567016601562, -0.7165985107421875, -0.6891403198242188, -0.66168212890625, -0.6342239379882812, -0.6067657470703125, -0.5793075561523438, -0.551849365234375, -0.5243911743164062, -0.4969329833984375, -0.46947479248046875, -0.4420166015625, -0.41455841064453125, -0.3871002197265625, -0.35964202880859375, -0.332183837890625, -0.30472564697265625, -0.2772674560546875, -0.24980926513671875, -0.22235107421875, -0.19489288330078125, -0.1674346923828125, -0.13997650146484375, -0.112518310546875, -0.08506011962890625, -0.0576019287109375, -0.03014373779296875, -0.002685546875, 0.02477264404296875, 0.0522308349609375, 0.07968902587890625, 0.107147216796875, 0.13460540771484375, 0.1620635986328125, 0.18952178955078125, 0.21697998046875, 0.24443817138671875, 0.2718963623046875, 0.29935455322265625, 0.326812744140625, 0.35427093505859375, 0.3817291259765625, 0.40918731689453125, 0.4366455078125, 0.46410369873046875, 0.4915618896484375, 0.5190200805664062, 0.546478271484375, 0.5739364624023438, 0.6013946533203125, 0.6288528442382812, 0.65631103515625, 0.6837692260742188, 0.7112274169921875, 0.7386856079101562, 0.766143798828125, 0.7936019897460938, 0.8210601806640625, 0.8485183715820312, 0.8759765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 5.0, 6.0, 12.0, 9.0, 14.0, 21.0, 27.0, 30.0, 43.0, 46.0, 53.0, 60.0, 61.0, 70.0, 72.0, 65.0, 78.0, 63.0, 48.0, 52.0, 33.0, 19.0, 25.0, 17.0, 8.0, 15.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49560546875, -0.47869110107421875, -0.4617767333984375, -0.44486236572265625, -0.427947998046875, -0.41103363037109375, -0.3941192626953125, -0.37720489501953125, -0.36029052734375, -0.34337615966796875, -0.3264617919921875, -0.30954742431640625, -0.292633056640625, -0.27571868896484375, -0.2588043212890625, -0.24188995361328125, -0.2249755859375, -0.20806121826171875, -0.1911468505859375, -0.17423248291015625, -0.157318115234375, -0.14040374755859375, -0.1234893798828125, -0.10657501220703125, -0.08966064453125, -0.07274627685546875, -0.0558319091796875, -0.03891754150390625, -0.022003173828125, -0.00508880615234375, 0.0118255615234375, 0.02873992919921875, 0.045654296875, 0.06256866455078125, 0.0794830322265625, 0.09639739990234375, 0.113311767578125, 0.13022613525390625, 0.1471405029296875, 0.16405487060546875, 0.18096923828125, 0.19788360595703125, 0.2147979736328125, 0.23171234130859375, 0.248626708984375, 0.26554107666015625, 0.2824554443359375, 0.29936981201171875, 0.3162841796875, 0.33319854736328125, 0.3501129150390625, 0.36702728271484375, 0.383941650390625, 0.40085601806640625, 0.4177703857421875, 0.43468475341796875, 0.45159912109375, 0.46851348876953125, 0.4854278564453125, 0.5023422241210938, 0.519256591796875, 0.5361709594726562, 0.5530853271484375, 0.5699996948242188, 0.5869140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 4.0, 13.0, 13.0, 11.0, 22.0, 37.0, 58.0, 69.0, 84.0, 112.0, 101.0, 108.0, 96.0, 71.0, 59.0, 36.0, 31.0, 31.0, 7.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.084464073181152, -10.79800033569336, -10.511537551879883, -10.22507381439209, -9.938611030578613, -9.65214729309082, -9.365684509277344, -9.07922077178955, -8.792757987976074, -8.506294250488281, -8.219831466674805, -7.93336820602417, -7.646904945373535, -7.3604416847229, -7.073978424072266, -6.787514686584473, -6.501051425933838, -6.214588165283203, -5.928124904632568, -5.641661643981934, -5.355198383331299, -5.068735122680664, -4.782271385192871, -4.4958086013793945, -4.209344863891602, -3.922881603240967, -3.636418342590332, -3.3499550819396973, -3.0634918212890625, -2.7770285606384277, -2.490565061569214, -2.204101800918579, -1.9176383018493652, -1.6311750411987305, -1.3447117805480957, -1.0582484006881714, -0.7717851400375366, -0.48532187938690186, -0.19885849952697754, 0.08760476112365723, 0.374068021774292, 0.6605312824249268, 0.9469946026802063, 1.2334579229354858, 1.5199211835861206, 1.8063844442367554, 2.0928478240966797, 2.3793110847473145, 2.665774345397949, 2.952237606048584, 3.2387008666992188, 3.5251641273498535, 3.8116273880004883, 4.098090648651123, 4.384553909301758, 4.671017646789551, 4.957480430603027, 5.243943691253662, 5.530406951904297, 5.816870212554932, 6.103333473205566, 6.389796733856201, 6.676259994506836, 6.962723731994629, 7.249186992645264]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 6.0, 18.0, 5.0, 23.0, 26.0, 22.0, 35.0, 40.0, 38.0, 48.0, 65.0, 56.0, 53.0, 66.0, 48.0, 66.0, 50.0, 53.0, 49.0, 45.0, 32.0, 30.0, 29.0, 16.0, 14.0, 18.0, 13.0, 9.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735222339630127, -6.45862340927124, -6.182024002075195, -5.905425071716309, -5.628825664520264, -5.352226734161377, -5.075627326965332, -4.799028396606445, -4.522429466247559, -4.245830535888672, -3.969231128692627, -3.6926321983337402, -3.4160327911376953, -3.1394338607788086, -2.8628346920013428, -2.586235523223877, -2.309636116027832, -2.033036947250366, -1.7564377784729004, -1.4798387289047241, -1.2032395601272583, -0.9266403913497925, -0.6500413417816162, -0.3734421730041504, -0.09684300422668457, 0.17975613474845886, 0.4563552737236023, 0.7329543828964233, 1.0095535516738892, 1.286152720451355, 1.5627517700195312, 1.839350938796997, 2.115950584411621, 2.392549753189087, 2.6691489219665527, 2.9457478523254395, 3.2223472595214844, 3.498946189880371, 3.775545358657837, 4.052144527435303, 4.328743934631348, 4.605342864990234, 4.881942272186279, 5.158541202545166, 5.435140609741211, 5.711739540100098, 5.988338470458984, 6.264937877655029, 6.541536808013916, 6.818135738372803, 7.094735145568848, 7.371334075927734, 7.647933483123779, 7.924532413482666, 8.201131820678711, 8.477730751037598, 8.754329681396484, 9.030928611755371, 9.307527542114258, 9.584127426147461, 9.860726356506348, 10.137325286865234, 10.413924217224121, 10.690523147583008, 10.967123031616211]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 11.0, 8.0, 13.0, 14.0, 17.0, 28.0, 47.0, 56.0, 118.0, 221.0, 411.0, 728.0, 1486.0, 3269.0, 9278.0, 32233.0, 173451.0, 3631127.0, 278707.0, 43246.0, 11934.0, 4164.0, 1754.0, 853.0, 462.0, 239.0, 152.0, 80.0, 53.0, 36.0, 21.0, 13.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.8876953125, -1.837493896484375, -1.78729248046875, -1.737091064453125, -1.6868896484375, -1.636688232421875, -1.58648681640625, -1.536285400390625, -1.486083984375, -1.435882568359375, -1.38568115234375, -1.335479736328125, -1.2852783203125, -1.235076904296875, -1.18487548828125, -1.134674072265625, -1.08447265625, -1.034271240234375, -0.98406982421875, -0.933868408203125, -0.8836669921875, -0.833465576171875, -0.78326416015625, -0.733062744140625, -0.682861328125, -0.632659912109375, -0.58245849609375, -0.532257080078125, -0.4820556640625, -0.431854248046875, -0.38165283203125, -0.331451416015625, -0.28125, -0.231048583984375, -0.18084716796875, -0.130645751953125, -0.0804443359375, -0.030242919921875, 0.01995849609375, 0.070159912109375, 0.120361328125, 0.170562744140625, 0.22076416015625, 0.270965576171875, 0.3211669921875, 0.371368408203125, 0.42156982421875, 0.471771240234375, 0.52197265625, 0.572174072265625, 0.62237548828125, 0.672576904296875, 0.7227783203125, 0.772979736328125, 0.82318115234375, 0.873382568359375, 0.923583984375, 0.973785400390625, 1.02398681640625, 1.074188232421875, 1.1243896484375, 1.174591064453125, 1.22479248046875, 1.274993896484375, 1.3251953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 9.0, 17.0, 28.0, 47.0, 48.0, 66.0, 82.0, 91.0, 103.0, 88.0, 102.0, 65.0, 77.0, 46.0, 35.0, 31.0, 23.0, 14.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.473388671875, -0.4615516662597656, -0.44971466064453125, -0.4378776550292969, -0.4260406494140625, -0.4142036437988281, -0.40236663818359375, -0.3905296325683594, -0.378692626953125, -0.3668556213378906, -0.35501861572265625, -0.3431816101074219, -0.3313446044921875, -0.3195075988769531, -0.30767059326171875, -0.2958335876464844, -0.28399658203125, -0.2721595764160156, -0.26032257080078125, -0.24848556518554688, -0.2366485595703125, -0.22481155395507812, -0.21297454833984375, -0.20113754272460938, -0.189300537109375, -0.17746353149414062, -0.16562652587890625, -0.15378952026367188, -0.1419525146484375, -0.13011550903320312, -0.11827850341796875, -0.10644149780273438, -0.0946044921875, -0.08276748657226562, -0.07093048095703125, -0.059093475341796875, -0.0472564697265625, -0.035419464111328125, -0.02358245849609375, -0.011745452880859375, 9.1552734375e-05, 0.011928558349609375, 0.02376556396484375, 0.035602569580078125, 0.0474395751953125, 0.059276580810546875, 0.07111358642578125, 0.08295059204101562, 0.09478759765625, 0.10662460327148438, 0.11846160888671875, 0.13029861450195312, 0.1421356201171875, 0.15397262573242188, 0.16580963134765625, 0.17764663696289062, 0.189483642578125, 0.20132064819335938, 0.21315765380859375, 0.22499465942382812, 0.2368316650390625, 0.24866867065429688, 0.26050567626953125, 0.2723426818847656, 0.2841796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 12.0, 11.0, 26.0, 36.0, 38.0, 58.0, 83.0, 144.0, 217.0, 411.0, 727.0, 1496.0, 4060.0, 11595.0, 40769.0, 192457.0, 3141050.0, 672158.0, 92990.0, 23417.0, 7468.0, 2751.0, 1074.0, 467.0, 284.0, 164.0, 111.0, 62.0, 32.0, 35.0, 18.0, 15.0, 5.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.58203125, -1.5365447998046875, -1.491058349609375, -1.4455718994140625, -1.40008544921875, -1.3545989990234375, -1.309112548828125, -1.2636260986328125, -1.2181396484375, -1.1726531982421875, -1.127166748046875, -1.0816802978515625, -1.03619384765625, -0.9907073974609375, -0.945220947265625, -0.8997344970703125, -0.854248046875, -0.8087615966796875, -0.763275146484375, -0.7177886962890625, -0.67230224609375, -0.6268157958984375, -0.581329345703125, -0.5358428955078125, -0.4903564453125, -0.4448699951171875, -0.399383544921875, -0.3538970947265625, -0.30841064453125, -0.2629241943359375, -0.217437744140625, -0.1719512939453125, -0.12646484375, -0.0809783935546875, -0.035491943359375, 0.0099945068359375, 0.05548095703125, 0.1009674072265625, 0.146453857421875, 0.1919403076171875, 0.2374267578125, 0.2829132080078125, 0.328399658203125, 0.3738861083984375, 0.41937255859375, 0.4648590087890625, 0.510345458984375, 0.5558319091796875, 0.601318359375, 0.6468048095703125, 0.692291259765625, 0.7377777099609375, 0.78326416015625, 0.8287506103515625, 0.874237060546875, 0.9197235107421875, 0.9652099609375, 1.0106964111328125, 1.056182861328125, 1.1016693115234375, 1.14715576171875, 1.1926422119140625, 1.238128662109375, 1.2836151123046875, 1.3291015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 15.0, 12.0, 11.0, 27.0, 32.0, 65.0, 68.0, 147.0, 210.0, 516.0, 1794.0, 530.0, 222.0, 132.0, 93.0, 61.0, 29.0, 33.0, 25.0, 13.0, 10.0, 4.0, 10.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43310546875, -0.4205589294433594, -0.40801239013671875, -0.3954658508300781, -0.3829193115234375, -0.3703727722167969, -0.35782623291015625, -0.3452796936035156, -0.332733154296875, -0.3201866149902344, -0.30764007568359375, -0.2950935363769531, -0.2825469970703125, -0.2700004577636719, -0.25745391845703125, -0.24490737915039062, -0.23236083984375, -0.21981430053710938, -0.20726776123046875, -0.19472122192382812, -0.1821746826171875, -0.16962814331054688, -0.15708160400390625, -0.14453506469726562, -0.131988525390625, -0.11944198608398438, -0.10689544677734375, -0.09434890747070312, -0.0818023681640625, -0.06925582885742188, -0.05670928955078125, -0.044162750244140625, -0.0316162109375, -0.019069671630859375, -0.00652313232421875, 0.006023406982421875, 0.0185699462890625, 0.031116485595703125, 0.04366302490234375, 0.056209564208984375, 0.068756103515625, 0.08130264282226562, 0.09384918212890625, 0.10639572143554688, 0.1189422607421875, 0.13148880004882812, 0.14403533935546875, 0.15658187866210938, 0.16912841796875, 0.18167495727539062, 0.19422149658203125, 0.20676803588867188, 0.2193145751953125, 0.23186111450195312, 0.24440765380859375, 0.2569541931152344, 0.269500732421875, 0.2820472717285156, 0.29459381103515625, 0.3071403503417969, 0.3196868896484375, 0.3322334289550781, 0.34477996826171875, 0.3573265075683594, 0.369873046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 13.0, 17.0, 31.0, 51.0, 71.0, 88.0, 111.0, 122.0, 124.0, 107.0, 86.0, 64.0, 46.0, 23.0, 17.0, 12.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0657577514648438, -2.994230031967163, -2.9227023124694824, -2.851174831390381, -2.7796471118927, -2.7081193923950195, -2.636591672897339, -2.565063953399658, -2.4935364723205566, -2.422008752822876, -2.3504810333251953, -2.2789535522460938, -2.207425832748413, -2.1358981132507324, -2.0643703937530518, -1.992842674255371, -1.9213149547576904, -1.8497872352600098, -1.7782596349716187, -1.706731915473938, -1.6352043151855469, -1.5636765956878662, -1.4921488761901855, -1.4206211566925049, -1.3490935564041138, -1.277565836906433, -1.206038236618042, -1.1345105171203613, -1.0629827976226807, -0.9914551973342896, -0.9199274778366089, -0.848399817943573, -0.7768720388412476, -0.7053443789482117, -0.6338167190551758, -0.5622889995574951, -0.49076133966445923, -0.41923367977142334, -0.34770599007606506, -0.2761783003807068, -0.2046506404876709, -0.13312296569347382, -0.06159529089927673, 0.009932383894920349, 0.08146005868911743, 0.15298771858215332, 0.2245154082775116, 0.2960430979728699, 0.36757075786590576, 0.43909841775894165, 0.5106260776519775, 0.5821537971496582, 0.6536814570426941, 0.72520911693573, 0.7967368364334106, 0.8682644963264465, 0.9397921562194824, 1.011319875717163, 1.0828474760055542, 1.1543751955032349, 1.225902795791626, 1.2974305152893066, 1.3689582347869873, 1.440485954284668, 1.512013554573059]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 8.0, 3.0, 8.0, 8.0, 9.0, 12.0, 16.0, 12.0, 19.0, 30.0, 40.0, 29.0, 38.0, 31.0, 32.0, 38.0, 40.0, 32.0, 47.0, 51.0, 48.0, 32.0, 48.0, 35.0, 38.0, 34.0, 29.0, 37.0, 30.0, 24.0, 35.0, 19.0, 22.0, 11.0, 8.0, 10.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.2433825731277466, -1.2091513872146606, -1.1749200820922852, -1.1406888961791992, -1.1064577102661133, -1.0722265243530273, -1.0379952192306519, -1.003764033317566, -0.96953284740448, -0.9353016018867493, -0.9010704159736633, -0.8668391704559326, -0.8326079845428467, -0.798376739025116, -0.7641454935073853, -0.7299143075942993, -0.6956830620765686, -0.6614518165588379, -0.627220630645752, -0.5929893851280212, -0.5587581992149353, -0.5245269536972046, -0.49029573798179626, -0.45606452226638794, -0.4218333065509796, -0.3876020908355713, -0.35337087512016296, -0.31913965940475464, -0.2849084138870239, -0.250677227973938, -0.21644598245620728, -0.18221476674079895, -0.1479836106300354, -0.11375239491462708, -0.07952117174863815, -0.04528994858264923, -0.011058732867240906, 0.02317248284816742, 0.05740371346473694, 0.09163492918014526, 0.1258661448955536, 0.16009736061096191, 0.19432857632637024, 0.22855980694293976, 0.2627910375595093, 0.2970222234725952, 0.3312534689903259, 0.36548468470573425, 0.3997159004211426, 0.4339471161365509, 0.46817833185195923, 0.5024095773696899, 0.5366407632827759, 0.5708720088005066, 0.6051032543182373, 0.6393344402313232, 0.6735656261444092, 0.7077968716621399, 0.7420280575752258, 0.7762593030929565, 0.8104904890060425, 0.8447217345237732, 0.8789529800415039, 0.9131841659545898, 0.9474154114723206]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 11.0, 9.0, 30.0, 29.0, 40.0, 57.0, 101.0, 155.0, 221.0, 440.0, 813.0, 1441.0, 3167.0, 7267.0, 18004.0, 47327.0, 122795.0, 265715.0, 309451.0, 163321.0, 65186.0, 24654.0, 10005.0, 4079.0, 1919.0, 939.0, 517.0, 290.0, 178.0, 112.0, 77.0, 56.0, 38.0, 31.0, 21.0, 9.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1484375, -1.1103668212890625, -1.072296142578125, -1.0342254638671875, -0.99615478515625, -0.9580841064453125, -0.920013427734375, -0.8819427490234375, -0.8438720703125, -0.8058013916015625, -0.767730712890625, -0.7296600341796875, -0.69158935546875, -0.6535186767578125, -0.615447998046875, -0.5773773193359375, -0.539306640625, -0.5012359619140625, -0.463165283203125, -0.4250946044921875, -0.38702392578125, -0.3489532470703125, -0.310882568359375, -0.2728118896484375, -0.2347412109375, -0.1966705322265625, -0.158599853515625, -0.1205291748046875, -0.08245849609375, -0.0443878173828125, -0.006317138671875, 0.0317535400390625, 0.06982421875, 0.1078948974609375, 0.145965576171875, 0.1840362548828125, 0.22210693359375, 0.2601776123046875, 0.298248291015625, 0.3363189697265625, 0.3743896484375, 0.4124603271484375, 0.450531005859375, 0.4886016845703125, 0.52667236328125, 0.5647430419921875, 0.602813720703125, 0.6408843994140625, 0.678955078125, 0.7170257568359375, 0.755096435546875, 0.7931671142578125, 0.83123779296875, 0.8693084716796875, 0.907379150390625, 0.9454498291015625, 0.9835205078125, 1.0215911865234375, 1.059661865234375, 1.0977325439453125, 1.13580322265625, 1.1738739013671875, 1.211944580078125, 1.2500152587890625, 1.2880859375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 11.0, 17.0, 26.0, 35.0, 37.0, 52.0, 76.0, 92.0, 83.0, 113.0, 92.0, 76.0, 70.0, 64.0, 43.0, 40.0, 29.0, 17.0, 13.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45556640625, -0.4437446594238281, -0.43192291259765625, -0.4201011657714844, -0.4082794189453125, -0.3964576721191406, -0.38463592529296875, -0.3728141784667969, -0.360992431640625, -0.3491706848144531, -0.33734893798828125, -0.3255271911621094, -0.3137054443359375, -0.3018836975097656, -0.29006195068359375, -0.2782402038574219, -0.26641845703125, -0.2545967102050781, -0.24277496337890625, -0.23095321655273438, -0.2191314697265625, -0.20730972290039062, -0.19548797607421875, -0.18366622924804688, -0.171844482421875, -0.16002273559570312, -0.14820098876953125, -0.13637924194335938, -0.1245574951171875, -0.11273574829101562, -0.10091400146484375, -0.08909225463867188, -0.0772705078125, -0.06544876098632812, -0.05362701416015625, -0.041805267333984375, -0.0299835205078125, -0.018161773681640625, -0.00634002685546875, 0.005481719970703125, 0.017303466796875, 0.029125213623046875, 0.04094696044921875, 0.052768707275390625, 0.0645904541015625, 0.07641220092773438, 0.08823394775390625, 0.10005569458007812, 0.11187744140625, 0.12369918823242188, 0.13552093505859375, 0.14734268188476562, 0.1591644287109375, 0.17098617553710938, 0.18280792236328125, 0.19462966918945312, 0.206451416015625, 0.21827316284179688, 0.23009490966796875, 0.24191665649414062, 0.2537384033203125, 0.2655601501464844, 0.27738189697265625, 0.2892036437988281, 0.301025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 4.0, 12.0, 17.0, 18.0, 22.0, 43.0, 56.0, 81.0, 94.0, 157.0, 235.0, 300.0, 463.0, 731.0, 1150.0, 2007.0, 4575.0, 10963.0, 29697.0, 82619.0, 199344.0, 319909.0, 232738.0, 100845.0, 37450.0, 13506.0, 5347.0, 2418.0, 1337.0, 802.0, 488.0, 337.0, 223.0, 153.0, 131.0, 75.0, 50.0, 49.0, 23.0, 26.0, 17.0, 12.0, 7.0, 9.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154296875, -1.118896484375, -1.08349609375, -1.048095703125, -1.0126953125, -0.977294921875, -0.94189453125, -0.906494140625, -0.87109375, -0.835693359375, -0.80029296875, -0.764892578125, -0.7294921875, -0.694091796875, -0.65869140625, -0.623291015625, -0.587890625, -0.552490234375, -0.51708984375, -0.481689453125, -0.4462890625, -0.410888671875, -0.37548828125, -0.340087890625, -0.3046875, -0.269287109375, -0.23388671875, -0.198486328125, -0.1630859375, -0.127685546875, -0.09228515625, -0.056884765625, -0.021484375, 0.013916015625, 0.04931640625, 0.084716796875, 0.1201171875, 0.155517578125, 0.19091796875, 0.226318359375, 0.26171875, 0.297119140625, 0.33251953125, 0.367919921875, 0.4033203125, 0.438720703125, 0.47412109375, 0.509521484375, 0.544921875, 0.580322265625, 0.61572265625, 0.651123046875, 0.6865234375, 0.721923828125, 0.75732421875, 0.792724609375, 0.828125, 0.863525390625, 0.89892578125, 0.934326171875, 0.9697265625, 1.005126953125, 1.04052734375, 1.075927734375, 1.111328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 11.0, 11.0, 10.0, 15.0, 15.0, 21.0, 20.0, 24.0, 35.0, 38.0, 36.0, 42.0, 47.0, 54.0, 55.0, 45.0, 51.0, 48.0, 39.0, 43.0, 46.0, 36.0, 36.0, 22.0, 43.0, 19.0, 27.0, 14.0, 18.0, 16.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.109375, -1.0761566162109375, -1.042938232421875, -1.0097198486328125, -0.97650146484375, -0.9432830810546875, -0.910064697265625, -0.8768463134765625, -0.8436279296875, -0.8104095458984375, -0.777191162109375, -0.7439727783203125, -0.71075439453125, -0.6775360107421875, -0.644317626953125, -0.6110992431640625, -0.577880859375, -0.5446624755859375, -0.511444091796875, -0.4782257080078125, -0.44500732421875, -0.4117889404296875, -0.378570556640625, -0.3453521728515625, -0.3121337890625, -0.2789154052734375, -0.245697021484375, -0.2124786376953125, -0.17926025390625, -0.1460418701171875, -0.112823486328125, -0.0796051025390625, -0.04638671875, -0.0131683349609375, 0.020050048828125, 0.0532684326171875, 0.08648681640625, 0.1197052001953125, 0.152923583984375, 0.1861419677734375, 0.2193603515625, 0.2525787353515625, 0.285797119140625, 0.3190155029296875, 0.35223388671875, 0.3854522705078125, 0.418670654296875, 0.4518890380859375, 0.485107421875, 0.5183258056640625, 0.551544189453125, 0.5847625732421875, 0.61798095703125, 0.6511993408203125, 0.684417724609375, 0.7176361083984375, 0.7508544921875, 0.7840728759765625, 0.817291259765625, 0.8505096435546875, 0.88372802734375, 0.9169464111328125, 0.950164794921875, 0.9833831787109375, 1.0166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 19.0, 31.0, 30.0, 91.0, 112.0, 239.0, 509.0, 1114.0, 3215.0, 10869.0, 45209.0, 254707.0, 558564.0, 136373.0, 26598.0, 6961.0, 2186.0, 885.0, 338.0, 199.0, 92.0, 53.0, 40.0, 26.0, 12.0, 8.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9879302978515625, -0.955352783203125, -0.9227752685546875, -0.89019775390625, -0.8576202392578125, -0.825042724609375, -0.7924652099609375, -0.7598876953125, -0.7273101806640625, -0.694732666015625, -0.6621551513671875, -0.62957763671875, -0.5970001220703125, -0.564422607421875, -0.5318450927734375, -0.499267578125, -0.4666900634765625, -0.434112548828125, -0.4015350341796875, -0.36895751953125, -0.3363800048828125, -0.303802490234375, -0.2712249755859375, -0.2386474609375, -0.2060699462890625, -0.173492431640625, -0.1409149169921875, -0.10833740234375, -0.0757598876953125, -0.043182373046875, -0.0106048583984375, 0.02197265625, 0.0545501708984375, 0.087127685546875, 0.1197052001953125, 0.15228271484375, 0.1848602294921875, 0.217437744140625, 0.2500152587890625, 0.2825927734375, 0.3151702880859375, 0.347747802734375, 0.3803253173828125, 0.41290283203125, 0.4454803466796875, 0.478057861328125, 0.5106353759765625, 0.543212890625, 0.5757904052734375, 0.608367919921875, 0.6409454345703125, 0.67352294921875, 0.7061004638671875, 0.738677978515625, 0.7712554931640625, 0.8038330078125, 0.8364105224609375, 0.868988037109375, 0.9015655517578125, 0.93414306640625, 0.9667205810546875, 0.999298095703125, 1.0318756103515625, 1.064453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 8.0, 5.0, 9.0, 11.0, 17.0, 19.0, 22.0, 34.0, 33.0, 36.0, 57.0, 55.0, 72.0, 67.0, 79.0, 75.0, 60.0, 71.0, 54.0, 45.0, 40.0, 23.0, 25.0, 18.0, 18.0, 10.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001302957534790039, -0.00012613646686077118, -0.00012197718024253845, -0.00011781789362430573, -0.000113658607006073, -0.00010949932038784027, -0.00010534003376960754, -0.00010118074715137482, -9.702146053314209e-05, -9.286217391490936e-05, -8.870288729667664e-05, -8.454360067844391e-05, -8.038431406021118e-05, -7.622502744197845e-05, -7.206574082374573e-05, -6.7906454205513e-05, -6.374716758728027e-05, -5.9587880969047546e-05, -5.542859435081482e-05, -5.126930773258209e-05, -4.7110021114349365e-05, -4.295073449611664e-05, -3.879144787788391e-05, -3.4632161259651184e-05, -3.0472874641418457e-05, -2.631358802318573e-05, -2.2154301404953003e-05, -1.7995014786720276e-05, -1.3835728168487549e-05, -9.676441550254822e-06, -5.517154932022095e-06, -1.3578683137893677e-06, 2.8014183044433594e-06, 6.9607049226760864e-06, 1.1119991540908813e-05, 1.527927815914154e-05, 1.9438564777374268e-05, 2.3597851395606995e-05, 2.775713801383972e-05, 3.191642463207245e-05, 3.6075711250305176e-05, 4.02349978685379e-05, 4.439428448677063e-05, 4.855357110500336e-05, 5.2712857723236084e-05, 5.687214434146881e-05, 6.103143095970154e-05, 6.519071757793427e-05, 6.935000419616699e-05, 7.350929081439972e-05, 7.766857743263245e-05, 8.182786405086517e-05, 8.59871506690979e-05, 9.014643728733063e-05, 9.430572390556335e-05, 9.846501052379608e-05, 0.00010262429714202881, 0.00010678358376026154, 0.00011094287037849426, 0.00011510215699672699, 0.00011926144361495972, 0.00012342073023319244, 0.00012758001685142517, 0.0001317393034696579, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 5.0, 6.0, 16.0, 16.0, 18.0, 32.0, 60.0, 80.0, 84.0, 141.0, 212.0, 387.0, 656.0, 1281.0, 2669.0, 6773.0, 19184.0, 65370.0, 293193.0, 479973.0, 127062.0, 32880.0, 10489.0, 3983.0, 1774.0, 909.0, 470.0, 279.0, 156.0, 115.0, 63.0, 50.0, 50.0, 28.0, 18.0, 17.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8330078125, -0.805450439453125, -0.77789306640625, -0.750335693359375, -0.7227783203125, -0.695220947265625, -0.66766357421875, -0.640106201171875, -0.612548828125, -0.584991455078125, -0.55743408203125, -0.529876708984375, -0.5023193359375, -0.474761962890625, -0.44720458984375, -0.419647216796875, -0.39208984375, -0.364532470703125, -0.33697509765625, -0.309417724609375, -0.2818603515625, -0.254302978515625, -0.22674560546875, -0.199188232421875, -0.171630859375, -0.144073486328125, -0.11651611328125, -0.088958740234375, -0.0614013671875, -0.033843994140625, -0.00628662109375, 0.021270751953125, 0.048828125, 0.076385498046875, 0.10394287109375, 0.131500244140625, 0.1590576171875, 0.186614990234375, 0.21417236328125, 0.241729736328125, 0.269287109375, 0.296844482421875, 0.32440185546875, 0.351959228515625, 0.3795166015625, 0.407073974609375, 0.43463134765625, 0.462188720703125, 0.48974609375, 0.517303466796875, 0.54486083984375, 0.572418212890625, 0.5999755859375, 0.627532958984375, 0.65509033203125, 0.682647705078125, 0.710205078125, 0.737762451171875, 0.76531982421875, 0.792877197265625, 0.8204345703125, 0.847991943359375, 0.87554931640625, 0.903106689453125, 0.9306640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 17.0, 13.0, 23.0, 15.0, 24.0, 17.0, 36.0, 44.0, 48.0, 55.0, 86.0, 74.0, 72.0, 66.0, 65.0, 45.0, 48.0, 40.0, 36.0, 17.0, 24.0, 19.0, 12.0, 9.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.455078125, -0.4395904541015625, -0.424102783203125, -0.4086151123046875, -0.39312744140625, -0.3776397705078125, -0.362152099609375, -0.3466644287109375, -0.3311767578125, -0.3156890869140625, -0.300201416015625, -0.2847137451171875, -0.26922607421875, -0.2537384033203125, -0.238250732421875, -0.2227630615234375, -0.207275390625, -0.1917877197265625, -0.176300048828125, -0.1608123779296875, -0.14532470703125, -0.1298370361328125, -0.114349365234375, -0.0988616943359375, -0.0833740234375, -0.0678863525390625, -0.052398681640625, -0.0369110107421875, -0.02142333984375, -0.0059356689453125, 0.009552001953125, 0.0250396728515625, 0.04052734375, 0.0560150146484375, 0.071502685546875, 0.0869903564453125, 0.10247802734375, 0.1179656982421875, 0.133453369140625, 0.1489410400390625, 0.1644287109375, 0.1799163818359375, 0.195404052734375, 0.2108917236328125, 0.22637939453125, 0.2418670654296875, 0.257354736328125, 0.2728424072265625, 0.288330078125, 0.3038177490234375, 0.319305419921875, 0.3347930908203125, 0.35028076171875, 0.3657684326171875, 0.381256103515625, 0.3967437744140625, 0.4122314453125, 0.4277191162109375, 0.443206787109375, 0.4586944580078125, 0.47418212890625, 0.4896697998046875, 0.505157470703125, 0.5206451416015625, 0.5361328125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 6.0, 20.0, 47.0, 68.0, 98.0, 171.0, 183.0, 142.0, 102.0, 66.0, 42.0, 20.0, 7.0, 9.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.496323585510254, -6.120082378387451, -5.743841171264648, -5.367599964141846, -4.991358757019043, -4.61511754989624, -4.2388763427734375, -3.8626351356506348, -3.486393928527832, -3.1101527214050293, -2.7339115142822266, -2.357670307159424, -1.981429100036621, -1.6051878929138184, -1.2289466857910156, -0.8527054786682129, -0.47646427154541016, -0.10022306442260742, 0.2760181427001953, 0.652259349822998, 1.0285005569458008, 1.4047417640686035, 1.7809829711914062, 2.157224178314209, 2.5334653854370117, 2.9097065925598145, 3.285947799682617, 3.66218900680542, 4.038430213928223, 4.414671421051025, 4.790912628173828, 5.167153835296631, 5.54339599609375, 5.919637203216553, 6.2958784103393555, 6.672119617462158, 7.048360824584961, 7.424602031707764, 7.800843238830566, 8.177083969116211, 8.553325653076172, 8.929567337036133, 9.305808067321777, 9.682048797607422, 10.058290481567383, 10.434532165527344, 10.810772895812988, 11.187013626098633, 11.563255310058594, 11.939496994018555, 12.3157377243042, 12.691978454589844, 13.068220138549805, 13.444461822509766, 13.82070255279541, 14.196943283081055, 14.573184967041016, 14.949426651000977, 15.325667381286621, 15.701908111572266, 16.078149795532227, 16.454391479492188, 16.830631256103516, 17.206872940063477, 17.583114624023438]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 5.0, 16.0, 17.0, 13.0, 13.0, 28.0, 32.0, 28.0, 27.0, 40.0, 43.0, 47.0, 52.0, 49.0, 51.0, 61.0, 40.0, 55.0, 42.0, 59.0, 46.0, 36.0, 36.0, 21.0, 27.0, 16.0, 23.0, 12.0, 11.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.030461311340332, -5.819243907928467, -5.608026504516602, -5.396809101104736, -5.185591697692871, -4.974374771118164, -4.763157367706299, -4.551939964294434, -4.340722560882568, -4.129505157470703, -3.918287754058838, -3.7070705890655518, -3.4958531856536865, -3.2846357822418213, -3.073418617248535, -2.86220121383667, -2.6509838104248047, -2.4397664070129395, -2.228549003601074, -2.017331838607788, -1.8061144351959229, -1.5948970317840576, -1.383679747581482, -1.1724624633789062, -0.961245059967041, -0.7500277161598206, -0.5388103723526001, -0.32759302854537964, -0.11637568473815918, 0.09484171867370605, 0.30605900287628174, 0.5172762870788574, 0.7284936904907227, 0.9397110342979431, 1.1509283781051636, 1.3621456623077393, 1.5733630657196045, 1.7845804691314697, 1.9957977533340454, 2.207015037536621, 2.4182324409484863, 2.6294498443603516, 2.840667247772217, 3.051884412765503, 3.263101816177368, 3.4743192195892334, 3.6855363845825195, 3.8967537879943848, 4.10797119140625, 4.319188594818115, 4.5304059982299805, 4.741623401641846, 4.952840805053711, 5.164057731628418, 5.375275135040283, 5.586492538452148, 5.797709941864014, 6.008927345275879, 6.220144748687744, 6.431362152099609, 6.642579078674316, 6.85379695892334, 7.065013885498047, 7.276231288909912, 7.487448692321777]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 12.0, 17.0, 26.0, 65.0, 147.0, 309.0, 1054.0, 4010.0, 21851.0, 330096.0, 3776728.0, 49994.0, 7322.0, 1772.0, 517.0, 174.0, 85.0, 47.0, 23.0, 18.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.49359130859375, -2.4110107421875, -2.32843017578125, -2.245849609375, -2.16326904296875, -2.0806884765625, -1.99810791015625, -1.91552734375, -1.83294677734375, -1.7503662109375, -1.66778564453125, -1.585205078125, -1.50262451171875, -1.4200439453125, -1.33746337890625, -1.2548828125, -1.17230224609375, -1.0897216796875, -1.00714111328125, -0.924560546875, -0.84197998046875, -0.7593994140625, -0.67681884765625, -0.59423828125, -0.51165771484375, -0.4290771484375, -0.34649658203125, -0.263916015625, -0.18133544921875, -0.0987548828125, -0.01617431640625, 0.06640625, 0.14898681640625, 0.2315673828125, 0.31414794921875, 0.396728515625, 0.47930908203125, 0.5618896484375, 0.64447021484375, 0.72705078125, 0.80963134765625, 0.8922119140625, 0.97479248046875, 1.057373046875, 1.13995361328125, 1.2225341796875, 1.30511474609375, 1.3876953125, 1.47027587890625, 1.5528564453125, 1.63543701171875, 1.718017578125, 1.80059814453125, 1.8831787109375, 1.96575927734375, 2.04833984375, 2.13092041015625, 2.2135009765625, 2.29608154296875, 2.378662109375, 2.46124267578125, 2.5438232421875, 2.62640380859375, 2.708984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 9.0, 13.0, 28.0, 26.0, 51.0, 51.0, 55.0, 91.0, 72.0, 75.0, 91.0, 73.0, 77.0, 70.0, 45.0, 43.0, 38.0, 34.0, 16.0, 13.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.412841796875, -0.4014015197753906, -0.38996124267578125, -0.3785209655761719, -0.3670806884765625, -0.3556404113769531, -0.34420013427734375, -0.3327598571777344, -0.321319580078125, -0.3098793029785156, -0.29843902587890625, -0.2869987487792969, -0.2755584716796875, -0.2641181945800781, -0.25267791748046875, -0.24123764038085938, -0.22979736328125, -0.21835708618164062, -0.20691680908203125, -0.19547653198242188, -0.1840362548828125, -0.17259597778320312, -0.16115570068359375, -0.14971542358398438, -0.138275146484375, -0.12683486938476562, -0.11539459228515625, -0.10395431518554688, -0.0925140380859375, -0.08107376098632812, -0.06963348388671875, -0.058193206787109375, -0.0467529296875, -0.035312652587890625, -0.02387237548828125, -0.012432098388671875, -0.0009918212890625, 0.010448455810546875, 0.02188873291015625, 0.033329010009765625, 0.044769287109375, 0.056209564208984375, 0.06764984130859375, 0.07909011840820312, 0.0905303955078125, 0.10197067260742188, 0.11341094970703125, 0.12485122680664062, 0.13629150390625, 0.14773178100585938, 0.15917205810546875, 0.17061233520507812, 0.1820526123046875, 0.19349288940429688, 0.20493316650390625, 0.21637344360351562, 0.227813720703125, 0.23925399780273438, 0.25069427490234375, 0.2621345520019531, 0.2735748291015625, 0.2850151062011719, 0.29645538330078125, 0.3078956604003906, 0.3193359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 12.0, 8.0, 15.0, 32.0, 43.0, 60.0, 94.0, 117.0, 233.0, 418.0, 692.0, 1327.0, 2817.0, 6235.0, 15738.0, 47997.0, 204635.0, 3059717.0, 703659.0, 102845.0, 28857.0, 10402.0, 4233.0, 1943.0, 977.0, 497.0, 289.0, 140.0, 82.0, 67.0, 34.0, 21.0, 16.0, 7.0, 14.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.322418212890625, -1.28546142578125, -1.248504638671875, -1.2115478515625, -1.174591064453125, -1.13763427734375, -1.100677490234375, -1.063720703125, -1.026763916015625, -0.98980712890625, -0.952850341796875, -0.9158935546875, -0.878936767578125, -0.84197998046875, -0.805023193359375, -0.76806640625, -0.731109619140625, -0.69415283203125, -0.657196044921875, -0.6202392578125, -0.583282470703125, -0.54632568359375, -0.509368896484375, -0.472412109375, -0.435455322265625, -0.39849853515625, -0.361541748046875, -0.3245849609375, -0.287628173828125, -0.25067138671875, -0.213714599609375, -0.1767578125, -0.139801025390625, -0.10284423828125, -0.065887451171875, -0.0289306640625, 0.008026123046875, 0.04498291015625, 0.081939697265625, 0.118896484375, 0.155853271484375, 0.19281005859375, 0.229766845703125, 0.2667236328125, 0.303680419921875, 0.34063720703125, 0.377593994140625, 0.41455078125, 0.451507568359375, 0.48846435546875, 0.525421142578125, 0.5623779296875, 0.599334716796875, 0.63629150390625, 0.673248291015625, 0.710205078125, 0.747161865234375, 0.78411865234375, 0.821075439453125, 0.8580322265625, 0.894989013671875, 0.93194580078125, 0.968902587890625, 1.005859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 13.0, 8.0, 9.0, 19.0, 27.0, 40.0, 51.0, 79.0, 96.0, 200.0, 323.0, 1243.0, 1057.0, 356.0, 173.0, 99.0, 65.0, 44.0, 47.0, 28.0, 14.0, 14.0, 14.0, 14.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.406005859375, -0.39531707763671875, -0.3846282958984375, -0.37393951416015625, -0.363250732421875, -0.35256195068359375, -0.3418731689453125, -0.33118438720703125, -0.32049560546875, -0.30980682373046875, -0.2991180419921875, -0.28842926025390625, -0.277740478515625, -0.26705169677734375, -0.2563629150390625, -0.24567413330078125, -0.2349853515625, -0.22429656982421875, -0.2136077880859375, -0.20291900634765625, -0.192230224609375, -0.18154144287109375, -0.1708526611328125, -0.16016387939453125, -0.14947509765625, -0.13878631591796875, -0.1280975341796875, -0.11740875244140625, -0.106719970703125, -0.09603118896484375, -0.0853424072265625, -0.07465362548828125, -0.06396484375, -0.05327606201171875, -0.0425872802734375, -0.03189849853515625, -0.021209716796875, -0.01052093505859375, 0.0001678466796875, 0.01085662841796875, 0.02154541015625, 0.03223419189453125, 0.0429229736328125, 0.05361175537109375, 0.064300537109375, 0.07498931884765625, 0.0856781005859375, 0.09636688232421875, 0.1070556640625, 0.11774444580078125, 0.1284332275390625, 0.13912200927734375, 0.149810791015625, 0.16049957275390625, 0.1711883544921875, 0.18187713623046875, 0.19256591796875, 0.20325469970703125, 0.2139434814453125, 0.22463226318359375, 0.235321044921875, 0.24600982666015625, 0.2566986083984375, 0.26738739013671875, 0.278076171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 12.0, 21.0, 63.0, 110.0, 178.0, 198.0, 185.0, 127.0, 56.0, 22.0, 19.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951761245727539, -3.834469795227051, -3.7171785831451416, -3.5998871326446533, -3.482595682144165, -3.365304470062256, -3.2480130195617676, -3.1307215690612793, -3.013430118560791, -2.8961386680603027, -2.7788474559783936, -2.6615560054779053, -2.544264554977417, -2.426973342895508, -2.3096818923950195, -2.1923904418945312, -2.075099229812622, -1.9578078985214233, -1.840516448020935, -1.7232251167297363, -1.605933666229248, -1.4886423349380493, -1.3713510036468506, -1.2540595531463623, -1.1367682218551636, -1.0194768905639648, -0.9021854400634766, -0.7848941087722778, -0.6676027178764343, -0.5503113269805908, -0.4330199956893921, -0.3157286047935486, -0.19843721389770508, -0.08114583790302277, 0.036145538091659546, 0.15343689918518066, 0.27072829008102417, 0.3880196809768677, 0.5053110122680664, 0.6226024031639099, 0.7398937940597534, 0.8571851849555969, 0.9744765758514404, 1.0917679071426392, 1.209059238433838, 1.3263506889343262, 1.443642020225525, 1.5609333515167236, 1.678224802017212, 1.7955161333084106, 1.912807583808899, 2.0300989151000977, 2.147390365600586, 2.264681816101074, 2.3819730281829834, 2.4992644786834717, 2.616555690765381, 2.733847141265869, 2.8511383533477783, 2.9684298038482666, 3.085721254348755, 3.203012466430664, 3.3203039169311523, 3.4375953674316406, 3.554886817932129]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 4.0, 10.0, 10.0, 4.0, 11.0, 8.0, 10.0, 20.0, 16.0, 18.0, 26.0, 27.0, 36.0, 39.0, 46.0, 39.0, 39.0, 51.0, 53.0, 45.0, 29.0, 38.0, 48.0, 41.0, 44.0, 28.0, 31.0, 27.0, 27.0, 32.0, 16.0, 16.0, 16.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 5.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0928044319152832, -1.0589731931686401, -1.025141954421997, -0.991310715675354, -0.9574794769287109, -0.9236482381820679, -0.8898169994354248, -0.8559857606887817, -0.8221545219421387, -0.7883232831954956, -0.7544920444488525, -0.7206608057022095, -0.6868295669555664, -0.6529983282089233, -0.6191670894622803, -0.5853358507156372, -0.5515046715736389, -0.5176734328269958, -0.4838421940803528, -0.4500109553337097, -0.41617971658706665, -0.3823484778404236, -0.3485172688961029, -0.31468603014945984, -0.2808547914028168, -0.2470235526561737, -0.21319231390953064, -0.17936109006404877, -0.1455298513174057, -0.11169861257076263, -0.07786738872528076, -0.044036149978637695, -0.010204911231994629, 0.02362632378935814, 0.05745755881071091, 0.09128879010677338, 0.12512002885341644, 0.1589512676000595, 0.19278249144554138, 0.22661373019218445, 0.2604449689388275, 0.2942762076854706, 0.32810744643211365, 0.3619386553764343, 0.3957698941230774, 0.42960113286972046, 0.4634323716163635, 0.4972636103630066, 0.5310948491096497, 0.5649260878562927, 0.5987573266029358, 0.6325885653495789, 0.6664198040962219, 0.700251042842865, 0.7340822219848633, 0.7679134607315063, 0.8017446994781494, 0.8355759382247925, 0.8694071769714355, 0.9032384157180786, 0.9370696544647217, 0.9709008932113647, 1.0047321319580078, 1.0385633707046509, 1.072394609451294]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 16.0, 26.0, 36.0, 73.0, 135.0, 203.0, 391.0, 834.0, 2002.0, 5618.0, 19281.0, 81853.0, 311548.0, 428725.0, 148940.0, 34606.0, 9004.0, 2970.0, 1148.0, 510.0, 243.0, 150.0, 88.0, 52.0, 38.0, 9.0, 16.0, 11.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.5965576171875, -1.543701171875, -1.4908447265625, -1.43798828125, -1.3851318359375, -1.332275390625, -1.2794189453125, -1.2265625, -1.1737060546875, -1.120849609375, -1.0679931640625, -1.01513671875, -0.9622802734375, -0.909423828125, -0.8565673828125, -0.8037109375, -0.7508544921875, -0.697998046875, -0.6451416015625, -0.59228515625, -0.5394287109375, -0.486572265625, -0.4337158203125, -0.380859375, -0.3280029296875, -0.275146484375, -0.2222900390625, -0.16943359375, -0.1165771484375, -0.063720703125, -0.0108642578125, 0.0419921875, 0.0948486328125, 0.147705078125, 0.2005615234375, 0.25341796875, 0.3062744140625, 0.359130859375, 0.4119873046875, 0.46484375, 0.5177001953125, 0.570556640625, 0.6234130859375, 0.67626953125, 0.7291259765625, 0.781982421875, 0.8348388671875, 0.8876953125, 0.9405517578125, 0.993408203125, 1.0462646484375, 1.09912109375, 1.1519775390625, 1.204833984375, 1.2576904296875, 1.310546875, 1.3634033203125, 1.416259765625, 1.4691162109375, 1.52197265625, 1.5748291015625, 1.627685546875, 1.6805419921875, 1.7333984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 18.0, 22.0, 33.0, 42.0, 56.0, 57.0, 52.0, 89.0, 79.0, 77.0, 89.0, 69.0, 67.0, 54.0, 41.0, 39.0, 30.0, 26.0, 17.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.408447265625, -0.397186279296875, -0.38592529296875, -0.374664306640625, -0.3634033203125, -0.352142333984375, -0.34088134765625, -0.329620361328125, -0.318359375, -0.307098388671875, -0.29583740234375, -0.284576416015625, -0.2733154296875, -0.262054443359375, -0.25079345703125, -0.239532470703125, -0.228271484375, -0.217010498046875, -0.20574951171875, -0.194488525390625, -0.1832275390625, -0.171966552734375, -0.16070556640625, -0.149444580078125, -0.13818359375, -0.126922607421875, -0.11566162109375, -0.104400634765625, -0.0931396484375, -0.081878662109375, -0.07061767578125, -0.059356689453125, -0.048095703125, -0.036834716796875, -0.02557373046875, -0.014312744140625, -0.0030517578125, 0.008209228515625, 0.01947021484375, 0.030731201171875, 0.0419921875, 0.053253173828125, 0.06451416015625, 0.075775146484375, 0.0870361328125, 0.098297119140625, 0.10955810546875, 0.120819091796875, 0.132080078125, 0.143341064453125, 0.15460205078125, 0.165863037109375, 0.1771240234375, 0.188385009765625, 0.19964599609375, 0.210906982421875, 0.22216796875, 0.233428955078125, 0.24468994140625, 0.255950927734375, 0.2672119140625, 0.278472900390625, 0.28973388671875, 0.300994873046875, 0.312255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 9.0, 4.0, 8.0, 15.0, 21.0, 33.0, 33.0, 43.0, 84.0, 115.0, 173.0, 233.0, 321.0, 497.0, 829.0, 1471.0, 3216.0, 8242.0, 25598.0, 90615.0, 280873.0, 391167.0, 170648.0, 49454.0, 14550.0, 4966.0, 2302.0, 1112.0, 631.0, 395.0, 272.0, 178.0, 122.0, 88.0, 66.0, 50.0, 27.0, 24.0, 13.0, 16.0, 16.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4208984375, -1.379425048828125, -1.33795166015625, -1.296478271484375, -1.2550048828125, -1.213531494140625, -1.17205810546875, -1.130584716796875, -1.089111328125, -1.047637939453125, -1.00616455078125, -0.964691162109375, -0.9232177734375, -0.881744384765625, -0.84027099609375, -0.798797607421875, -0.75732421875, -0.715850830078125, -0.67437744140625, -0.632904052734375, -0.5914306640625, -0.549957275390625, -0.50848388671875, -0.467010498046875, -0.425537109375, -0.384063720703125, -0.34259033203125, -0.301116943359375, -0.2596435546875, -0.218170166015625, -0.17669677734375, -0.135223388671875, -0.09375, -0.052276611328125, -0.01080322265625, 0.030670166015625, 0.0721435546875, 0.113616943359375, 0.15509033203125, 0.196563720703125, 0.238037109375, 0.279510498046875, 0.32098388671875, 0.362457275390625, 0.4039306640625, 0.445404052734375, 0.48687744140625, 0.528350830078125, 0.56982421875, 0.611297607421875, 0.65277099609375, 0.694244384765625, 0.7357177734375, 0.777191162109375, 0.81866455078125, 0.860137939453125, 0.901611328125, 0.943084716796875, 0.98455810546875, 1.026031494140625, 1.0675048828125, 1.108978271484375, 1.15045166015625, 1.191925048828125, 1.2333984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 8.0, 6.0, 2.0, 7.0, 7.0, 11.0, 6.0, 12.0, 18.0, 9.0, 19.0, 28.0, 23.0, 32.0, 39.0, 27.0, 38.0, 39.0, 32.0, 38.0, 44.0, 42.0, 33.0, 31.0, 40.0, 31.0, 37.0, 32.0, 27.0, 48.0, 32.0, 25.0, 20.0, 24.0, 20.0, 18.0, 19.0, 16.0, 9.0, 2.0, 11.0, 6.0, 6.0, 7.0, 9.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.94873046875, -0.9200515747070312, -0.8913726806640625, -0.8626937866210938, -0.834014892578125, -0.8053359985351562, -0.7766571044921875, -0.7479782104492188, -0.71929931640625, -0.6906204223632812, -0.6619415283203125, -0.6332626342773438, -0.604583740234375, -0.5759048461914062, -0.5472259521484375, -0.5185470581054688, -0.4898681640625, -0.46118927001953125, -0.4325103759765625, -0.40383148193359375, -0.375152587890625, -0.34647369384765625, -0.3177947998046875, -0.28911590576171875, -0.26043701171875, -0.23175811767578125, -0.2030792236328125, -0.17440032958984375, -0.145721435546875, -0.11704254150390625, -0.0883636474609375, -0.05968475341796875, -0.031005859375, -0.00232696533203125, 0.0263519287109375, 0.05503082275390625, 0.083709716796875, 0.11238861083984375, 0.1410675048828125, 0.16974639892578125, 0.19842529296875, 0.22710418701171875, 0.2557830810546875, 0.28446197509765625, 0.313140869140625, 0.34181976318359375, 0.3704986572265625, 0.39917755126953125, 0.4278564453125, 0.45653533935546875, 0.4852142333984375, 0.5138931274414062, 0.542572021484375, 0.5712509155273438, 0.5999298095703125, 0.6286087036132812, 0.65728759765625, 0.6859664916992188, 0.7146453857421875, 0.7433242797851562, 0.772003173828125, 0.8006820678710938, 0.8293609619140625, 0.8580398559570312, 0.88671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 8.0, 9.0, 13.0, 15.0, 16.0, 29.0, 40.0, 80.0, 130.0, 264.0, 549.0, 1459.0, 3983.0, 14047.0, 85369.0, 706357.0, 203444.0, 23237.0, 5927.0, 1989.0, 772.0, 336.0, 154.0, 96.0, 69.0, 56.0, 26.0, 14.0, 15.0, 9.0, 11.0, 10.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.34906005859375, -1.3035888671875, -1.25811767578125, -1.212646484375, -1.16717529296875, -1.1217041015625, -1.07623291015625, -1.03076171875, -0.98529052734375, -0.9398193359375, -0.89434814453125, -0.848876953125, -0.80340576171875, -0.7579345703125, -0.71246337890625, -0.6669921875, -0.62152099609375, -0.5760498046875, -0.53057861328125, -0.485107421875, -0.43963623046875, -0.3941650390625, -0.34869384765625, -0.30322265625, -0.25775146484375, -0.2122802734375, -0.16680908203125, -0.121337890625, -0.07586669921875, -0.0303955078125, 0.01507568359375, 0.060546875, 0.10601806640625, 0.1514892578125, 0.19696044921875, 0.242431640625, 0.28790283203125, 0.3333740234375, 0.37884521484375, 0.42431640625, 0.46978759765625, 0.5152587890625, 0.56072998046875, 0.606201171875, 0.65167236328125, 0.6971435546875, 0.74261474609375, 0.7880859375, 0.83355712890625, 0.8790283203125, 0.92449951171875, 0.969970703125, 1.01544189453125, 1.0609130859375, 1.10638427734375, 1.15185546875, 1.19732666015625, 1.2427978515625, 1.28826904296875, 1.333740234375, 1.37921142578125, 1.4246826171875, 1.47015380859375, 1.515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 4.0, 12.0, 25.0, 13.0, 34.0, 40.0, 73.0, 71.0, 92.0, 111.0, 110.0, 88.0, 85.0, 52.0, 49.0, 36.0, 21.0, 13.0, 21.0, 7.0, 8.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001437664031982422, -0.0001380518078804016, -0.00013233721256256104, -0.00012662261724472046, -0.00012090802192687988, -0.0001151934266090393, -0.00010947883129119873, -0.00010376423597335815, -9.804964065551758e-05, -9.2335045337677e-05, -8.662045001983643e-05, -8.090585470199585e-05, -7.519125938415527e-05, -6.94766640663147e-05, -6.376206874847412e-05, -5.8047473430633545e-05, -5.233287811279297e-05, -4.661828279495239e-05, -4.0903687477111816e-05, -3.518909215927124e-05, -2.9474496841430664e-05, -2.3759901523590088e-05, -1.8045306205749512e-05, -1.2330710887908936e-05, -6.616115570068359e-06, -9.015202522277832e-07, 4.813075065612793e-06, 1.0527670383453369e-05, 1.6242265701293945e-05, 2.195686101913452e-05, 2.7671456336975098e-05, 3.3386051654815674e-05, 3.910064697265625e-05, 4.4815242290496826e-05, 5.05298376083374e-05, 5.624443292617798e-05, 6.195902824401855e-05, 6.767362356185913e-05, 7.338821887969971e-05, 7.910281419754028e-05, 8.481740951538086e-05, 9.053200483322144e-05, 9.624660015106201e-05, 0.00010196119546890259, 0.00010767579078674316, 0.00011339038610458374, 0.00011910498142242432, 0.0001248195767402649, 0.00013053417205810547, 0.00013624876737594604, 0.00014196336269378662, 0.0001476779580116272, 0.00015339255332946777, 0.00015910714864730835, 0.00016482174396514893, 0.0001705363392829895, 0.00017625093460083008, 0.00018196552991867065, 0.00018768012523651123, 0.0001933947205543518, 0.00019910931587219238, 0.00020482391119003296, 0.00021053850650787354, 0.0002162531018257141, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 2.0, 14.0, 20.0, 46.0, 30.0, 55.0, 120.0, 267.0, 650.0, 1746.0, 5854.0, 35612.0, 795009.0, 189977.0, 14078.0, 3157.0, 1025.0, 427.0, 184.0, 107.0, 66.0, 32.0, 17.0, 16.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8284454345703125, -1.757476806640625, -1.6865081787109375, -1.61553955078125, -1.5445709228515625, -1.473602294921875, -1.4026336669921875, -1.3316650390625, -1.2606964111328125, -1.189727783203125, -1.1187591552734375, -1.04779052734375, -0.9768218994140625, -0.905853271484375, -0.8348846435546875, -0.763916015625, -0.6929473876953125, -0.621978759765625, -0.5510101318359375, -0.48004150390625, -0.4090728759765625, -0.338104248046875, -0.2671356201171875, -0.1961669921875, -0.1251983642578125, -0.054229736328125, 0.0167388916015625, 0.08770751953125, 0.1586761474609375, 0.229644775390625, 0.3006134033203125, 0.37158203125, 0.4425506591796875, 0.513519287109375, 0.5844879150390625, 0.65545654296875, 0.7264251708984375, 0.797393798828125, 0.8683624267578125, 0.9393310546875, 1.0102996826171875, 1.081268310546875, 1.1522369384765625, 1.22320556640625, 1.2941741943359375, 1.365142822265625, 1.4361114501953125, 1.507080078125, 1.5780487060546875, 1.649017333984375, 1.7199859619140625, 1.79095458984375, 1.8619232177734375, 1.932891845703125, 2.0038604736328125, 2.0748291015625, 2.1457977294921875, 2.216766357421875, 2.2877349853515625, 2.35870361328125, 2.4296722412109375, 2.500640869140625, 2.5716094970703125, 2.642578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 7.0, 7.0, 27.0, 51.0, 55.0, 117.0, 145.0, 161.0, 140.0, 96.0, 49.0, 39.0, 36.0, 16.0, 11.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.94219970703125, -0.9078369140625, -0.87347412109375, -0.839111328125, -0.80474853515625, -0.7703857421875, -0.73602294921875, -0.70166015625, -0.66729736328125, -0.6329345703125, -0.59857177734375, -0.564208984375, -0.52984619140625, -0.4954833984375, -0.46112060546875, -0.4267578125, -0.39239501953125, -0.3580322265625, -0.32366943359375, -0.289306640625, -0.25494384765625, -0.2205810546875, -0.18621826171875, -0.15185546875, -0.11749267578125, -0.0831298828125, -0.04876708984375, -0.014404296875, 0.01995849609375, 0.0543212890625, 0.08868408203125, 0.123046875, 0.15740966796875, 0.1917724609375, 0.22613525390625, 0.260498046875, 0.29486083984375, 0.3292236328125, 0.36358642578125, 0.39794921875, 0.43231201171875, 0.4666748046875, 0.50103759765625, 0.535400390625, 0.56976318359375, 0.6041259765625, 0.63848876953125, 0.6728515625, 0.70721435546875, 0.7415771484375, 0.77593994140625, 0.810302734375, 0.84466552734375, 0.8790283203125, 0.91339111328125, 0.94775390625, 0.98211669921875, 1.0164794921875, 1.05084228515625, 1.085205078125, 1.11956787109375, 1.1539306640625, 1.18829345703125, 1.22265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 17.0, 31.0, 68.0, 95.0, 161.0, 153.0, 156.0, 153.0, 76.0, 43.0, 22.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.84821319580078, -18.425582885742188, -18.002952575683594, -17.580322265625, -17.157691955566406, -16.735061645507812, -16.31243133544922, -15.889801979064941, -15.467171669006348, -15.044541358947754, -14.62191104888916, -14.199280738830566, -13.776651382446289, -13.354021072387695, -12.931390762329102, -12.508760452270508, -12.086130142211914, -11.66349983215332, -11.240869522094727, -10.818239212036133, -10.395608901977539, -9.972978591918945, -9.550349235534668, -9.127718925476074, -8.70508861541748, -8.282458305358887, -7.859827995300293, -7.437198162078857, -7.014567852020264, -6.59193754196167, -6.169307708740234, -5.746677398681641, -5.324047088623047, -4.901416778564453, -4.478786468505859, -4.056156635284424, -3.63352632522583, -3.2108960151672363, -2.7882659435272217, -2.365635871887207, -1.9430055618286133, -1.520375370979309, -1.0977451801300049, -0.6751149892807007, -0.2524847984313965, 0.17014551162719727, 0.5927755832672119, 1.0154056549072266, 1.4380359649658203, 1.8606661558151245, 2.2832963466644287, 2.7059264183044434, 3.128556728363037, 3.551187038421631, 3.9738171100616455, 4.39644718170166, 4.819077491760254, 5.241707801818848, 5.664338111877441, 6.086967945098877, 6.509598255157471, 6.9322285652160645, 7.3548583984375, 7.777488708496094, 8.200119018554688]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 11.0, 12.0, 10.0, 10.0, 19.0, 17.0, 19.0, 16.0, 16.0, 33.0, 25.0, 30.0, 36.0, 37.0, 38.0, 34.0, 45.0, 35.0, 50.0, 37.0, 36.0, 55.0, 38.0, 35.0, 37.0, 40.0, 34.0, 21.0, 28.0, 29.0, 19.0, 15.0, 19.0, 12.0, 6.0, 9.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.233152866363525, -6.054147720336914, -5.875142574310303, -5.696137428283691, -5.51713228225708, -5.338127136230469, -5.159121990203857, -4.980116844177246, -4.801111698150635, -4.622106552124023, -4.443101406097412, -4.264096260070801, -4.0850911140441895, -3.906085968017578, -3.727080821990967, -3.5480756759643555, -3.369070291519165, -3.1900651454925537, -3.0110599994659424, -2.832054853439331, -2.6530497074127197, -2.4740445613861084, -2.295039176940918, -2.1160340309143066, -1.9370290040969849, -1.7580238580703735, -1.5790187120437622, -1.4000134468078613, -1.22100830078125, -1.0420031547546387, -0.8629980087280273, -0.683992862701416, -0.5049877166748047, -0.32598257064819336, -0.14697739481925964, 0.03202778100967407, 0.2110329270362854, 0.39003807306289673, 0.5690432786941528, 0.7480484247207642, 0.9270535707473755, 1.1060587167739868, 1.2850638628005981, 1.464069128036499, 1.6430742740631104, 1.8220794200897217, 2.001084566116333, 2.1800897121429443, 2.3590948581695557, 2.538100004196167, 2.7171051502227783, 2.8961102962493896, 3.075115442276001, 3.2541205883026123, 3.4331259727478027, 3.612131118774414, 3.7911362648010254, 3.9701414108276367, 4.149146556854248, 4.328151702880859, 4.507156848907471, 4.686161994934082, 4.865167140960693, 5.044172286987305, 5.223177433013916]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 4.0, 12.0, 7.0, 16.0, 26.0, 31.0, 51.0, 86.0, 137.0, 275.0, 554.0, 1214.0, 2846.0, 7906.0, 26393.0, 120730.0, 2762850.0, 1140700.0, 96234.0, 22386.0, 7031.0, 2532.0, 1097.0, 525.0, 274.0, 138.0, 85.0, 39.0, 30.0, 16.0, 16.0, 9.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2464447021484375, -1.204803466796875, -1.1631622314453125, -1.12152099609375, -1.0798797607421875, -1.038238525390625, -0.9965972900390625, -0.9549560546875, -0.9133148193359375, -0.871673583984375, -0.8300323486328125, -0.78839111328125, -0.7467498779296875, -0.705108642578125, -0.6634674072265625, -0.621826171875, -0.5801849365234375, -0.538543701171875, -0.4969024658203125, -0.45526123046875, -0.4136199951171875, -0.371978759765625, -0.3303375244140625, -0.2886962890625, -0.2470550537109375, -0.205413818359375, -0.1637725830078125, -0.12213134765625, -0.0804901123046875, -0.038848876953125, 0.0027923583984375, 0.04443359375, 0.0860748291015625, 0.127716064453125, 0.1693572998046875, 0.21099853515625, 0.2526397705078125, 0.294281005859375, 0.3359222412109375, 0.3775634765625, 0.4192047119140625, 0.460845947265625, 0.5024871826171875, 0.54412841796875, 0.5857696533203125, 0.627410888671875, 0.6690521240234375, 0.710693359375, 0.7523345947265625, 0.793975830078125, 0.8356170654296875, 0.87725830078125, 0.9188995361328125, 0.960540771484375, 1.0021820068359375, 1.0438232421875, 1.0854644775390625, 1.127105712890625, 1.1687469482421875, 1.21038818359375, 1.2520294189453125, 1.293670654296875, 1.3353118896484375, 1.376953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 22.0, 32.0, 52.0, 52.0, 64.0, 66.0, 79.0, 96.0, 85.0, 81.0, 75.0, 69.0, 42.0, 39.0, 33.0, 27.0, 20.0, 18.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424072265625, -0.4115715026855469, -0.39907073974609375, -0.3865699768066406, -0.3740692138671875, -0.3615684509277344, -0.34906768798828125, -0.3365669250488281, -0.324066162109375, -0.3115653991699219, -0.29906463623046875, -0.2865638732910156, -0.2740631103515625, -0.2615623474121094, -0.24906158447265625, -0.23656082153320312, -0.22406005859375, -0.21155929565429688, -0.19905853271484375, -0.18655776977539062, -0.1740570068359375, -0.16155624389648438, -0.14905548095703125, -0.13655471801757812, -0.124053955078125, -0.11155319213867188, -0.09905242919921875, -0.08655166625976562, -0.0740509033203125, -0.061550140380859375, -0.04904937744140625, -0.036548614501953125, -0.0240478515625, -0.011547088623046875, 0.00095367431640625, 0.013454437255859375, 0.0259552001953125, 0.038455963134765625, 0.05095672607421875, 0.06345748901367188, 0.075958251953125, 0.08845901489257812, 0.10095977783203125, 0.11346054077148438, 0.1259613037109375, 0.13846206665039062, 0.15096282958984375, 0.16346359252929688, 0.17596435546875, 0.18846511840820312, 0.20096588134765625, 0.21346664428710938, 0.2259674072265625, 0.23846817016601562, 0.25096893310546875, 0.2634696960449219, 0.275970458984375, 0.2884712219238281, 0.30097198486328125, 0.3134727478027344, 0.3259735107421875, 0.3384742736816406, 0.35097503662109375, 0.3634757995605469, 0.3759765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 7.0, 9.0, 9.0, 10.0, 14.0, 22.0, 26.0, 36.0, 51.0, 75.0, 130.0, 166.0, 292.0, 438.0, 975.0, 1872.0, 3891.0, 9496.0, 25246.0, 83669.0, 391900.0, 2925274.0, 587899.0, 110828.0, 31409.0, 11265.0, 4698.0, 2129.0, 1031.0, 534.0, 323.0, 193.0, 104.0, 95.0, 64.0, 24.0, 25.0, 10.0, 13.0, 11.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9555892944335938, -0.9243621826171875, -0.8931350708007812, -0.861907958984375, -0.8306808471679688, -0.7994537353515625, -0.7682266235351562, -0.73699951171875, -0.7057723999023438, -0.6745452880859375, -0.6433181762695312, -0.612091064453125, -0.5808639526367188, -0.5496368408203125, -0.5184097290039062, -0.4871826171875, -0.45595550537109375, -0.4247283935546875, -0.39350128173828125, -0.362274169921875, -0.33104705810546875, -0.2998199462890625, -0.26859283447265625, -0.23736572265625, -0.20613861083984375, -0.1749114990234375, -0.14368438720703125, -0.112457275390625, -0.08123016357421875, -0.0500030517578125, -0.01877593994140625, 0.012451171875, 0.04367828369140625, 0.0749053955078125, 0.10613250732421875, 0.137359619140625, 0.16858673095703125, 0.1998138427734375, 0.23104095458984375, 0.26226806640625, 0.29349517822265625, 0.3247222900390625, 0.35594940185546875, 0.387176513671875, 0.41840362548828125, 0.4496307373046875, 0.48085784912109375, 0.5120849609375, 0.5433120727539062, 0.5745391845703125, 0.6057662963867188, 0.636993408203125, 0.6682205200195312, 0.6994476318359375, 0.7306747436523438, 0.76190185546875, 0.7931289672851562, 0.8243560791015625, 0.8555831909179688, 0.886810302734375, 0.9180374145507812, 0.9492645263671875, 0.9804916381835938, 1.01171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 24.0, 16.0, 19.0, 36.0, 74.0, 82.0, 144.0, 223.0, 402.0, 990.0, 1021.0, 394.0, 243.0, 152.0, 70.0, 53.0, 33.0, 21.0, 14.0, 19.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5767669677734375, -0.560272216796875, -0.5437774658203125, -0.52728271484375, -0.5107879638671875, -0.494293212890625, -0.4777984619140625, -0.4613037109375, -0.4448089599609375, -0.428314208984375, -0.4118194580078125, -0.39532470703125, -0.3788299560546875, -0.362335205078125, -0.3458404541015625, -0.329345703125, -0.3128509521484375, -0.296356201171875, -0.2798614501953125, -0.26336669921875, -0.2468719482421875, -0.230377197265625, -0.2138824462890625, -0.1973876953125, -0.1808929443359375, -0.164398193359375, -0.1479034423828125, -0.13140869140625, -0.1149139404296875, -0.098419189453125, -0.0819244384765625, -0.0654296875, -0.0489349365234375, -0.032440185546875, -0.0159454345703125, 0.00054931640625, 0.0170440673828125, 0.033538818359375, 0.0500335693359375, 0.0665283203125, 0.0830230712890625, 0.099517822265625, 0.1160125732421875, 0.13250732421875, 0.1490020751953125, 0.165496826171875, 0.1819915771484375, 0.198486328125, 0.2149810791015625, 0.231475830078125, 0.2479705810546875, 0.26446533203125, 0.2809600830078125, 0.297454833984375, 0.3139495849609375, 0.3304443359375, 0.3469390869140625, 0.363433837890625, 0.3799285888671875, 0.39642333984375, 0.4129180908203125, 0.429412841796875, 0.4459075927734375, 0.46240234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 17.0, 27.0, 38.0, 57.0, 92.0, 86.0, 100.0, 111.0, 96.0, 97.0, 69.0, 55.0, 30.0, 34.0, 24.0, 20.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7610864639282227, -2.670240640640259, -2.579395055770874, -2.48854923248291, -2.3977034091949463, -2.3068578243255615, -2.2160120010375977, -2.125166416168213, -2.034320592880249, -1.9434748888015747, -1.8526290655136108, -1.7617833614349365, -1.6709376573562622, -1.580091953277588, -1.489246129989624, -1.3984004259109497, -1.3075546026229858, -1.2167088985443115, -1.1258630752563477, -1.0350173711776733, -0.944171667098999, -0.8533259034156799, -0.7624801397323608, -0.6716344356536865, -0.5807886719703674, -0.4899429380893707, -0.399097204208374, -0.30825144052505493, -0.21740570664405823, -0.12655997276306152, -0.03571420907974243, 0.055131494998931885, 0.14597725868225098, 0.23682299256324768, 0.3276687264442444, 0.4185144901275635, 0.5093601942062378, 0.6002059578895569, 0.691051721572876, 0.7818974256515503, 0.8727431893348694, 0.9635889530181885, 1.0544346570968628, 1.145280361175537, 1.236126184463501, 1.3269718885421753, 1.4178175926208496, 1.5086634159088135, 1.5995091199874878, 1.690354824066162, 1.781200647354126, 1.8720463514328003, 1.9628920555114746, 2.0537378787994385, 2.1445837020874023, 2.235429286956787, 2.326275110244751, 2.417120933532715, 2.5079665184020996, 2.5988123416900635, 2.6896581649780273, 2.780503749847412, 2.871349573135376, 2.96219539642334, 3.0530409812927246]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 11.0, 10.0, 13.0, 10.0, 20.0, 22.0, 26.0, 23.0, 36.0, 31.0, 42.0, 42.0, 47.0, 51.0, 36.0, 42.0, 36.0, 45.0, 51.0, 37.0, 47.0, 38.0, 33.0, 36.0, 31.0, 30.0, 30.0, 25.0, 17.0, 17.0, 12.0, 13.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6502515077590942, -1.5969529151916504, -1.543654203414917, -1.4903556108474731, -1.4370570182800293, -1.383758306503296, -1.330459713935852, -1.2771611213684082, -1.2238624095916748, -1.170563817024231, -1.1172651052474976, -1.0639665126800537, -1.0106678009033203, -0.9573692083358765, -0.9040706157684326, -0.850771963596344, -0.7974733114242554, -0.7441746592521667, -0.6908760070800781, -0.6375774145126343, -0.5842787623405457, -0.530980110168457, -0.4776814877986908, -0.42438286542892456, -0.37108421325683594, -0.3177855610847473, -0.2644869387149811, -0.21118830144405365, -0.15788966417312622, -0.1045910120010376, -0.05129238963127136, 0.002006232738494873, 0.05530500411987305, 0.10860364139080048, 0.1619022786617279, 0.21520091593265533, 0.26849955320358276, 0.3217982053756714, 0.3750968277454376, 0.42839545011520386, 0.4816941022872925, 0.5349927544593811, 0.5882914066314697, 0.6415899991989136, 0.6948886513710022, 0.7481873035430908, 0.8014858961105347, 0.8547845482826233, 0.9080832004547119, 0.9613818526268005, 1.0146805047988892, 1.067979097366333, 1.1212778091430664, 1.1745764017105103, 1.227874994277954, 1.2811737060546875, 1.3344722986221313, 1.3877708911895752, 1.4410696029663086, 1.4943681955337524, 1.5476667881011963, 1.6009654998779297, 1.6542640924453735, 1.7075626850128174, 1.7608613967895508]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 14.0, 19.0, 30.0, 55.0, 98.0, 119.0, 258.0, 508.0, 1075.0, 2449.0, 6559.0, 19363.0, 61498.0, 195086.0, 425434.0, 228441.0, 72372.0, 22356.0, 7528.0, 2755.0, 1224.0, 581.0, 289.0, 151.0, 102.0, 68.0, 34.0, 26.0, 10.0, 6.0, 18.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.5949859619140625, -1.544464111328125, -1.4939422607421875, -1.44342041015625, -1.3928985595703125, -1.342376708984375, -1.2918548583984375, -1.2413330078125, -1.1908111572265625, -1.140289306640625, -1.0897674560546875, -1.03924560546875, -0.9887237548828125, -0.938201904296875, -0.8876800537109375, -0.837158203125, -0.7866363525390625, -0.736114501953125, -0.6855926513671875, -0.63507080078125, -0.5845489501953125, -0.534027099609375, -0.4835052490234375, -0.4329833984375, -0.3824615478515625, -0.331939697265625, -0.2814178466796875, -0.23089599609375, -0.1803741455078125, -0.129852294921875, -0.0793304443359375, -0.02880859375, 0.0217132568359375, 0.072235107421875, 0.1227569580078125, 0.17327880859375, 0.2238006591796875, 0.274322509765625, 0.3248443603515625, 0.3753662109375, 0.4258880615234375, 0.476409912109375, 0.5269317626953125, 0.57745361328125, 0.6279754638671875, 0.678497314453125, 0.7290191650390625, 0.779541015625, 0.8300628662109375, 0.880584716796875, 0.9311065673828125, 0.98162841796875, 1.0321502685546875, 1.082672119140625, 1.1331939697265625, 1.1837158203125, 1.2342376708984375, 1.284759521484375, 1.3352813720703125, 1.38580322265625, 1.4363250732421875, 1.486846923828125, 1.5373687744140625, 1.587890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 7.0, 16.0, 22.0, 28.0, 58.0, 52.0, 58.0, 79.0, 70.0, 98.0, 99.0, 81.0, 60.0, 59.0, 54.0, 40.0, 38.0, 33.0, 13.0, 6.0, 13.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.3940162658691406, -0.38129425048828125, -0.3685722351074219, -0.3558502197265625, -0.3431282043457031, -0.33040618896484375, -0.3176841735839844, -0.304962158203125, -0.2922401428222656, -0.27951812744140625, -0.2667961120605469, -0.2540740966796875, -0.24135208129882812, -0.22863006591796875, -0.21590805053710938, -0.20318603515625, -0.19046401977539062, -0.17774200439453125, -0.16501998901367188, -0.1522979736328125, -0.13957595825195312, -0.12685394287109375, -0.11413192749023438, -0.101409912109375, -0.08868789672851562, -0.07596588134765625, -0.06324386596679688, -0.0505218505859375, -0.037799835205078125, -0.02507781982421875, -0.012355804443359375, 0.0003662109375, 0.013088226318359375, 0.02581024169921875, 0.038532257080078125, 0.0512542724609375, 0.06397628784179688, 0.07669830322265625, 0.08942031860351562, 0.102142333984375, 0.11486434936523438, 0.12758636474609375, 0.14030838012695312, 0.1530303955078125, 0.16575241088867188, 0.17847442626953125, 0.19119644165039062, 0.20391845703125, 0.21664047241210938, 0.22936248779296875, 0.24208450317382812, 0.2548065185546875, 0.2675285339355469, 0.28025054931640625, 0.2929725646972656, 0.305694580078125, 0.3184165954589844, 0.33113861083984375, 0.3438606262207031, 0.3565826416015625, 0.3693046569824219, 0.38202667236328125, 0.3947486877441406, 0.407470703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 16.0, 15.0, 24.0, 32.0, 52.0, 52.0, 104.0, 164.0, 264.0, 420.0, 749.0, 1283.0, 2579.0, 5942.0, 15007.0, 41684.0, 117838.0, 288027.0, 335637.0, 150840.0, 53997.0, 19329.0, 7430.0, 3259.0, 1616.0, 798.0, 499.0, 303.0, 182.0, 129.0, 81.0, 48.0, 39.0, 18.0, 16.0, 18.0, 6.0, 9.0, 11.0, 5.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.3837890625, -1.3474960327148438, -1.3112030029296875, -1.2749099731445312, -1.238616943359375, -1.2023239135742188, -1.1660308837890625, -1.1297378540039062, -1.09344482421875, -1.0571517944335938, -1.0208587646484375, -0.9845657348632812, -0.948272705078125, -0.9119796752929688, -0.8756866455078125, -0.8393936157226562, -0.8031005859375, -0.7668075561523438, -0.7305145263671875, -0.6942214965820312, -0.657928466796875, -0.6216354370117188, -0.5853424072265625, -0.5490493774414062, -0.51275634765625, -0.47646331787109375, -0.4401702880859375, -0.40387725830078125, -0.367584228515625, -0.33129119873046875, -0.2949981689453125, -0.25870513916015625, -0.222412109375, -0.18611907958984375, -0.1498260498046875, -0.11353302001953125, -0.077239990234375, -0.04094696044921875, -0.0046539306640625, 0.03163909912109375, 0.06793212890625, 0.10422515869140625, 0.1405181884765625, 0.17681121826171875, 0.213104248046875, 0.24939727783203125, 0.2856903076171875, 0.32198333740234375, 0.3582763671875, 0.39456939697265625, 0.4308624267578125, 0.46715545654296875, 0.503448486328125, 0.5397415161132812, 0.5760345458984375, 0.6123275756835938, 0.64862060546875, 0.6849136352539062, 0.7212066650390625, 0.7574996948242188, 0.793792724609375, 0.8300857543945312, 0.8663787841796875, 0.9026718139648438, 0.93896484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 14.0, 17.0, 14.0, 16.0, 16.0, 25.0, 27.0, 26.0, 31.0, 31.0, 38.0, 35.0, 45.0, 43.0, 43.0, 51.0, 46.0, 46.0, 37.0, 36.0, 50.0, 28.0, 26.0, 45.0, 25.0, 33.0, 23.0, 19.0, 22.0, 15.0, 13.0, 12.0, 5.0, 6.0, 3.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.98828125, -0.9542083740234375, -0.920135498046875, -0.8860626220703125, -0.85198974609375, -0.8179168701171875, -0.783843994140625, -0.7497711181640625, -0.7156982421875, -0.6816253662109375, -0.647552490234375, -0.6134796142578125, -0.57940673828125, -0.5453338623046875, -0.511260986328125, -0.4771881103515625, -0.443115234375, -0.4090423583984375, -0.374969482421875, -0.3408966064453125, -0.30682373046875, -0.2727508544921875, -0.238677978515625, -0.2046051025390625, -0.1705322265625, -0.1364593505859375, -0.102386474609375, -0.0683135986328125, -0.03424072265625, -0.0001678466796875, 0.033905029296875, 0.0679779052734375, 0.10205078125, 0.1361236572265625, 0.170196533203125, 0.2042694091796875, 0.23834228515625, 0.2724151611328125, 0.306488037109375, 0.3405609130859375, 0.3746337890625, 0.4087066650390625, 0.442779541015625, 0.4768524169921875, 0.51092529296875, 0.5449981689453125, 0.579071044921875, 0.6131439208984375, 0.647216796875, 0.6812896728515625, 0.715362548828125, 0.7494354248046875, 0.78350830078125, 0.8175811767578125, 0.851654052734375, 0.8857269287109375, 0.9197998046875, 0.9538726806640625, 0.987945556640625, 1.0220184326171875, 1.05609130859375, 1.0901641845703125, 1.124237060546875, 1.1583099365234375, 1.1923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 5.0, 22.0, 35.0, 27.0, 73.0, 130.0, 205.0, 423.0, 925.0, 2286.0, 6236.0, 20784.0, 93930.0, 473208.0, 362043.0, 64524.0, 15349.0, 4989.0, 1750.0, 765.0, 374.0, 187.0, 104.0, 54.0, 31.0, 31.0, 16.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.97503662109375, -0.9412841796875, -0.90753173828125, -0.873779296875, -0.84002685546875, -0.8062744140625, -0.77252197265625, -0.73876953125, -0.70501708984375, -0.6712646484375, -0.63751220703125, -0.603759765625, -0.57000732421875, -0.5362548828125, -0.50250244140625, -0.46875, -0.43499755859375, -0.4012451171875, -0.36749267578125, -0.333740234375, -0.29998779296875, -0.2662353515625, -0.23248291015625, -0.19873046875, -0.16497802734375, -0.1312255859375, -0.09747314453125, -0.063720703125, -0.02996826171875, 0.0037841796875, 0.03753662109375, 0.0712890625, 0.10504150390625, 0.1387939453125, 0.17254638671875, 0.206298828125, 0.24005126953125, 0.2738037109375, 0.30755615234375, 0.34130859375, 0.37506103515625, 0.4088134765625, 0.44256591796875, 0.476318359375, 0.51007080078125, 0.5438232421875, 0.57757568359375, 0.611328125, 0.64508056640625, 0.6788330078125, 0.71258544921875, 0.746337890625, 0.78009033203125, 0.8138427734375, 0.84759521484375, 0.88134765625, 0.91510009765625, 0.9488525390625, 0.98260498046875, 1.016357421875, 1.05010986328125, 1.0838623046875, 1.11761474609375, 1.1513671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 14.0, 10.0, 20.0, 18.0, 27.0, 44.0, 73.0, 70.0, 103.0, 127.0, 127.0, 89.0, 83.0, 53.0, 36.0, 27.0, 17.0, 15.0, 10.0, 11.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016808509826660156, -0.00016077235341072083, -0.0001534596085548401, -0.00014614686369895935, -0.0001388341188430786, -0.00013152137398719788, -0.00012420862913131714, -0.0001168958842754364, -0.00010958313941955566, -0.00010227039456367493, -9.495764970779419e-05, -8.764490485191345e-05, -8.033215999603271e-05, -7.301941514015198e-05, -6.570667028427124e-05, -5.83939254283905e-05, -5.1081180572509766e-05, -4.376843571662903e-05, -3.645569086074829e-05, -2.9142946004867554e-05, -2.1830201148986816e-05, -1.4517456293106079e-05, -7.204711437225342e-06, 1.0803341865539551e-07, 7.420778274536133e-06, 1.473352313041687e-05, 2.2046267986297607e-05, 2.9359012842178345e-05, 3.667175769805908e-05, 4.398450255393982e-05, 5.129724740982056e-05, 5.8609992265701294e-05, 6.592273712158203e-05, 7.323548197746277e-05, 8.05482268333435e-05, 8.786097168922424e-05, 9.517371654510498e-05, 0.00010248646140098572, 0.00010979920625686646, 0.00011711195111274719, 0.00012442469596862793, 0.00013173744082450867, 0.0001390501856803894, 0.00014636293053627014, 0.00015367567539215088, 0.00016098842024803162, 0.00016830116510391235, 0.0001756139099597931, 0.00018292665481567383, 0.00019023939967155457, 0.0001975521445274353, 0.00020486488938331604, 0.00021217763423919678, 0.00021949037909507751, 0.00022680312395095825, 0.000234115868806839, 0.00024142861366271973, 0.00024874135851860046, 0.0002560541033744812, 0.00026336684823036194, 0.0002706795930862427, 0.0002779923379421234, 0.00028530508279800415, 0.0002926178276538849, 0.0002999305725097656]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 9.0, 15.0, 12.0, 42.0, 55.0, 98.0, 152.0, 293.0, 614.0, 1493.0, 3805.0, 12170.0, 53153.0, 381581.0, 497527.0, 74301.0, 15310.0, 4731.0, 1688.0, 694.0, 356.0, 179.0, 115.0, 50.0, 28.0, 29.0, 11.0, 6.0, 5.0, 8.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1517181396484375, -1.116912841796875, -1.0821075439453125, -1.04730224609375, -1.0124969482421875, -0.977691650390625, -0.9428863525390625, -0.9080810546875, -0.8732757568359375, -0.838470458984375, -0.8036651611328125, -0.76885986328125, -0.7340545654296875, -0.699249267578125, -0.6644439697265625, -0.629638671875, -0.5948333740234375, -0.560028076171875, -0.5252227783203125, -0.49041748046875, -0.4556121826171875, -0.420806884765625, -0.3860015869140625, -0.3511962890625, -0.3163909912109375, -0.281585693359375, -0.2467803955078125, -0.21197509765625, -0.1771697998046875, -0.142364501953125, -0.1075592041015625, -0.07275390625, -0.0379486083984375, -0.003143310546875, 0.0316619873046875, 0.06646728515625, 0.1012725830078125, 0.136077880859375, 0.1708831787109375, 0.2056884765625, 0.2404937744140625, 0.275299072265625, 0.3101043701171875, 0.34490966796875, 0.3797149658203125, 0.414520263671875, 0.4493255615234375, 0.484130859375, 0.5189361572265625, 0.553741455078125, 0.5885467529296875, 0.62335205078125, 0.6581573486328125, 0.692962646484375, 0.7277679443359375, 0.7625732421875, 0.7973785400390625, 0.832183837890625, 0.8669891357421875, 0.90179443359375, 0.9365997314453125, 0.971405029296875, 1.0062103271484375, 1.041015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 10.0, 4.0, 9.0, 12.0, 17.0, 24.0, 26.0, 62.0, 76.0, 87.0, 108.0, 134.0, 124.0, 103.0, 67.0, 43.0, 31.0, 14.0, 16.0, 9.0, 9.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8366851806640625, -0.810089111328125, -0.7834930419921875, -0.75689697265625, -0.7303009033203125, -0.703704833984375, -0.6771087646484375, -0.6505126953125, -0.6239166259765625, -0.597320556640625, -0.5707244873046875, -0.54412841796875, -0.5175323486328125, -0.490936279296875, -0.4643402099609375, -0.437744140625, -0.4111480712890625, -0.384552001953125, -0.3579559326171875, -0.33135986328125, -0.3047637939453125, -0.278167724609375, -0.2515716552734375, -0.2249755859375, -0.1983795166015625, -0.171783447265625, -0.1451873779296875, -0.11859130859375, -0.0919952392578125, -0.065399169921875, -0.0388031005859375, -0.01220703125, 0.0143890380859375, 0.040985107421875, 0.0675811767578125, 0.09417724609375, 0.1207733154296875, 0.147369384765625, 0.1739654541015625, 0.2005615234375, 0.2271575927734375, 0.253753662109375, 0.2803497314453125, 0.30694580078125, 0.3335418701171875, 0.360137939453125, 0.3867340087890625, 0.413330078125, 0.4399261474609375, 0.466522216796875, 0.4931182861328125, 0.51971435546875, 0.5463104248046875, 0.572906494140625, 0.5995025634765625, 0.6260986328125, 0.6526947021484375, 0.679290771484375, 0.7058868408203125, 0.73248291015625, 0.7590789794921875, 0.785675048828125, 0.8122711181640625, 0.8388671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 18.0, 27.0, 65.0, 56.0, 77.0, 125.0, 129.0, 127.0, 104.0, 82.0, 65.0, 44.0, 23.0, 22.0, 10.0, 8.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.324390411376953, -8.015144348144531, -7.705897331237793, -7.396650791168213, -7.087404251098633, -6.778157711029053, -6.468911170959473, -6.159665107727051, -5.8504180908203125, -5.541171550750732, -5.231925010681152, -4.922678470611572, -4.613431930541992, -4.304185390472412, -3.994939088821411, -3.685692548751831, -3.37644624710083, -3.06719970703125, -2.75795316696167, -2.44870662689209, -2.1394600868225098, -1.8302136659622192, -1.5209672451019287, -1.2117207050323486, -0.9024741649627686, -0.5932276248931885, -0.2839811444282532, 0.02526533603668213, 0.3345118761062622, 0.6437584161758423, 0.9530048370361328, 1.262251377105713, 1.571497917175293, 1.880744457244873, 2.189990997314453, 2.499237537384033, 2.8084840774536133, 3.1177306175231934, 3.4269769191741943, 3.7362234592437744, 4.045470237731934, 4.354716777801514, 4.663963317871094, 4.973209857940674, 5.282456398010254, 5.591702938079834, 5.900949478149414, 6.210195541381836, 6.519442081451416, 6.828688621520996, 7.137935161590576, 7.447181701660156, 7.756428241729736, 8.065674781799316, 8.374920845031738, 8.684167861938477, 8.993413925170898, 9.30265998840332, 9.611907005310059, 9.92115306854248, 10.230400085449219, 10.53964614868164, 10.848893165588379, 11.1581392288208, 11.467386245727539]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 2.0, 11.0, 11.0, 14.0, 19.0, 17.0, 14.0, 25.0, 19.0, 21.0, 31.0, 32.0, 40.0, 39.0, 53.0, 35.0, 35.0, 43.0, 31.0, 41.0, 39.0, 41.0, 26.0, 29.0, 26.0, 28.0, 25.0, 33.0, 30.0, 21.0, 26.0, 14.0, 14.0, 11.0, 10.0, 9.0, 9.0, 6.0, 6.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.059335231781006, -4.904572010040283, -4.749809265136719, -4.595046043395996, -4.440282821655273, -4.285519599914551, -4.130756855010986, -3.9759936332702637, -3.82123064994812, -3.6664676666259766, -3.511704444885254, -3.3569414615631104, -3.202178478240967, -3.047415256500244, -2.8926522731781006, -2.737889289855957, -2.5831260681152344, -2.428363084793091, -2.273599863052368, -2.1188368797302246, -1.9640737771987915, -1.8093106746673584, -1.6545476913452148, -1.4997845888137817, -1.3450214862823486, -1.1902583837509155, -1.0354952812194824, -0.8807322978973389, -0.7259691953659058, -0.5712060928344727, -0.4164430499076843, -0.261680006980896, -0.10691690444946289, 0.04784616827964783, 0.20260924100875854, 0.35737231373786926, 0.51213538646698, 0.6668984889984131, 0.8216615319252014, 0.9764245748519897, 1.1311876773834229, 1.285950779914856, 1.440713882446289, 1.5954768657684326, 1.7502399682998657, 1.9050030708312988, 2.0597660541534424, 2.214529037475586, 2.3692922592163086, 2.524055242538452, 2.678818464279175, 2.8335814476013184, 2.988344669342041, 3.1431076526641846, 3.297870635986328, 3.452633857727051, 3.6073968410491943, 3.762159824371338, 3.9169230461120605, 4.071686267852783, 4.226449012756348, 4.38121223449707, 4.535975456237793, 4.690738201141357, 4.84550142288208]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 3.0, 7.0, 9.0, 8.0, 23.0, 32.0, 46.0, 74.0, 158.0, 276.0, 516.0, 1086.0, 2416.0, 5998.0, 16744.0, 56989.0, 315293.0, 3511877.0, 214503.0, 44924.0, 13968.0, 5047.0, 2169.0, 927.0, 524.0, 274.0, 137.0, 94.0, 58.0, 33.0, 15.0, 13.0, 14.0, 12.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9470443725585938, -0.9082489013671875, -0.8694534301757812, -0.830657958984375, -0.7918624877929688, -0.7530670166015625, -0.7142715454101562, -0.67547607421875, -0.6366806030273438, -0.5978851318359375, -0.5590896606445312, -0.520294189453125, -0.48149871826171875, -0.4427032470703125, -0.40390777587890625, -0.3651123046875, -0.32631683349609375, -0.2875213623046875, -0.24872589111328125, -0.209930419921875, -0.17113494873046875, -0.1323394775390625, -0.09354400634765625, -0.05474853515625, -0.01595306396484375, 0.0228424072265625, 0.06163787841796875, 0.100433349609375, 0.13922882080078125, 0.1780242919921875, 0.21681976318359375, 0.255615234375, 0.29441070556640625, 0.3332061767578125, 0.37200164794921875, 0.410797119140625, 0.44959259033203125, 0.4883880615234375, 0.5271835327148438, 0.56597900390625, 0.6047744750976562, 0.6435699462890625, 0.6823654174804688, 0.721160888671875, 0.7599563598632812, 0.7987518310546875, 0.8375473022460938, 0.8763427734375, 0.9151382446289062, 0.9539337158203125, 0.9927291870117188, 1.031524658203125, 1.0703201293945312, 1.1091156005859375, 1.1479110717773438, 1.18670654296875, 1.2255020141601562, 1.2642974853515625, 1.3030929565429688, 1.341888427734375, 1.3806838989257812, 1.4194793701171875, 1.4582748413085938, 1.4970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 10.0, 7.0, 8.0, 14.0, 22.0, 22.0, 34.0, 46.0, 42.0, 54.0, 65.0, 67.0, 67.0, 71.0, 89.0, 74.0, 63.0, 55.0, 45.0, 34.0, 31.0, 24.0, 18.0, 13.0, 12.0, 10.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39013671875, -0.3784217834472656, -0.36670684814453125, -0.3549919128417969, -0.3432769775390625, -0.3315620422363281, -0.31984710693359375, -0.3081321716308594, -0.296417236328125, -0.2847023010253906, -0.27298736572265625, -0.2612724304199219, -0.2495574951171875, -0.23784255981445312, -0.22612762451171875, -0.21441268920898438, -0.20269775390625, -0.19098281860351562, -0.17926788330078125, -0.16755294799804688, -0.1558380126953125, -0.14412307739257812, -0.13240814208984375, -0.12069320678710938, -0.108978271484375, -0.09726333618164062, -0.08554840087890625, -0.07383346557617188, -0.0621185302734375, -0.050403594970703125, -0.03868865966796875, -0.026973724365234375, -0.0152587890625, -0.003543853759765625, 0.00817108154296875, 0.019886016845703125, 0.0316009521484375, 0.043315887451171875, 0.05503082275390625, 0.06674575805664062, 0.078460693359375, 0.09017562866210938, 0.10189056396484375, 0.11360549926757812, 0.1253204345703125, 0.13703536987304688, 0.14875030517578125, 0.16046524047851562, 0.17218017578125, 0.18389511108398438, 0.19561004638671875, 0.20732498168945312, 0.2190399169921875, 0.23075485229492188, 0.24246978759765625, 0.2541847229003906, 0.265899658203125, 0.2776145935058594, 0.28932952880859375, 0.3010444641113281, 0.3127593994140625, 0.3244743347167969, 0.33618927001953125, 0.3479042053222656, 0.359619140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 12.0, 18.0, 25.0, 30.0, 77.0, 113.0, 196.0, 369.0, 773.0, 1527.0, 3310.0, 7469.0, 18576.0, 50107.0, 159304.0, 892943.0, 2680766.0, 259315.0, 74246.0, 26175.0, 10322.0, 4446.0, 2060.0, 1018.0, 481.0, 208.0, 152.0, 79.0, 55.0, 36.0, 21.0, 14.0, 12.0, 11.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.857421875, -0.829010009765625, -0.80059814453125, -0.772186279296875, -0.7437744140625, -0.715362548828125, -0.68695068359375, -0.658538818359375, -0.630126953125, -0.601715087890625, -0.57330322265625, -0.544891357421875, -0.5164794921875, -0.488067626953125, -0.45965576171875, -0.431243896484375, -0.40283203125, -0.374420166015625, -0.34600830078125, -0.317596435546875, -0.2891845703125, -0.260772705078125, -0.23236083984375, -0.203948974609375, -0.175537109375, -0.147125244140625, -0.11871337890625, -0.090301513671875, -0.0618896484375, -0.033477783203125, -0.00506591796875, 0.023345947265625, 0.0517578125, 0.080169677734375, 0.10858154296875, 0.136993408203125, 0.1654052734375, 0.193817138671875, 0.22222900390625, 0.250640869140625, 0.279052734375, 0.307464599609375, 0.33587646484375, 0.364288330078125, 0.3927001953125, 0.421112060546875, 0.44952392578125, 0.477935791015625, 0.50634765625, 0.534759521484375, 0.56317138671875, 0.591583251953125, 0.6199951171875, 0.648406982421875, 0.67681884765625, 0.705230712890625, 0.733642578125, 0.762054443359375, 0.79046630859375, 0.818878173828125, 0.8472900390625, 0.875701904296875, 0.90411376953125, 0.932525634765625, 0.9609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 7.0, 12.0, 16.0, 27.0, 30.0, 29.0, 69.0, 68.0, 97.0, 171.0, 262.0, 580.0, 1406.0, 521.0, 235.0, 158.0, 113.0, 63.0, 42.0, 41.0, 21.0, 26.0, 19.0, 17.0, 9.0, 7.0, 3.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3662300109863281, -0.35379791259765625, -0.3413658142089844, -0.3289337158203125, -0.3165016174316406, -0.30406951904296875, -0.2916374206542969, -0.279205322265625, -0.2667732238769531, -0.25434112548828125, -0.24190902709960938, -0.2294769287109375, -0.21704483032226562, -0.20461273193359375, -0.19218063354492188, -0.17974853515625, -0.16731643676757812, -0.15488433837890625, -0.14245223999023438, -0.1300201416015625, -0.11758804321289062, -0.10515594482421875, -0.09272384643554688, -0.080291748046875, -0.06785964965820312, -0.05542755126953125, -0.042995452880859375, -0.0305633544921875, -0.018131256103515625, -0.00569915771484375, 0.006732940673828125, 0.0191650390625, 0.031597137451171875, 0.04402923583984375, 0.056461334228515625, 0.0688934326171875, 0.08132553100585938, 0.09375762939453125, 0.10618972778320312, 0.118621826171875, 0.13105392456054688, 0.14348602294921875, 0.15591812133789062, 0.1683502197265625, 0.18078231811523438, 0.19321441650390625, 0.20564651489257812, 0.21807861328125, 0.23051071166992188, 0.24294281005859375, 0.2553749084472656, 0.2678070068359375, 0.2802391052246094, 0.29267120361328125, 0.3051033020019531, 0.317535400390625, 0.3299674987792969, 0.34239959716796875, 0.3548316955566406, 0.3672637939453125, 0.3796958923339844, 0.39212799072265625, 0.4045600891113281, 0.4169921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 14.0, 16.0, 25.0, 30.0, 42.0, 62.0, 60.0, 83.0, 92.0, 98.0, 103.0, 88.0, 68.0, 73.0, 47.0, 29.0, 17.0, 14.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4498510360717773, -2.374814510345459, -2.2997779846191406, -2.2247414588928223, -2.149704933166504, -2.0746684074401855, -1.9996318817138672, -1.9245953559875488, -1.8495588302612305, -1.774522304534912, -1.6994857788085938, -1.6244492530822754, -1.549412727355957, -1.4743762016296387, -1.3993396759033203, -1.324303150177002, -1.2492666244506836, -1.1742300987243652, -1.0991935729980469, -1.0241570472717285, -0.9491205215454102, -0.8740839958190918, -0.7990474700927734, -0.7240109443664551, -0.6489744186401367, -0.5739378929138184, -0.4989013671875, -0.42386484146118164, -0.3488283157348633, -0.2737917900085449, -0.19875526428222656, -0.1237187385559082, -0.048682451248168945, 0.026354074478149414, 0.10139060020446777, 0.17642712593078613, 0.2514636516571045, 0.32650017738342285, 0.4015367031097412, 0.47657322883605957, 0.5516097545623779, 0.6266462802886963, 0.7016828060150146, 0.776719331741333, 0.8517558574676514, 0.9267923831939697, 1.001828908920288, 1.0768654346466064, 1.1519019603729248, 1.2269384860992432, 1.3019750118255615, 1.3770115375518799, 1.4520480632781982, 1.5270845890045166, 1.602121114730835, 1.6771576404571533, 1.7521941661834717, 1.82723069190979, 1.9022672176361084, 1.9773037433624268, 2.052340269088745, 2.1273767948150635, 2.202413320541382, 2.2774498462677, 2.3524863719940186]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 13.0, 5.0, 7.0, 12.0, 10.0, 16.0, 13.0, 19.0, 18.0, 27.0, 33.0, 24.0, 36.0, 32.0, 30.0, 40.0, 45.0, 39.0, 52.0, 46.0, 45.0, 45.0, 50.0, 35.0, 29.0, 27.0, 34.0, 22.0, 19.0, 29.0, 23.0, 18.0, 23.0, 18.0, 19.0, 6.0, 9.0, 6.0, 4.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3644435405731201, -1.3231252431869507, -1.2818069458007812, -1.2404887676239014, -1.199170470237732, -1.1578521728515625, -1.116533875465393, -1.0752155780792236, -1.0338973999023438, -0.9925791025161743, -0.9512608647346497, -0.9099425673484802, -0.8686243295669556, -0.8273060321807861, -0.7859877347946167, -0.7446694374084473, -0.7033511400222778, -0.6620328426361084, -0.6207146048545837, -0.5793963074684143, -0.5380780696868896, -0.4967597723007202, -0.4554414749145508, -0.41412320733070374, -0.3728049397468567, -0.33148667216300964, -0.2901684045791626, -0.24885010719299316, -0.20753183960914612, -0.16621357202529907, -0.12489528954029083, -0.08357700705528259, -0.042258620262145996, -0.0009403452277183533, 0.04037792980670929, 0.08169620484113693, 0.12301447987556458, 0.16433274745941162, 0.20565102994441986, 0.2469693124294281, 0.28828758001327515, 0.3296058475971222, 0.37092411518096924, 0.41224241256713867, 0.4535606801509857, 0.49487894773483276, 0.5361972451210022, 0.5775154829025269, 0.6188337802886963, 0.6601520776748657, 0.7014703154563904, 0.7427886128425598, 0.7841068506240845, 0.8254251480102539, 0.8667434453964233, 0.9080617427825928, 0.9493799805641174, 0.9906982779502869, 1.0320165157318115, 1.073334813117981, 1.1146531105041504, 1.1559712886810303, 1.1972895860671997, 1.2386078834533691, 1.2799261808395386]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 7.0, 7.0, 13.0, 20.0, 23.0, 30.0, 61.0, 92.0, 124.0, 214.0, 356.0, 557.0, 1096.0, 2158.0, 4201.0, 8716.0, 18418.0, 40188.0, 91917.0, 209367.0, 325266.0, 191761.0, 83820.0, 36816.0, 16735.0, 8271.0, 3788.0, 2058.0, 1001.0, 589.0, 345.0, 204.0, 108.0, 63.0, 44.0, 38.0, 26.0, 22.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.12420654296875, -1.0872802734375, -1.05035400390625, -1.013427734375, -0.97650146484375, -0.9395751953125, -0.90264892578125, -0.86572265625, -0.82879638671875, -0.7918701171875, -0.75494384765625, -0.718017578125, -0.68109130859375, -0.6441650390625, -0.60723876953125, -0.5703125, -0.53338623046875, -0.4964599609375, -0.45953369140625, -0.422607421875, -0.38568115234375, -0.3487548828125, -0.31182861328125, -0.27490234375, -0.23797607421875, -0.2010498046875, -0.16412353515625, -0.127197265625, -0.09027099609375, -0.0533447265625, -0.01641845703125, 0.0205078125, 0.05743408203125, 0.0943603515625, 0.13128662109375, 0.168212890625, 0.20513916015625, 0.2420654296875, 0.27899169921875, 0.31591796875, 0.35284423828125, 0.3897705078125, 0.42669677734375, 0.463623046875, 0.50054931640625, 0.5374755859375, 0.57440185546875, 0.611328125, 0.64825439453125, 0.6851806640625, 0.72210693359375, 0.759033203125, 0.79595947265625, 0.8328857421875, 0.86981201171875, 0.90673828125, 0.94366455078125, 0.9805908203125, 1.01751708984375, 1.054443359375, 1.09136962890625, 1.1282958984375, 1.16522216796875, 1.2021484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 10.0, 19.0, 22.0, 31.0, 50.0, 37.0, 62.0, 63.0, 71.0, 71.0, 74.0, 86.0, 66.0, 69.0, 48.0, 53.0, 34.0, 43.0, 23.0, 15.0, 16.0, 4.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4079780578613281, -0.39579010009765625, -0.3836021423339844, -0.3714141845703125, -0.3592262268066406, -0.34703826904296875, -0.3348503112792969, -0.322662353515625, -0.3104743957519531, -0.29828643798828125, -0.2860984802246094, -0.2739105224609375, -0.2617225646972656, -0.24953460693359375, -0.23734664916992188, -0.22515869140625, -0.21297073364257812, -0.20078277587890625, -0.18859481811523438, -0.1764068603515625, -0.16421890258789062, -0.15203094482421875, -0.13984298706054688, -0.127655029296875, -0.11546707153320312, -0.10327911376953125, -0.09109115600585938, -0.0789031982421875, -0.06671524047851562, -0.05452728271484375, -0.042339324951171875, -0.0301513671875, -0.017963409423828125, -0.00577545166015625, 0.006412506103515625, 0.0186004638671875, 0.030788421630859375, 0.04297637939453125, 0.055164337158203125, 0.067352294921875, 0.07954025268554688, 0.09172821044921875, 0.10391616821289062, 0.1161041259765625, 0.12829208374023438, 0.14048004150390625, 0.15266799926757812, 0.16485595703125, 0.17704391479492188, 0.18923187255859375, 0.20141983032226562, 0.2136077880859375, 0.22579574584960938, 0.23798370361328125, 0.2501716613769531, 0.262359619140625, 0.2745475769042969, 0.28673553466796875, 0.2989234924316406, 0.3111114501953125, 0.3232994079589844, 0.33548736572265625, 0.3476753234863281, 0.35986328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 15.0, 17.0, 32.0, 21.0, 35.0, 58.0, 77.0, 117.0, 173.0, 224.0, 368.0, 617.0, 1223.0, 3453.0, 13886.0, 76766.0, 397048.0, 442812.0, 88678.0, 15834.0, 3844.0, 1310.0, 650.0, 398.0, 273.0, 171.0, 129.0, 106.0, 67.0, 38.0, 31.0, 15.0, 16.0, 20.0, 8.0, 3.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.07574462890625, -2.0147705078125, -1.95379638671875, -1.892822265625, -1.83184814453125, -1.7708740234375, -1.70989990234375, -1.64892578125, -1.58795166015625, -1.5269775390625, -1.46600341796875, -1.405029296875, -1.34405517578125, -1.2830810546875, -1.22210693359375, -1.1611328125, -1.10015869140625, -1.0391845703125, -0.97821044921875, -0.917236328125, -0.85626220703125, -0.7952880859375, -0.73431396484375, -0.67333984375, -0.61236572265625, -0.5513916015625, -0.49041748046875, -0.429443359375, -0.36846923828125, -0.3074951171875, -0.24652099609375, -0.185546875, -0.12457275390625, -0.0635986328125, -0.00262451171875, 0.058349609375, 0.11932373046875, 0.1802978515625, 0.24127197265625, 0.30224609375, 0.36322021484375, 0.4241943359375, 0.48516845703125, 0.546142578125, 0.60711669921875, 0.6680908203125, 0.72906494140625, 0.7900390625, 0.85101318359375, 0.9119873046875, 0.97296142578125, 1.033935546875, 1.09490966796875, 1.1558837890625, 1.21685791015625, 1.27783203125, 1.33880615234375, 1.3997802734375, 1.46075439453125, 1.521728515625, 1.58270263671875, 1.6436767578125, 1.70465087890625, 1.765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 9.0, 9.0, 19.0, 7.0, 15.0, 17.0, 23.0, 29.0, 31.0, 28.0, 37.0, 44.0, 31.0, 44.0, 50.0, 44.0, 49.0, 49.0, 54.0, 47.0, 36.0, 42.0, 33.0, 31.0, 28.0, 24.0, 27.0, 20.0, 21.0, 16.0, 14.0, 17.0, 13.0, 6.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.2421875, -1.20428466796875, -1.1663818359375, -1.12847900390625, -1.090576171875, -1.05267333984375, -1.0147705078125, -0.97686767578125, -0.93896484375, -0.90106201171875, -0.8631591796875, -0.82525634765625, -0.787353515625, -0.74945068359375, -0.7115478515625, -0.67364501953125, -0.6357421875, -0.59783935546875, -0.5599365234375, -0.52203369140625, -0.484130859375, -0.44622802734375, -0.4083251953125, -0.37042236328125, -0.33251953125, -0.29461669921875, -0.2567138671875, -0.21881103515625, -0.180908203125, -0.14300537109375, -0.1051025390625, -0.06719970703125, -0.029296875, 0.00860595703125, 0.0465087890625, 0.08441162109375, 0.122314453125, 0.16021728515625, 0.1981201171875, 0.23602294921875, 0.27392578125, 0.31182861328125, 0.3497314453125, 0.38763427734375, 0.425537109375, 0.46343994140625, 0.5013427734375, 0.53924560546875, 0.5771484375, 0.61505126953125, 0.6529541015625, 0.69085693359375, 0.728759765625, 0.76666259765625, 0.8045654296875, 0.84246826171875, 0.88037109375, 0.91827392578125, 0.9561767578125, 0.99407958984375, 1.031982421875, 1.06988525390625, 1.1077880859375, 1.14569091796875, 1.18359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 13.0, 21.0, 35.0, 56.0, 92.0, 143.0, 242.0, 431.0, 832.0, 1758.0, 4427.0, 18077.0, 482936.0, 512293.0, 18921.0, 4583.0, 1774.0, 877.0, 403.0, 247.0, 153.0, 87.0, 52.0, 18.0, 21.0, 16.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.6451416015625, -2.553955078125, -2.4627685546875, -2.37158203125, -2.2803955078125, -2.189208984375, -2.0980224609375, -2.0068359375, -1.9156494140625, -1.824462890625, -1.7332763671875, -1.64208984375, -1.5509033203125, -1.459716796875, -1.3685302734375, -1.27734375, -1.1861572265625, -1.094970703125, -1.0037841796875, -0.91259765625, -0.8214111328125, -0.730224609375, -0.6390380859375, -0.5478515625, -0.4566650390625, -0.365478515625, -0.2742919921875, -0.18310546875, -0.0919189453125, -0.000732421875, 0.0904541015625, 0.181640625, 0.2728271484375, 0.364013671875, 0.4552001953125, 0.54638671875, 0.6375732421875, 0.728759765625, 0.8199462890625, 0.9111328125, 1.0023193359375, 1.093505859375, 1.1846923828125, 1.27587890625, 1.3670654296875, 1.458251953125, 1.5494384765625, 1.640625, 1.7318115234375, 1.822998046875, 1.9141845703125, 2.00537109375, 2.0965576171875, 2.187744140625, 2.2789306640625, 2.3701171875, 2.4613037109375, 2.552490234375, 2.6436767578125, 2.73486328125, 2.8260498046875, 2.917236328125, 3.0084228515625, 3.099609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 10.0, 27.0, 40.0, 68.0, 111.0, 156.0, 177.0, 128.0, 99.0, 58.0, 29.0, 28.0, 15.0, 9.0, 6.0, 10.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004487037658691406, -0.00043727457523345947, -0.0004258453845977783, -0.00041441619396209717, -0.000402987003326416, -0.00039155781269073486, -0.0003801286220550537, -0.00036869943141937256, -0.0003572702407836914, -0.00034584105014801025, -0.0003344118595123291, -0.00032298266887664795, -0.0003115534782409668, -0.00030012428760528564, -0.0002886950969696045, -0.00027726590633392334, -0.0002658367156982422, -0.00025440752506256104, -0.00024297833442687988, -0.00023154914379119873, -0.00022011995315551758, -0.00020869076251983643, -0.00019726157188415527, -0.00018583238124847412, -0.00017440319061279297, -0.00016297399997711182, -0.00015154480934143066, -0.0001401156187057495, -0.00012868642807006836, -0.00011725723743438721, -0.00010582804679870605, -9.43988561630249e-05, -8.296966552734375e-05, -7.15404748916626e-05, -6.0111284255981445e-05, -4.868209362030029e-05, -3.725290298461914e-05, -2.5823712348937988e-05, -1.4394521713256836e-05, -2.9653310775756836e-06, 8.463859558105469e-06, 1.989305019378662e-05, 3.1322240829467773e-05, 4.2751431465148926e-05, 5.418062210083008e-05, 6.560981273651123e-05, 7.703900337219238e-05, 8.846819400787354e-05, 9.989738464355469e-05, 0.00011132657527923584, 0.000122755765914917, 0.00013418495655059814, 0.0001456141471862793, 0.00015704333782196045, 0.0001684725284576416, 0.00017990171909332275, 0.0001913309097290039, 0.00020276010036468506, 0.0002141892910003662, 0.00022561848163604736, 0.00023704767227172852, 0.00024847686290740967, 0.0002599060535430908, 0.00027133524417877197, 0.0002827644348144531]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 10.0, 14.0, 20.0, 35.0, 47.0, 89.0, 157.0, 291.0, 640.0, 1532.0, 4580.0, 21287.0, 842596.0, 162510.0, 9732.0, 2885.0, 1111.0, 466.0, 209.0, 117.0, 75.0, 40.0, 27.0, 19.0, 10.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.23858642578125, -3.1334228515625, -3.02825927734375, -2.923095703125, -2.81793212890625, -2.7127685546875, -2.60760498046875, -2.50244140625, -2.39727783203125, -2.2921142578125, -2.18695068359375, -2.081787109375, -1.97662353515625, -1.8714599609375, -1.76629638671875, -1.6611328125, -1.55596923828125, -1.4508056640625, -1.34564208984375, -1.240478515625, -1.13531494140625, -1.0301513671875, -0.92498779296875, -0.81982421875, -0.71466064453125, -0.6094970703125, -0.50433349609375, -0.399169921875, -0.29400634765625, -0.1888427734375, -0.08367919921875, 0.021484375, 0.12664794921875, 0.2318115234375, 0.33697509765625, 0.442138671875, 0.54730224609375, 0.6524658203125, 0.75762939453125, 0.86279296875, 0.96795654296875, 1.0731201171875, 1.17828369140625, 1.283447265625, 1.38861083984375, 1.4937744140625, 1.59893798828125, 1.7041015625, 1.80926513671875, 1.9144287109375, 2.01959228515625, 2.124755859375, 2.22991943359375, 2.3350830078125, 2.44024658203125, 2.54541015625, 2.65057373046875, 2.7557373046875, 2.86090087890625, 2.966064453125, 3.07122802734375, 3.1763916015625, 3.28155517578125, 3.38671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 15.0, 19.0, 34.0, 64.0, 151.0, 294.0, 219.0, 98.0, 42.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7978515625, -1.7308502197265625, -1.663848876953125, -1.5968475341796875, -1.52984619140625, -1.4628448486328125, -1.395843505859375, -1.3288421630859375, -1.2618408203125, -1.1948394775390625, -1.127838134765625, -1.0608367919921875, -0.99383544921875, -0.9268341064453125, -0.859832763671875, -0.7928314208984375, -0.725830078125, -0.6588287353515625, -0.591827392578125, -0.5248260498046875, -0.45782470703125, -0.3908233642578125, -0.323822021484375, -0.2568206787109375, -0.1898193359375, -0.1228179931640625, -0.055816650390625, 0.0111846923828125, 0.07818603515625, 0.1451873779296875, 0.212188720703125, 0.2791900634765625, 0.34619140625, 0.4131927490234375, 0.480194091796875, 0.5471954345703125, 0.61419677734375, 0.6811981201171875, 0.748199462890625, 0.8152008056640625, 0.8822021484375, 0.9492034912109375, 1.016204833984375, 1.0832061767578125, 1.15020751953125, 1.2172088623046875, 1.284210205078125, 1.3512115478515625, 1.418212890625, 1.4852142333984375, 1.552215576171875, 1.6192169189453125, 1.68621826171875, 1.7532196044921875, 1.820220947265625, 1.8872222900390625, 1.9542236328125, 2.0212249755859375, 2.088226318359375, 2.1552276611328125, 2.22222900390625, 2.2892303466796875, 2.356231689453125, 2.4232330322265625, 2.490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 12.0, 32.0, 126.0, 277.0, 294.0, 175.0, 63.0, 22.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.672521591186523, -10.712645530700684, -9.752769470214844, -8.79289436340332, -7.8330183029174805, -6.873142242431641, -5.913266658782959, -4.953391075134277, -3.9935150146484375, -3.0336391925811768, -2.073763370513916, -1.1138875484466553, -0.15401172637939453, 0.8058643341064453, 1.765739917755127, 2.7256155014038086, 3.6854915618896484, 4.645367622375488, 5.60524320602417, 6.565118789672852, 7.524994850158691, 8.484870910644531, 9.444746017456055, 10.404622077941895, 11.364498138427734, 12.324374198913574, 13.284250259399414, 14.244125366210938, 15.204001426696777, 16.163877487182617, 17.12375259399414, 18.083629608154297, 19.043502807617188, 20.00337791442871, 20.963254928588867, 21.92313003540039, 22.883007049560547, 23.84288215637207, 24.802757263183594, 25.76263427734375, 26.722509384155273, 27.682384490966797, 28.642261505126953, 29.602136611938477, 30.56201171875, 31.521888732910156, 32.48176574707031, 33.4416389465332, 34.40151596069336, 35.361392974853516, 36.321266174316406, 37.28114318847656, 38.24102020263672, 39.200897216796875, 40.160770416259766, 41.12064743041992, 42.08052062988281, 43.04039764404297, 44.00027084350586, 44.960147857666016, 45.92002487182617, 46.87989807128906, 47.83977508544922, 48.799652099609375, 49.75952911376953]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 7.0, 7.0, 14.0, 5.0, 9.0, 14.0, 9.0, 18.0, 30.0, 19.0, 19.0, 26.0, 28.0, 29.0, 32.0, 34.0, 30.0, 44.0, 46.0, 41.0, 55.0, 39.0, 36.0, 32.0, 37.0, 29.0, 42.0, 34.0, 22.0, 18.0, 29.0, 19.0, 22.0, 18.0, 19.0, 17.0, 10.0, 16.0, 5.0, 4.0, 8.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-6.79135274887085, -6.589838981628418, -6.3883256912231445, -6.186811923980713, -5.985298156738281, -5.783784866333008, -5.582271099090576, -5.3807573318481445, -5.179244041442871, -4.9777302742004395, -4.776216983795166, -4.574703216552734, -4.373189449310303, -4.171675682067871, -3.9701623916625977, -3.768648624420166, -3.5671348571777344, -3.365621328353882, -3.16410756111145, -2.9625940322875977, -2.761080265045166, -2.5595667362213135, -2.358053207397461, -2.1565394401550293, -1.9550259113311768, -1.7535122632980347, -1.5519986152648926, -1.35048508644104, -1.148971438407898, -0.9474577903747559, -0.7459442615509033, -0.5444306135177612, -0.34291744232177734, -0.14140382409095764, 0.06010979413986206, 0.2616233825683594, 0.46313703060150146, 0.6646506786346436, 0.8661642074584961, 1.0676778554916382, 1.2691915035247803, 1.4707051515579224, 1.6722187995910645, 1.873732328414917, 2.0752458572387695, 2.276759624481201, 2.4782731533050537, 2.6797866821289062, 2.881300449371338, 3.0828139781951904, 3.284327745437622, 3.4858412742614746, 3.6873550415039062, 3.888868570327759, 4.090382099151611, 4.291895866394043, 4.493409156799316, 4.694922924041748, 4.8964362144470215, 5.097949981689453, 5.299463748931885, 5.500977516174316, 5.70249080657959, 5.9040045738220215, 6.105518341064453]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 3.0, 10.0, 5.0, 14.0, 26.0, 32.0, 71.0, 100.0, 147.0, 246.0, 477.0, 1005.0, 2201.0, 5469.0, 14679.0, 46922.0, 227562.0, 3466818.0, 340122.0, 59454.0, 17431.0, 6459.0, 2537.0, 1111.0, 553.0, 316.0, 182.0, 129.0, 75.0, 47.0, 24.0, 14.0, 17.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.362152099609375, -1.31903076171875, -1.275909423828125, -1.2327880859375, -1.189666748046875, -1.14654541015625, -1.103424072265625, -1.060302734375, -1.017181396484375, -0.97406005859375, -0.930938720703125, -0.8878173828125, -0.844696044921875, -0.80157470703125, -0.758453369140625, -0.71533203125, -0.672210693359375, -0.62908935546875, -0.585968017578125, -0.5428466796875, -0.499725341796875, -0.45660400390625, -0.413482666015625, -0.370361328125, -0.327239990234375, -0.28411865234375, -0.240997314453125, -0.1978759765625, -0.154754638671875, -0.11163330078125, -0.068511962890625, -0.025390625, 0.017730712890625, 0.06085205078125, 0.103973388671875, 0.1470947265625, 0.190216064453125, 0.23333740234375, 0.276458740234375, 0.319580078125, 0.362701416015625, 0.40582275390625, 0.448944091796875, 0.4920654296875, 0.535186767578125, 0.57830810546875, 0.621429443359375, 0.66455078125, 0.707672119140625, 0.75079345703125, 0.793914794921875, 0.8370361328125, 0.880157470703125, 0.92327880859375, 0.966400146484375, 1.009521484375, 1.052642822265625, 1.09576416015625, 1.138885498046875, 1.1820068359375, 1.225128173828125, 1.26824951171875, 1.311370849609375, 1.3544921875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 12.0, 12.0, 18.0, 22.0, 28.0, 35.0, 43.0, 55.0, 44.0, 56.0, 66.0, 53.0, 70.0, 64.0, 70.0, 67.0, 44.0, 51.0, 34.0, 29.0, 32.0, 19.0, 19.0, 11.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.409423828125, -0.3974647521972656, -0.38550567626953125, -0.3735466003417969, -0.3615875244140625, -0.3496284484863281, -0.33766937255859375, -0.3257102966308594, -0.313751220703125, -0.3017921447753906, -0.28983306884765625, -0.2778739929199219, -0.2659149169921875, -0.2539558410644531, -0.24199676513671875, -0.23003768920898438, -0.21807861328125, -0.20611953735351562, -0.19416046142578125, -0.18220138549804688, -0.1702423095703125, -0.15828323364257812, -0.14632415771484375, -0.13436508178710938, -0.122406005859375, -0.11044692993164062, -0.09848785400390625, -0.08652877807617188, -0.0745697021484375, -0.06261062622070312, -0.05065155029296875, -0.038692474365234375, -0.0267333984375, -0.014774322509765625, -0.00281524658203125, 0.009143829345703125, 0.0211029052734375, 0.033061981201171875, 0.04502105712890625, 0.056980133056640625, 0.068939208984375, 0.08089828491210938, 0.09285736083984375, 0.10481643676757812, 0.1167755126953125, 0.12873458862304688, 0.14069366455078125, 0.15265274047851562, 0.16461181640625, 0.17657089233398438, 0.18852996826171875, 0.20048904418945312, 0.2124481201171875, 0.22440719604492188, 0.23636627197265625, 0.24832534790039062, 0.260284423828125, 0.2722434997558594, 0.28420257568359375, 0.2961616516113281, 0.3081207275390625, 0.3200798034667969, 0.33203887939453125, 0.3439979553222656, 0.35595703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 6.0, 3.0, 9.0, 6.0, 15.0, 27.0, 27.0, 64.0, 118.0, 146.0, 237.0, 347.0, 637.0, 1164.0, 1984.0, 3851.0, 7989.0, 17536.0, 42512.0, 119679.0, 457261.0, 2796205.0, 531670.0, 131289.0, 46145.0, 18210.0, 8217.0, 3883.0, 2113.0, 1194.0, 679.0, 393.0, 236.0, 148.0, 97.0, 65.0, 41.0, 19.0, 12.0, 13.0, 16.0, 13.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.013671875, -0.9866714477539062, -0.9596710205078125, -0.9326705932617188, -0.905670166015625, -0.8786697387695312, -0.8516693115234375, -0.8246688842773438, -0.79766845703125, -0.7706680297851562, -0.7436676025390625, -0.7166671752929688, -0.689666748046875, -0.6626663208007812, -0.6356658935546875, -0.6086654663085938, -0.5816650390625, -0.5546646118164062, -0.5276641845703125, -0.5006637573242188, -0.473663330078125, -0.44666290283203125, -0.4196624755859375, -0.39266204833984375, -0.36566162109375, -0.33866119384765625, -0.3116607666015625, -0.28466033935546875, -0.257659912109375, -0.23065948486328125, -0.2036590576171875, -0.17665863037109375, -0.149658203125, -0.12265777587890625, -0.0956573486328125, -0.06865692138671875, -0.041656494140625, -0.01465606689453125, 0.0123443603515625, 0.03934478759765625, 0.06634521484375, 0.09334564208984375, 0.1203460693359375, 0.14734649658203125, 0.174346923828125, 0.20134735107421875, 0.2283477783203125, 0.25534820556640625, 0.2823486328125, 0.30934906005859375, 0.3363494873046875, 0.36334991455078125, 0.390350341796875, 0.41735076904296875, 0.4443511962890625, 0.47135162353515625, 0.49835205078125, 0.5253524780273438, 0.5523529052734375, 0.5793533325195312, 0.606353759765625, 0.6333541870117188, 0.6603546142578125, 0.6873550415039062, 0.71435546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 9.0, 10.0, 15.0, 14.0, 29.0, 35.0, 47.0, 85.0, 103.0, 128.0, 241.0, 440.0, 1115.0, 846.0, 323.0, 194.0, 116.0, 81.0, 64.0, 54.0, 30.0, 22.0, 15.0, 12.0, 8.0, 2.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5226783752441406, -0.5067825317382812, -0.4908866882324219, -0.4749908447265625, -0.4590950012207031, -0.44319915771484375, -0.4273033142089844, -0.411407470703125, -0.3955116271972656, -0.37961578369140625, -0.3637199401855469, -0.3478240966796875, -0.3319282531738281, -0.31603240966796875, -0.3001365661621094, -0.28424072265625, -0.2683448791503906, -0.25244903564453125, -0.23655319213867188, -0.2206573486328125, -0.20476150512695312, -0.18886566162109375, -0.17296981811523438, -0.157073974609375, -0.14117813110351562, -0.12528228759765625, -0.10938644409179688, -0.0934906005859375, -0.07759475708007812, -0.06169891357421875, -0.045803070068359375, -0.0299072265625, -0.014011383056640625, 0.00188446044921875, 0.017780303955078125, 0.0336761474609375, 0.049571990966796875, 0.06546783447265625, 0.08136367797851562, 0.097259521484375, 0.11315536499023438, 0.12905120849609375, 0.14494705200195312, 0.1608428955078125, 0.17673873901367188, 0.19263458251953125, 0.20853042602539062, 0.22442626953125, 0.24032211303710938, 0.25621795654296875, 0.2721138000488281, 0.2880096435546875, 0.3039054870605469, 0.31980133056640625, 0.3356971740722656, 0.351593017578125, 0.3674888610839844, 0.38338470458984375, 0.3992805480957031, 0.4151763916015625, 0.4310722351074219, 0.44696807861328125, 0.4628639221191406, 0.478759765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 12.0, 47.0, 156.0, 243.0, 255.0, 181.0, 83.0, 19.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.820655822753906, -14.526803016662598, -14.232950210571289, -13.93909740447998, -13.645244598388672, -13.351391792297363, -13.057538986206055, -12.763686180114746, -12.469833374023438, -12.175980567932129, -11.88212776184082, -11.588274955749512, -11.294422149658203, -11.000569343566895, -10.706716537475586, -10.412863731384277, -10.119010925292969, -9.82515811920166, -9.531305313110352, -9.237452507019043, -8.943599700927734, -8.649746894836426, -8.355894088745117, -8.062041282653809, -7.7681884765625, -7.474335670471191, -7.180482864379883, -6.886630058288574, -6.592777252197266, -6.298924446105957, -6.005071640014648, -5.71121883392334, -5.417365074157715, -5.123512268066406, -4.829659461975098, -4.535806655883789, -4.2419538497924805, -3.948101043701172, -3.6542482376098633, -3.3603954315185547, -3.066542625427246, -2.7726898193359375, -2.478837013244629, -2.1849842071533203, -1.8911314010620117, -1.5972785949707031, -1.3034257888793945, -1.009572982788086, -0.7157201766967773, -0.42186737060546875, -0.12801456451416016, 0.16583824157714844, 0.45969104766845703, 0.7535438537597656, 1.0473966598510742, 1.3412494659423828, 1.6351022720336914, 1.928955078125, 2.2228078842163086, 2.516660690307617, 2.810513496398926, 3.1043663024902344, 3.398219108581543, 3.6920719146728516, 3.98592472076416]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 14.0, 5.0, 8.0, 9.0, 19.0, 15.0, 20.0, 21.0, 24.0, 26.0, 35.0, 27.0, 39.0, 45.0, 32.0, 38.0, 37.0, 43.0, 53.0, 46.0, 47.0, 47.0, 23.0, 40.0, 40.0, 30.0, 30.0, 29.0, 20.0, 17.0, 24.0, 15.0, 20.0, 14.0, 9.0, 9.0, 6.0, 11.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.092529535293579, -2.0316882133483887, -1.9708471298217773, -1.9100059270858765, -1.8491647243499756, -1.7883235216140747, -1.7274823188781738, -1.6666409969329834, -1.605799913406372, -1.5449587106704712, -1.4841175079345703, -1.4232763051986694, -1.3624351024627686, -1.3015938997268677, -1.2407526969909668, -1.1799113750457764, -1.1190701723098755, -1.0582289695739746, -0.9973877668380737, -0.9365465641021729, -0.875705361366272, -0.8148641586303711, -0.7540228962898254, -0.6931816935539246, -0.6323404908180237, -0.5714992880821228, -0.5106580853462219, -0.44981685280799866, -0.3889756500720978, -0.3281344473361969, -0.26729321479797363, -0.20645201206207275, -0.14561092853546143, -0.08476971834897995, -0.023928508162498474, 0.0369127094745636, 0.09775391221046448, 0.15859511494636536, 0.21943634748458862, 0.2802775502204895, 0.3411187529563904, 0.40195995569229126, 0.46280115842819214, 0.5236424207687378, 0.5844836235046387, 0.6453248262405396, 0.7061660289764404, 0.7670072317123413, 0.8278484344482422, 0.8886896371841431, 0.949530839920044, 1.0103720426559448, 1.0712132453918457, 1.1320544481277466, 1.1928956508636475, 1.253736972808838, 1.3145780563354492, 1.37541925907135, 1.436260461807251, 1.4971016645431519, 1.5579428672790527, 1.6187840700149536, 1.6796252727508545, 1.740466594696045, 1.8013077974319458]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 12.0, 13.0, 26.0, 34.0, 56.0, 98.0, 139.0, 257.0, 428.0, 827.0, 1517.0, 3171.0, 6606.0, 14770.0, 35278.0, 96595.0, 444745.0, 317777.0, 74395.0, 28385.0, 12191.0, 5553.0, 2650.0, 1307.0, 754.0, 394.0, 209.0, 121.0, 69.0, 59.0, 39.0, 19.0, 14.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.372406005859375, -1.32489013671875, -1.277374267578125, -1.2298583984375, -1.182342529296875, -1.13482666015625, -1.087310791015625, -1.039794921875, -0.992279052734375, -0.94476318359375, -0.897247314453125, -0.8497314453125, -0.802215576171875, -0.75469970703125, -0.707183837890625, -0.65966796875, -0.612152099609375, -0.56463623046875, -0.517120361328125, -0.4696044921875, -0.422088623046875, -0.37457275390625, -0.327056884765625, -0.279541015625, -0.232025146484375, -0.18450927734375, -0.136993408203125, -0.0894775390625, -0.041961669921875, 0.00555419921875, 0.053070068359375, 0.1005859375, 0.148101806640625, 0.19561767578125, 0.243133544921875, 0.2906494140625, 0.338165283203125, 0.38568115234375, 0.433197021484375, 0.480712890625, 0.528228759765625, 0.57574462890625, 0.623260498046875, 0.6707763671875, 0.718292236328125, 0.76580810546875, 0.813323974609375, 0.86083984375, 0.908355712890625, 0.95587158203125, 1.003387451171875, 1.0509033203125, 1.098419189453125, 1.14593505859375, 1.193450927734375, 1.240966796875, 1.288482666015625, 1.33599853515625, 1.383514404296875, 1.4310302734375, 1.478546142578125, 1.52606201171875, 1.573577880859375, 1.62109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 13.0, 15.0, 17.0, 27.0, 33.0, 39.0, 50.0, 44.0, 60.0, 60.0, 63.0, 55.0, 65.0, 76.0, 77.0, 60.0, 54.0, 39.0, 43.0, 24.0, 23.0, 19.0, 12.0, 8.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46044921875, -0.4475860595703125, -0.434722900390625, -0.4218597412109375, -0.40899658203125, -0.3961334228515625, -0.383270263671875, -0.3704071044921875, -0.3575439453125, -0.3446807861328125, -0.331817626953125, -0.3189544677734375, -0.30609130859375, -0.2932281494140625, -0.280364990234375, -0.2675018310546875, -0.254638671875, -0.2417755126953125, -0.228912353515625, -0.2160491943359375, -0.20318603515625, -0.1903228759765625, -0.177459716796875, -0.1645965576171875, -0.1517333984375, -0.1388702392578125, -0.126007080078125, -0.1131439208984375, -0.10028076171875, -0.0874176025390625, -0.074554443359375, -0.0616912841796875, -0.048828125, -0.0359649658203125, -0.023101806640625, -0.0102386474609375, 0.00262451171875, 0.0154876708984375, 0.028350830078125, 0.0412139892578125, 0.0540771484375, 0.0669403076171875, 0.079803466796875, 0.0926666259765625, 0.10552978515625, 0.1183929443359375, 0.131256103515625, 0.1441192626953125, 0.156982421875, 0.1698455810546875, 0.182708740234375, 0.1955718994140625, 0.20843505859375, 0.2212982177734375, 0.234161376953125, 0.2470245361328125, 0.2598876953125, 0.2727508544921875, 0.285614013671875, 0.2984771728515625, 0.31134033203125, 0.3242034912109375, 0.337066650390625, 0.3499298095703125, 0.36279296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 4.0, 4.0, 15.0, 12.0, 19.0, 30.0, 28.0, 51.0, 59.0, 83.0, 95.0, 158.0, 205.0, 308.0, 446.0, 693.0, 1294.0, 2940.0, 8385.0, 27760.0, 110392.0, 635274.0, 197587.0, 42405.0, 12120.0, 4105.0, 1636.0, 816.0, 469.0, 323.0, 203.0, 168.0, 105.0, 71.0, 58.0, 56.0, 41.0, 35.0, 25.0, 12.0, 16.0, 11.0, 4.0, 4.0, 4.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6806182861328125, -1.621978759765625, -1.5633392333984375, -1.50469970703125, -1.4460601806640625, -1.387420654296875, -1.3287811279296875, -1.2701416015625, -1.2115020751953125, -1.152862548828125, -1.0942230224609375, -1.03558349609375, -0.9769439697265625, -0.918304443359375, -0.8596649169921875, -0.801025390625, -0.7423858642578125, -0.683746337890625, -0.6251068115234375, -0.56646728515625, -0.5078277587890625, -0.449188232421875, -0.3905487060546875, -0.3319091796875, -0.2732696533203125, -0.214630126953125, -0.1559906005859375, -0.09735107421875, -0.0387115478515625, 0.019927978515625, 0.0785675048828125, 0.13720703125, 0.1958465576171875, 0.254486083984375, 0.3131256103515625, 0.37176513671875, 0.4304046630859375, 0.489044189453125, 0.5476837158203125, 0.6063232421875, 0.6649627685546875, 0.723602294921875, 0.7822418212890625, 0.84088134765625, 0.8995208740234375, 0.958160400390625, 1.0167999267578125, 1.075439453125, 1.1340789794921875, 1.192718505859375, 1.2513580322265625, 1.30999755859375, 1.3686370849609375, 1.427276611328125, 1.4859161376953125, 1.5445556640625, 1.6031951904296875, 1.661834716796875, 1.7204742431640625, 1.77911376953125, 1.8377532958984375, 1.896392822265625, 1.9550323486328125, 2.013671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 10.0, 11.0, 28.0, 25.0, 23.0, 27.0, 39.0, 45.0, 32.0, 62.0, 57.0, 54.0, 57.0, 51.0, 57.0, 61.0, 57.0, 43.0, 50.0, 29.0, 27.0, 40.0, 18.0, 21.0, 11.0, 9.0, 7.0, 14.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.704010009765625, -1.65118408203125, -1.598358154296875, -1.5455322265625, -1.492706298828125, -1.43988037109375, -1.387054443359375, -1.334228515625, -1.281402587890625, -1.22857666015625, -1.175750732421875, -1.1229248046875, -1.070098876953125, -1.01727294921875, -0.964447021484375, -0.91162109375, -0.858795166015625, -0.80596923828125, -0.753143310546875, -0.7003173828125, -0.647491455078125, -0.59466552734375, -0.541839599609375, -0.489013671875, -0.436187744140625, -0.38336181640625, -0.330535888671875, -0.2777099609375, -0.224884033203125, -0.17205810546875, -0.119232177734375, -0.06640625, -0.013580322265625, 0.03924560546875, 0.092071533203125, 0.1448974609375, 0.197723388671875, 0.25054931640625, 0.303375244140625, 0.356201171875, 0.409027099609375, 0.46185302734375, 0.514678955078125, 0.5675048828125, 0.620330810546875, 0.67315673828125, 0.725982666015625, 0.77880859375, 0.831634521484375, 0.88446044921875, 0.937286376953125, 0.9901123046875, 1.042938232421875, 1.09576416015625, 1.148590087890625, 1.201416015625, 1.254241943359375, 1.30706787109375, 1.359893798828125, 1.4127197265625, 1.465545654296875, 1.51837158203125, 1.571197509765625, 1.6240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 15.0, 27.0, 35.0, 43.0, 72.0, 98.0, 186.0, 382.0, 840.0, 2029.0, 5551.0, 18430.0, 79011.0, 715881.0, 181053.0, 31135.0, 8615.0, 2914.0, 1084.0, 485.0, 256.0, 146.0, 92.0, 56.0, 29.0, 23.0, 19.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.4112396240234375, -1.369354248046875, -1.3274688720703125, -1.28558349609375, -1.2436981201171875, -1.201812744140625, -1.1599273681640625, -1.1180419921875, -1.0761566162109375, -1.034271240234375, -0.9923858642578125, -0.95050048828125, -0.9086151123046875, -0.866729736328125, -0.8248443603515625, -0.782958984375, -0.7410736083984375, -0.699188232421875, -0.6573028564453125, -0.61541748046875, -0.5735321044921875, -0.531646728515625, -0.4897613525390625, -0.4478759765625, -0.4059906005859375, -0.364105224609375, -0.3222198486328125, -0.28033447265625, -0.2384490966796875, -0.196563720703125, -0.1546783447265625, -0.11279296875, -0.0709075927734375, -0.029022216796875, 0.0128631591796875, 0.05474853515625, 0.0966339111328125, 0.138519287109375, 0.1804046630859375, 0.2222900390625, 0.2641754150390625, 0.306060791015625, 0.3479461669921875, 0.38983154296875, 0.4317169189453125, 0.473602294921875, 0.5154876708984375, 0.557373046875, 0.5992584228515625, 0.641143798828125, 0.6830291748046875, 0.72491455078125, 0.7667999267578125, 0.808685302734375, 0.8505706787109375, 0.8924560546875, 0.9343414306640625, 0.976226806640625, 1.0181121826171875, 1.05999755859375, 1.1018829345703125, 1.143768310546875, 1.1856536865234375, 1.2275390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 12.0, 21.0, 31.0, 57.0, 125.0, 233.0, 207.0, 97.0, 47.0, 32.0, 25.0, 15.0, 13.0, 9.0, 8.0, 11.0, 5.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003001689910888672, -0.0002904273569583893, -0.0002806857228279114, -0.00027094408869743347, -0.00026120245456695557, -0.00025146082043647766, -0.00024171918630599976, -0.00023197755217552185, -0.00022223591804504395, -0.00021249428391456604, -0.00020275264978408813, -0.00019301101565361023, -0.00018326938152313232, -0.00017352774739265442, -0.00016378611326217651, -0.0001540444791316986, -0.0001443028450012207, -0.0001345612108707428, -0.0001248195767402649, -0.00011507794260978699, -0.00010533630847930908, -9.559467434883118e-05, -8.585304021835327e-05, -7.611140608787537e-05, -6.636977195739746e-05, -5.6628137826919556e-05, -4.688650369644165e-05, -3.7144869565963745e-05, -2.740323543548584e-05, -1.7661601305007935e-05, -7.91996717453003e-06, 1.821666955947876e-06, 1.1563301086425781e-05, 2.1304935216903687e-05, 3.104656934738159e-05, 4.07882034778595e-05, 5.05298376083374e-05, 6.027147173881531e-05, 7.001310586929321e-05, 7.975473999977112e-05, 8.949637413024902e-05, 9.923800826072693e-05, 0.00010897964239120483, 0.00011872127652168274, 0.00012846291065216064, 0.00013820454478263855, 0.00014794617891311646, 0.00015768781304359436, 0.00016742944717407227, 0.00017717108130455017, 0.00018691271543502808, 0.00019665434956550598, 0.0002063959836959839, 0.0002161376178264618, 0.0002258792519569397, 0.0002356208860874176, 0.0002453625202178955, 0.0002551041543483734, 0.0002648457884788513, 0.0002745874226093292, 0.00028432905673980713, 0.00029407069087028503, 0.00030381232500076294, 0.00031355395913124084, 0.00032329559326171875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 14.0, 12.0, 16.0, 21.0, 26.0, 33.0, 43.0, 62.0, 108.0, 167.0, 243.0, 429.0, 927.0, 1973.0, 4974.0, 14891.0, 59297.0, 734772.0, 187072.0, 28598.0, 8622.0, 3202.0, 1349.0, 690.0, 333.0, 208.0, 120.0, 102.0, 59.0, 43.0, 41.0, 28.0, 16.0, 15.0, 8.0, 7.0, 4.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.599609375, -1.5535888671875, -1.507568359375, -1.4615478515625, -1.41552734375, -1.3695068359375, -1.323486328125, -1.2774658203125, -1.2314453125, -1.1854248046875, -1.139404296875, -1.0933837890625, -1.04736328125, -1.0013427734375, -0.955322265625, -0.9093017578125, -0.86328125, -0.8172607421875, -0.771240234375, -0.7252197265625, -0.67919921875, -0.6331787109375, -0.587158203125, -0.5411376953125, -0.4951171875, -0.4490966796875, -0.403076171875, -0.3570556640625, -0.31103515625, -0.2650146484375, -0.218994140625, -0.1729736328125, -0.126953125, -0.0809326171875, -0.034912109375, 0.0111083984375, 0.05712890625, 0.1031494140625, 0.149169921875, 0.1951904296875, 0.2412109375, 0.2872314453125, 0.333251953125, 0.3792724609375, 0.42529296875, 0.4713134765625, 0.517333984375, 0.5633544921875, 0.609375, 0.6553955078125, 0.701416015625, 0.7474365234375, 0.79345703125, 0.8394775390625, 0.885498046875, 0.9315185546875, 0.9775390625, 1.0235595703125, 1.069580078125, 1.1156005859375, 1.16162109375, 1.2076416015625, 1.253662109375, 1.2996826171875, 1.345703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 4.0, 6.0, 3.0, 9.0, 9.0, 10.0, 14.0, 22.0, 30.0, 44.0, 94.0, 143.0, 203.0, 156.0, 77.0, 46.0, 28.0, 20.0, 21.0, 7.0, 5.0, 10.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.0643768310546875, -1.028167724609375, -0.9919586181640625, -0.95574951171875, -0.9195404052734375, -0.883331298828125, -0.8471221923828125, -0.8109130859375, -0.7747039794921875, -0.738494873046875, -0.7022857666015625, -0.66607666015625, -0.6298675537109375, -0.593658447265625, -0.5574493408203125, -0.521240234375, -0.4850311279296875, -0.448822021484375, -0.4126129150390625, -0.37640380859375, -0.3401947021484375, -0.303985595703125, -0.2677764892578125, -0.2315673828125, -0.1953582763671875, -0.159149169921875, -0.1229400634765625, -0.08673095703125, -0.0505218505859375, -0.014312744140625, 0.0218963623046875, 0.05810546875, 0.0943145751953125, 0.130523681640625, 0.1667327880859375, 0.20294189453125, 0.2391510009765625, 0.275360107421875, 0.3115692138671875, 0.3477783203125, 0.3839874267578125, 0.420196533203125, 0.4564056396484375, 0.49261474609375, 0.5288238525390625, 0.565032958984375, 0.6012420654296875, 0.637451171875, 0.6736602783203125, 0.709869384765625, 0.7460784912109375, 0.78228759765625, 0.8184967041015625, 0.854705810546875, 0.8909149169921875, 0.9271240234375, 0.9633331298828125, 0.999542236328125, 1.0357513427734375, 1.07196044921875, 1.1081695556640625, 1.144378662109375, 1.1805877685546875, 1.216796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 20.0, 33.0, 66.0, 124.0, 166.0, 184.0, 173.0, 103.0, 69.0, 25.0, 13.0, 9.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.543813705444336, -21.04570770263672, -20.5476016998291, -20.049495697021484, -19.5513916015625, -19.053285598754883, -18.555179595947266, -18.05707359313965, -17.55896759033203, -17.060861587524414, -16.562755584716797, -16.064651489257812, -15.566544532775879, -15.068439483642578, -14.570333480834961, -14.072227478027344, -13.574122428894043, -13.076016426086426, -12.577911376953125, -12.079805374145508, -11.58169937133789, -11.083593368530273, -10.585488319396973, -10.087382316589355, -9.589277267456055, -9.091171264648438, -8.593066215515137, -8.09496021270752, -7.596854209899902, -7.098748683929443, -6.600643157958984, -6.102537155151367, -5.60443115234375, -5.106325626373291, -4.608219623565674, -4.110114097595215, -3.6120083332061768, -3.1139025688171387, -2.6157970428466797, -2.1176912784576416, -1.6195855140686035, -1.1214797496795654, -0.6233741044998169, -0.12526845932006836, 0.3728373050689697, 0.8709430694580078, 1.3690485954284668, 1.8671543598175049, 2.365260124206543, 2.863365888595581, 3.361471652984619, 3.859577178955078, 4.357683181762695, 4.855788707733154, 5.353894233703613, 5.8520002365112305, 6.3501057624816895, 6.848211288452148, 7.346317291259766, 7.844422817230225, 8.342528343200684, 8.8406343460083, 9.338739395141602, 9.836845397949219, 10.334951400756836]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 14.0, 14.0, 14.0, 19.0, 32.0, 22.0, 28.0, 22.0, 33.0, 43.0, 40.0, 37.0, 43.0, 43.0, 48.0, 36.0, 48.0, 41.0, 45.0, 40.0, 44.0, 37.0, 27.0, 32.0, 28.0, 24.0, 14.0, 28.0, 11.0, 10.0, 9.0, 9.0, 9.0, 7.0, 6.0, 5.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.527933120727539, -7.322896480560303, -7.117860317230225, -6.912823677062988, -6.70778751373291, -6.502750873565674, -6.2977142333984375, -6.092678070068359, -5.887641429901123, -5.682604789733887, -5.477568626403809, -5.272531986236572, -5.067495346069336, -4.862459182739258, -4.6574225425720215, -4.452385902404785, -4.247349739074707, -4.042313098907471, -3.8372769355773926, -3.6322402954101562, -3.427203893661499, -3.222167491912842, -3.0171308517456055, -2.8120944499969482, -2.607058048248291, -2.402021646499634, -2.1969852447509766, -1.9919486045837402, -1.786912202835083, -1.5818758010864258, -1.376839280128479, -1.1718027591705322, -0.966766357421875, -0.761729896068573, -0.556693434715271, -0.351656973361969, -0.146620512008667, 0.058415889739990234, 0.263452410697937, 0.4684889316558838, 0.673525333404541, 0.878561794757843, 1.083598256111145, 1.2886347770690918, 1.493671178817749, 1.6987075805664062, 1.903744101524353, 2.1087806224823, 2.313817024230957, 2.5188534259796143, 2.7238898277282715, 2.928926467895508, 3.133962869644165, 3.3389992713928223, 3.5440359115600586, 3.749072313308716, 3.954108715057373, 4.159145355224609, 4.3641815185546875, 4.569218158721924, 4.77425479888916, 4.979290962219238, 5.184327602386475, 5.389364242553711, 5.594400405883789]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 15.0, 13.0, 47.0, 96.0, 201.0, 488.0, 1273.0, 3573.0, 12315.0, 57025.0, 1141640.0, 2892339.0, 66154.0, 13223.0, 3715.0, 1271.0, 489.0, 218.0, 81.0, 46.0, 20.0, 13.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.40594482421875, -2.3372802734375, -2.26861572265625, -2.199951171875, -2.13128662109375, -2.0626220703125, -1.99395751953125, -1.92529296875, -1.85662841796875, -1.7879638671875, -1.71929931640625, -1.650634765625, -1.58197021484375, -1.5133056640625, -1.44464111328125, -1.3759765625, -1.30731201171875, -1.2386474609375, -1.16998291015625, -1.101318359375, -1.03265380859375, -0.9639892578125, -0.89532470703125, -0.82666015625, -0.75799560546875, -0.6893310546875, -0.62066650390625, -0.552001953125, -0.48333740234375, -0.4146728515625, -0.34600830078125, -0.27734375, -0.20867919921875, -0.1400146484375, -0.07135009765625, -0.002685546875, 0.06597900390625, 0.1346435546875, 0.20330810546875, 0.27197265625, 0.34063720703125, 0.4093017578125, 0.47796630859375, 0.546630859375, 0.61529541015625, 0.6839599609375, 0.75262451171875, 0.8212890625, 0.88995361328125, 0.9586181640625, 1.02728271484375, 1.095947265625, 1.16461181640625, 1.2332763671875, 1.30194091796875, 1.37060546875, 1.43927001953125, 1.5079345703125, 1.57659912109375, 1.645263671875, 1.71392822265625, 1.7825927734375, 1.85125732421875, 1.919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 9.0, 11.0, 9.0, 10.0, 12.0, 14.0, 26.0, 27.0, 26.0, 37.0, 40.0, 45.0, 56.0, 64.0, 73.0, 56.0, 72.0, 68.0, 51.0, 54.0, 70.0, 43.0, 24.0, 29.0, 15.0, 18.0, 18.0, 8.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4408988952636719, -0.42769622802734375, -0.4144935607910156, -0.4012908935546875, -0.3880882263183594, -0.37488555908203125, -0.3616828918457031, -0.348480224609375, -0.3352775573730469, -0.32207489013671875, -0.3088722229003906, -0.2956695556640625, -0.2824668884277344, -0.26926422119140625, -0.2560615539550781, -0.24285888671875, -0.22965621948242188, -0.21645355224609375, -0.20325088500976562, -0.1900482177734375, -0.17684555053710938, -0.16364288330078125, -0.15044021606445312, -0.137237548828125, -0.12403488159179688, -0.11083221435546875, -0.09762954711914062, -0.0844268798828125, -0.07122421264648438, -0.05802154541015625, -0.044818878173828125, -0.0316162109375, -0.018413543701171875, -0.00521087646484375, 0.007991790771484375, 0.0211944580078125, 0.034397125244140625, 0.04759979248046875, 0.060802459716796875, 0.074005126953125, 0.08720779418945312, 0.10041046142578125, 0.11361312866210938, 0.1268157958984375, 0.14001846313476562, 0.15322113037109375, 0.16642379760742188, 0.17962646484375, 0.19282913208007812, 0.20603179931640625, 0.21923446655273438, 0.2324371337890625, 0.24563980102539062, 0.25884246826171875, 0.2720451354980469, 0.285247802734375, 0.2984504699707031, 0.31165313720703125, 0.3248558044433594, 0.3380584716796875, 0.3512611389160156, 0.36446380615234375, 0.3776664733886719, 0.390869140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 9.0, 5.0, 17.0, 18.0, 25.0, 49.0, 61.0, 121.0, 188.0, 285.0, 489.0, 898.0, 1633.0, 3085.0, 6387.0, 14074.0, 35264.0, 111072.0, 626908.0, 3025797.0, 259365.0, 65611.0, 23283.0, 9799.0, 4622.0, 2281.0, 1213.0, 636.0, 391.0, 240.0, 161.0, 87.0, 79.0, 46.0, 32.0, 22.0, 11.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2275390625, -1.1927490234375, -1.157958984375, -1.1231689453125, -1.08837890625, -1.0535888671875, -1.018798828125, -0.9840087890625, -0.94921875, -0.9144287109375, -0.879638671875, -0.8448486328125, -0.81005859375, -0.7752685546875, -0.740478515625, -0.7056884765625, -0.6708984375, -0.6361083984375, -0.601318359375, -0.5665283203125, -0.53173828125, -0.4969482421875, -0.462158203125, -0.4273681640625, -0.392578125, -0.3577880859375, -0.322998046875, -0.2882080078125, -0.25341796875, -0.2186279296875, -0.183837890625, -0.1490478515625, -0.1142578125, -0.0794677734375, -0.044677734375, -0.0098876953125, 0.02490234375, 0.0596923828125, 0.094482421875, 0.1292724609375, 0.1640625, 0.1988525390625, 0.233642578125, 0.2684326171875, 0.30322265625, 0.3380126953125, 0.372802734375, 0.4075927734375, 0.4423828125, 0.4771728515625, 0.511962890625, 0.5467529296875, 0.58154296875, 0.6163330078125, 0.651123046875, 0.6859130859375, 0.720703125, 0.7554931640625, 0.790283203125, 0.8250732421875, 0.85986328125, 0.8946533203125, 0.929443359375, 0.9642333984375, 0.9990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 10.0, 7.0, 12.0, 23.0, 28.0, 33.0, 49.0, 72.0, 96.0, 185.0, 370.0, 1096.0, 1165.0, 351.0, 182.0, 115.0, 78.0, 51.0, 32.0, 30.0, 22.0, 15.0, 5.0, 12.0, 2.0, 1.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5250930786132812, -0.5086822509765625, -0.49227142333984375, -0.475860595703125, -0.45944976806640625, -0.4430389404296875, -0.42662811279296875, -0.41021728515625, -0.39380645751953125, -0.3773956298828125, -0.36098480224609375, -0.344573974609375, -0.32816314697265625, -0.3117523193359375, -0.29534149169921875, -0.2789306640625, -0.26251983642578125, -0.2461090087890625, -0.22969818115234375, -0.213287353515625, -0.19687652587890625, -0.1804656982421875, -0.16405487060546875, -0.14764404296875, -0.13123321533203125, -0.1148223876953125, -0.09841156005859375, -0.082000732421875, -0.06558990478515625, -0.0491790771484375, -0.03276824951171875, -0.016357421875, 5.340576171875e-05, 0.0164642333984375, 0.03287506103515625, 0.049285888671875, 0.06569671630859375, 0.0821075439453125, 0.09851837158203125, 0.11492919921875, 0.13134002685546875, 0.1477508544921875, 0.16416168212890625, 0.180572509765625, 0.19698333740234375, 0.2133941650390625, 0.22980499267578125, 0.2462158203125, 0.26262664794921875, 0.2790374755859375, 0.29544830322265625, 0.311859130859375, 0.32826995849609375, 0.3446807861328125, 0.36109161376953125, 0.37750244140625, 0.39391326904296875, 0.4103240966796875, 0.42673492431640625, 0.443145751953125, 0.45955657958984375, 0.4759674072265625, 0.49237823486328125, 0.5087890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 15.0, 26.0, 48.0, 97.0, 127.0, 169.0, 162.0, 167.0, 86.0, 57.0, 23.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.354272842407227, -6.191716194152832, -6.029159069061279, -5.866602420806885, -5.704045295715332, -5.5414886474609375, -5.378931999206543, -5.216375350952148, -5.053818225860596, -4.891261577606201, -4.728704452514648, -4.566147804260254, -4.403591156005859, -4.241034030914307, -4.078477382659912, -3.9159204959869385, -3.753363609313965, -3.590806722640991, -3.4282498359680176, -3.265693187713623, -3.1031363010406494, -2.940579414367676, -2.7780227661132812, -2.6154658794403076, -2.452908992767334, -2.2903521060943604, -2.1277952194213867, -1.9652385711669922, -1.8026816844940186, -1.640124797821045, -1.4775680303573608, -1.3150112628936768, -1.1524543762207031, -0.9898975491523743, -0.8273407220840454, -0.6647838950157166, -0.5022270679473877, -0.33967024087905884, -0.17711341381072998, -0.014556646347045898, 0.14800024032592773, 0.3105570673942566, 0.47311389446258545, 0.6356707215309143, 0.7982275485992432, 0.960784375667572, 1.1233412027359009, 1.285897970199585, 1.4484548568725586, 1.6110117435455322, 1.7735685110092163, 1.9361252784729004, 2.098682165145874, 2.2612390518188477, 2.423795700073242, 2.586352586746216, 2.7489094734191895, 2.911466360092163, 3.0740232467651367, 3.2365798950195312, 3.399136781692505, 3.5616936683654785, 3.724250316619873, 3.8868072032928467, 4.04936408996582]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 10.0, 12.0, 14.0, 17.0, 23.0, 19.0, 33.0, 25.0, 38.0, 36.0, 49.0, 41.0, 59.0, 51.0, 45.0, 54.0, 51.0, 53.0, 45.0, 44.0, 32.0, 35.0, 33.0, 32.0, 24.0, 18.0, 31.0, 15.0, 12.0, 11.0, 7.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13521671295166, -2.0713541507720947, -2.00749135017395, -1.9436287879943848, -1.8797661066055298, -1.8159034252166748, -1.7520408630371094, -1.6881781816482544, -1.6243155002593994, -1.5604528188705444, -1.4965901374816895, -1.432727575302124, -1.368864893913269, -1.305002212524414, -1.2411396503448486, -1.1772769689559937, -1.1134142875671387, -1.0495516061782837, -0.9856889843940735, -0.9218263626098633, -0.8579636812210083, -0.7941009998321533, -0.7302383780479431, -0.6663757562637329, -0.6025130748748779, -0.538650393486023, -0.47478777170181274, -0.41092512011528015, -0.34706246852874756, -0.28319981694221497, -0.21933716535568237, -0.15547451376914978, -0.09161186218261719, -0.027749210596084595, 0.036113440990448, 0.09997609257698059, 0.16383874416351318, 0.22770139575004578, 0.29156404733657837, 0.35542669892311096, 0.41928935050964355, 0.48315200209617615, 0.5470146536827087, 0.610877275466919, 0.6747399568557739, 0.7386026382446289, 0.8024652600288391, 0.8663278818130493, 0.9301905632019043, 0.9940532445907593, 1.0579159259796143, 1.1217784881591797, 1.1856411695480347, 1.2495038509368896, 1.313366413116455, 1.37722909450531, 1.441091775894165, 1.50495445728302, 1.568817138671875, 1.6326797008514404, 1.6965423822402954, 1.7604050636291504, 1.8242676258087158, 1.8881303071975708, 1.9519929885864258]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 10.0, 10.0, 14.0, 22.0, 44.0, 52.0, 84.0, 127.0, 249.0, 416.0, 908.0, 1891.0, 4366.0, 10730.0, 28220.0, 84275.0, 369976.0, 404376.0, 92468.0, 29843.0, 11755.0, 4770.0, 1965.0, 918.0, 465.0, 243.0, 123.0, 74.0, 51.0, 37.0, 18.0, 10.0, 8.0, 9.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4453125, -1.4028472900390625, -1.360382080078125, -1.3179168701171875, -1.27545166015625, -1.2329864501953125, -1.190521240234375, -1.1480560302734375, -1.1055908203125, -1.0631256103515625, -1.020660400390625, -0.9781951904296875, -0.93572998046875, -0.8932647705078125, -0.850799560546875, -0.8083343505859375, -0.765869140625, -0.7234039306640625, -0.680938720703125, -0.6384735107421875, -0.59600830078125, -0.5535430908203125, -0.511077880859375, -0.4686126708984375, -0.4261474609375, -0.3836822509765625, -0.341217041015625, -0.2987518310546875, -0.25628662109375, -0.2138214111328125, -0.171356201171875, -0.1288909912109375, -0.08642578125, -0.0439605712890625, -0.001495361328125, 0.0409698486328125, 0.08343505859375, 0.1259002685546875, 0.168365478515625, 0.2108306884765625, 0.2532958984375, 0.2957611083984375, 0.338226318359375, 0.3806915283203125, 0.42315673828125, 0.4656219482421875, 0.508087158203125, 0.5505523681640625, 0.593017578125, 0.6354827880859375, 0.677947998046875, 0.7204132080078125, 0.76287841796875, 0.8053436279296875, 0.847808837890625, 0.8902740478515625, 0.9327392578125, 0.9752044677734375, 1.017669677734375, 1.0601348876953125, 1.10260009765625, 1.1450653076171875, 1.187530517578125, 1.2299957275390625, 1.2724609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 13.0, 9.0, 14.0, 14.0, 20.0, 26.0, 29.0, 38.0, 36.0, 49.0, 50.0, 62.0, 48.0, 56.0, 60.0, 53.0, 63.0, 63.0, 53.0, 45.0, 55.0, 31.0, 26.0, 21.0, 13.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4296875, -0.4169807434082031, -0.40427398681640625, -0.3915672302246094, -0.3788604736328125, -0.3661537170410156, -0.35344696044921875, -0.3407402038574219, -0.328033447265625, -0.3153266906738281, -0.30261993408203125, -0.2899131774902344, -0.2772064208984375, -0.2644996643066406, -0.25179290771484375, -0.23908615112304688, -0.22637939453125, -0.21367263793945312, -0.20096588134765625, -0.18825912475585938, -0.1755523681640625, -0.16284561157226562, -0.15013885498046875, -0.13743209838867188, -0.124725341796875, -0.11201858520507812, -0.09931182861328125, -0.08660507202148438, -0.0738983154296875, -0.061191558837890625, -0.04848480224609375, -0.035778045654296875, -0.0230712890625, -0.010364532470703125, 0.00234222412109375, 0.015048980712890625, 0.0277557373046875, 0.040462493896484375, 0.05316925048828125, 0.06587600708007812, 0.078582763671875, 0.09128952026367188, 0.10399627685546875, 0.11670303344726562, 0.1294097900390625, 0.14211654663085938, 0.15482330322265625, 0.16753005981445312, 0.18023681640625, 0.19294357299804688, 0.20565032958984375, 0.21835708618164062, 0.2310638427734375, 0.24377059936523438, 0.25647735595703125, 0.2691841125488281, 0.281890869140625, 0.2945976257324219, 0.30730438232421875, 0.3200111389160156, 0.3327178955078125, 0.3454246520996094, 0.35813140869140625, 0.3708381652832031, 0.383544921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 10.0, 8.0, 15.0, 18.0, 29.0, 26.0, 49.0, 75.0, 146.0, 205.0, 369.0, 703.0, 1710.0, 4500.0, 11882.0, 35192.0, 129111.0, 614057.0, 182773.0, 43539.0, 14674.0, 5349.0, 2076.0, 918.0, 433.0, 260.0, 146.0, 92.0, 59.0, 31.0, 28.0, 23.0, 16.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.4430694580078125, -1.395904541015625, -1.3487396240234375, -1.30157470703125, -1.2544097900390625, -1.207244873046875, -1.1600799560546875, -1.1129150390625, -1.0657501220703125, -1.018585205078125, -0.9714202880859375, -0.92425537109375, -0.8770904541015625, -0.829925537109375, -0.7827606201171875, -0.735595703125, -0.6884307861328125, -0.641265869140625, -0.5941009521484375, -0.54693603515625, -0.4997711181640625, -0.452606201171875, -0.4054412841796875, -0.3582763671875, -0.3111114501953125, -0.263946533203125, -0.2167816162109375, -0.16961669921875, -0.1224517822265625, -0.075286865234375, -0.0281219482421875, 0.01904296875, 0.0662078857421875, 0.113372802734375, 0.1605377197265625, 0.20770263671875, 0.2548675537109375, 0.302032470703125, 0.3491973876953125, 0.3963623046875, 0.4435272216796875, 0.490692138671875, 0.5378570556640625, 0.58502197265625, 0.6321868896484375, 0.679351806640625, 0.7265167236328125, 0.773681640625, 0.8208465576171875, 0.868011474609375, 0.9151763916015625, 0.96234130859375, 1.0095062255859375, 1.056671142578125, 1.1038360595703125, 1.1510009765625, 1.1981658935546875, 1.245330810546875, 1.2924957275390625, 1.33966064453125, 1.3868255615234375, 1.433990478515625, 1.4811553955078125, 1.5283203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 14.0, 10.0, 14.0, 16.0, 17.0, 29.0, 29.0, 34.0, 32.0, 38.0, 44.0, 49.0, 54.0, 45.0, 56.0, 52.0, 63.0, 50.0, 50.0, 31.0, 38.0, 44.0, 37.0, 26.0, 14.0, 26.0, 13.0, 15.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4169921875, -1.368865966796875, -1.32073974609375, -1.272613525390625, -1.2244873046875, -1.176361083984375, -1.12823486328125, -1.080108642578125, -1.031982421875, -0.983856201171875, -0.93572998046875, -0.887603759765625, -0.8394775390625, -0.791351318359375, -0.74322509765625, -0.695098876953125, -0.64697265625, -0.598846435546875, -0.55072021484375, -0.502593994140625, -0.4544677734375, -0.406341552734375, -0.35821533203125, -0.310089111328125, -0.261962890625, -0.213836669921875, -0.16571044921875, -0.117584228515625, -0.0694580078125, -0.021331787109375, 0.02679443359375, 0.074920654296875, 0.123046875, 0.171173095703125, 0.21929931640625, 0.267425537109375, 0.3155517578125, 0.363677978515625, 0.41180419921875, 0.459930419921875, 0.508056640625, 0.556182861328125, 0.60430908203125, 0.652435302734375, 0.7005615234375, 0.748687744140625, 0.79681396484375, 0.844940185546875, 0.89306640625, 0.941192626953125, 0.98931884765625, 1.037445068359375, 1.0855712890625, 1.133697509765625, 1.18182373046875, 1.229949951171875, 1.278076171875, 1.326202392578125, 1.37432861328125, 1.422454833984375, 1.4705810546875, 1.518707275390625, 1.56683349609375, 1.614959716796875, 1.6630859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 11.0, 12.0, 21.0, 31.0, 40.0, 50.0, 98.0, 159.0, 276.0, 499.0, 986.0, 2035.0, 4663.0, 11299.0, 28805.0, 76492.0, 338593.0, 433286.0, 93536.0, 33933.0, 13383.0, 5411.0, 2426.0, 1131.0, 576.0, 311.0, 187.0, 107.0, 70.0, 55.0, 27.0, 21.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5955886840820312, -0.5764312744140625, -0.5572738647460938, -0.538116455078125, -0.5189590454101562, -0.4998016357421875, -0.48064422607421875, -0.46148681640625, -0.44232940673828125, -0.4231719970703125, -0.40401458740234375, -0.384857177734375, -0.36569976806640625, -0.3465423583984375, -0.32738494873046875, -0.3082275390625, -0.28907012939453125, -0.2699127197265625, -0.25075531005859375, -0.231597900390625, -0.21244049072265625, -0.1932830810546875, -0.17412567138671875, -0.15496826171875, -0.13581085205078125, -0.1166534423828125, -0.09749603271484375, -0.078338623046875, -0.05918121337890625, -0.0400238037109375, -0.02086639404296875, -0.001708984375, 0.01744842529296875, 0.0366058349609375, 0.05576324462890625, 0.074920654296875, 0.09407806396484375, 0.1132354736328125, 0.13239288330078125, 0.15155029296875, 0.17070770263671875, 0.1898651123046875, 0.20902252197265625, 0.228179931640625, 0.24733734130859375, 0.2664947509765625, 0.28565216064453125, 0.3048095703125, 0.32396697998046875, 0.3431243896484375, 0.36228179931640625, 0.381439208984375, 0.40059661865234375, 0.4197540283203125, 0.43891143798828125, 0.45806884765625, 0.47722625732421875, 0.4963836669921875, 0.5155410766601562, 0.534698486328125, 0.5538558959960938, 0.5730133056640625, 0.5921707153320312, 0.611328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 5.0, 19.0, 23.0, 19.0, 58.0, 80.0, 176.0, 198.0, 158.0, 74.0, 45.0, 25.0, 18.0, 16.0, 11.0, 10.0, 7.0, 4.0, 4.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0003178119659423828, -0.00031048431992530823, -0.00030315667390823364, -0.00029582902789115906, -0.00028850138187408447, -0.0002811737358570099, -0.0002738460898399353, -0.0002665184438228607, -0.00025919079780578613, -0.00025186315178871155, -0.00024453550577163696, -0.00023720785975456238, -0.0002298802137374878, -0.0002225525677204132, -0.00021522492170333862, -0.00020789727568626404, -0.00020056962966918945, -0.00019324198365211487, -0.00018591433763504028, -0.0001785866916179657, -0.0001712590456008911, -0.00016393139958381653, -0.00015660375356674194, -0.00014927610754966736, -0.00014194846153259277, -0.0001346208155155182, -0.0001272931694984436, -0.00011996552348136902, -0.00011263787746429443, -0.00010531023144721985, -9.798258543014526e-05, -9.065493941307068e-05, -8.33272933959961e-05, -7.599964737892151e-05, -6.867200136184692e-05, -6.134435534477234e-05, -5.4016709327697754e-05, -4.668906331062317e-05, -3.9361417293548584e-05, -3.2033771276474e-05, -2.4706125259399414e-05, -1.737847924232483e-05, -1.0050833225250244e-05, -2.723187208175659e-06, 4.604458808898926e-06, 1.193210482597351e-05, 1.9259750843048096e-05, 2.658739686012268e-05, 3.3915042877197266e-05, 4.124268889427185e-05, 4.8570334911346436e-05, 5.589798092842102e-05, 6.32256269454956e-05, 7.055327296257019e-05, 7.788091897964478e-05, 8.520856499671936e-05, 9.253621101379395e-05, 9.986385703086853e-05, 0.00010719150304794312, 0.0001145191490650177, 0.00012184679508209229, 0.00012917444109916687, 0.00013650208711624146, 0.00014382973313331604, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 11.0, 7.0, 12.0, 29.0, 31.0, 43.0, 92.0, 140.0, 228.0, 461.0, 943.0, 2054.0, 5184.0, 14995.0, 54239.0, 346883.0, 519158.0, 73733.0, 19299.0, 6216.0, 2411.0, 1129.0, 556.0, 259.0, 175.0, 89.0, 55.0, 36.0, 30.0, 13.0, 20.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6221389770507812, -0.5963287353515625, -0.5705184936523438, -0.544708251953125, -0.5188980102539062, -0.4930877685546875, -0.46727752685546875, -0.44146728515625, -0.41565704345703125, -0.3898468017578125, -0.36403656005859375, -0.338226318359375, -0.31241607666015625, -0.2866058349609375, -0.26079559326171875, -0.2349853515625, -0.20917510986328125, -0.1833648681640625, -0.15755462646484375, -0.131744384765625, -0.10593414306640625, -0.0801239013671875, -0.05431365966796875, -0.02850341796875, -0.00269317626953125, 0.0231170654296875, 0.04892730712890625, 0.074737548828125, 0.10054779052734375, 0.1263580322265625, 0.15216827392578125, 0.177978515625, 0.20378875732421875, 0.2295989990234375, 0.25540924072265625, 0.281219482421875, 0.30702972412109375, 0.3328399658203125, 0.35865020751953125, 0.38446044921875, 0.41027069091796875, 0.4360809326171875, 0.46189117431640625, 0.487701416015625, 0.5135116577148438, 0.5393218994140625, 0.5651321411132812, 0.5909423828125, 0.6167526245117188, 0.6425628662109375, 0.6683731079101562, 0.694183349609375, 0.7199935913085938, 0.7458038330078125, 0.7716140747070312, 0.79742431640625, 0.8232345581054688, 0.8490447998046875, 0.8748550415039062, 0.900665283203125, 0.9264755249023438, 0.9522857666015625, 0.9780960083007812, 1.00390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 7.0, 7.0, 13.0, 24.0, 21.0, 28.0, 51.0, 68.0, 88.0, 113.0, 125.0, 113.0, 97.0, 63.0, 43.0, 30.0, 14.0, 20.0, 15.0, 7.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.556640625, -0.5356292724609375, -0.514617919921875, -0.4936065673828125, -0.47259521484375, -0.4515838623046875, -0.430572509765625, -0.4095611572265625, -0.3885498046875, -0.3675384521484375, -0.346527099609375, -0.3255157470703125, -0.30450439453125, -0.2834930419921875, -0.262481689453125, -0.2414703369140625, -0.220458984375, -0.1994476318359375, -0.178436279296875, -0.1574249267578125, -0.13641357421875, -0.1154022216796875, -0.094390869140625, -0.0733795166015625, -0.0523681640625, -0.0313568115234375, -0.010345458984375, 0.0106658935546875, 0.03167724609375, 0.0526885986328125, 0.073699951171875, 0.0947113037109375, 0.11572265625, 0.1367340087890625, 0.157745361328125, 0.1787567138671875, 0.19976806640625, 0.2207794189453125, 0.241790771484375, 0.2628021240234375, 0.2838134765625, 0.3048248291015625, 0.325836181640625, 0.3468475341796875, 0.36785888671875, 0.3888702392578125, 0.409881591796875, 0.4308929443359375, 0.451904296875, 0.4729156494140625, 0.493927001953125, 0.5149383544921875, 0.53594970703125, 0.5569610595703125, 0.577972412109375, 0.5989837646484375, 0.6199951171875, 0.6410064697265625, 0.662017822265625, 0.6830291748046875, 0.70404052734375, 0.7250518798828125, 0.746063232421875, 0.7670745849609375, 0.7880859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 11.0, 17.0, 79.0, 220.0, 286.0, 226.0, 115.0, 41.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.3907470703125, -37.66062545776367, -36.93050765991211, -36.20038604736328, -35.47026443481445, -34.74014663696289, -34.01002502441406, -33.279903411865234, -32.549781799316406, -31.81966209411621, -31.089540481567383, -30.359420776367188, -29.62929916381836, -28.899179458618164, -28.16905975341797, -27.43893814086914, -26.708820343017578, -25.978700637817383, -25.248579025268555, -24.51845932006836, -23.78833770751953, -23.058218002319336, -22.32809829711914, -21.597976684570312, -20.867856979370117, -20.137737274169922, -19.407615661621094, -18.6774959564209, -17.947376251220703, -17.217254638671875, -16.48713493347168, -15.757014274597168, -15.026893615722656, -14.296772956848145, -13.566652297973633, -12.836532592773438, -12.106411933898926, -11.376291275024414, -10.646171569824219, -9.916050910949707, -9.185930252075195, -8.455809593200684, -7.72568941116333, -6.995569229125977, -6.265448570251465, -5.535327911376953, -4.8052077293396, -4.075087547302246, -3.3449668884277344, -2.6148464679718018, -1.8847260475158691, -1.1546056270599365, -0.4244852066040039, 0.3056352138519287, 1.0357556343078613, 1.7658758163452148, 2.4959964752197266, 3.226116895675659, 3.956237316131592, 4.686357498168945, 5.416478157043457, 6.146598815917969, 6.876718997955322, 7.606839179992676, 8.336959838867188]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 6.0, 8.0, 10.0, 5.0, 13.0, 8.0, 15.0, 22.0, 22.0, 23.0, 19.0, 23.0, 30.0, 30.0, 29.0, 36.0, 44.0, 45.0, 33.0, 42.0, 44.0, 47.0, 37.0, 39.0, 32.0, 35.0, 33.0, 37.0, 28.0, 27.0, 16.0, 23.0, 19.0, 21.0, 11.0, 20.0, 15.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.060344696044922, -4.887916564941406, -4.715488433837891, -4.543060302734375, -4.370632171630859, -4.198204040527344, -4.025775909423828, -3.8533477783203125, -3.680919647216797, -3.5084915161132812, -3.3360633850097656, -3.16363525390625, -2.9912071228027344, -2.8187789916992188, -2.646350860595703, -2.4739227294921875, -2.301494598388672, -2.1290664672851562, -1.9566383361816406, -1.784210205078125, -1.6117820739746094, -1.4393539428710938, -1.2669258117675781, -1.0944976806640625, -0.9220695495605469, -0.7496414184570312, -0.5772132873535156, -0.40478515625, -0.23235702514648438, -0.05992889404296875, 0.11249923706054688, 0.2849273681640625, 0.4573554992675781, 0.6297836303710938, 0.8022117614746094, 0.974639892578125, 1.1470680236816406, 1.3194961547851562, 1.4919242858886719, 1.6643524169921875, 1.8367805480957031, 2.0092086791992188, 2.1816368103027344, 2.35406494140625, 2.5264930725097656, 2.6989212036132812, 2.871349334716797, 3.0437774658203125, 3.216205596923828, 3.3886337280273438, 3.5610618591308594, 3.733489990234375, 3.9059181213378906, 4.078346252441406, 4.250774383544922, 4.4232025146484375, 4.595630645751953, 4.768058776855469, 4.940486907958984, 5.1129150390625, 5.285343170166016, 5.457771301269531, 5.630199432373047, 5.8026275634765625, 5.975055694580078]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 11.0, 15.0, 22.0, 35.0, 62.0, 83.0, 137.0, 226.0, 361.0, 639.0, 1129.0, 2221.0, 4752.0, 10287.0, 26569.0, 81039.0, 446291.0, 3335660.0, 200636.0, 51006.0, 18125.0, 7501.0, 3472.0, 1730.0, 925.0, 492.0, 294.0, 186.0, 133.0, 84.0, 45.0, 25.0, 17.0, 14.0, 13.0, 11.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2220916748046875, -1.175628662109375, -1.1291656494140625, -1.08270263671875, -1.0362396240234375, -0.989776611328125, -0.9433135986328125, -0.8968505859375, -0.8503875732421875, -0.803924560546875, -0.7574615478515625, -0.71099853515625, -0.6645355224609375, -0.618072509765625, -0.5716094970703125, -0.525146484375, -0.4786834716796875, -0.432220458984375, -0.3857574462890625, -0.33929443359375, -0.2928314208984375, -0.246368408203125, -0.1999053955078125, -0.1534423828125, -0.1069793701171875, -0.060516357421875, -0.0140533447265625, 0.03240966796875, 0.0788726806640625, 0.125335693359375, 0.1717987060546875, 0.21826171875, 0.2647247314453125, 0.311187744140625, 0.3576507568359375, 0.40411376953125, 0.4505767822265625, 0.497039794921875, 0.5435028076171875, 0.5899658203125, 0.6364288330078125, 0.682891845703125, 0.7293548583984375, 0.77581787109375, 0.8222808837890625, 0.868743896484375, 0.9152069091796875, 0.961669921875, 1.0081329345703125, 1.054595947265625, 1.1010589599609375, 1.14752197265625, 1.1939849853515625, 1.240447998046875, 1.2869110107421875, 1.3333740234375, 1.3798370361328125, 1.426300048828125, 1.4727630615234375, 1.51922607421875, 1.5656890869140625, 1.612152099609375, 1.6586151123046875, 1.705078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 3.0, 6.0, 7.0, 5.0, 16.0, 12.0, 17.0, 22.0, 37.0, 24.0, 26.0, 30.0, 47.0, 55.0, 62.0, 62.0, 71.0, 61.0, 62.0, 53.0, 57.0, 51.0, 32.0, 41.0, 34.0, 31.0, 22.0, 8.0, 10.0, 12.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4658203125, -0.4527626037597656, -0.43970489501953125, -0.4266471862792969, -0.4135894775390625, -0.4005317687988281, -0.38747406005859375, -0.3744163513183594, -0.361358642578125, -0.3483009338378906, -0.33524322509765625, -0.3221855163574219, -0.3091278076171875, -0.2960700988769531, -0.28301239013671875, -0.2699546813964844, -0.25689697265625, -0.24383926391601562, -0.23078155517578125, -0.21772384643554688, -0.2046661376953125, -0.19160842895507812, -0.17855072021484375, -0.16549301147460938, -0.152435302734375, -0.13937759399414062, -0.12631988525390625, -0.11326217651367188, -0.1002044677734375, -0.08714675903320312, -0.07408905029296875, -0.061031341552734375, -0.0479736328125, -0.034915924072265625, -0.02185821533203125, -0.008800506591796875, 0.0042572021484375, 0.017314910888671875, 0.03037261962890625, 0.043430328369140625, 0.056488037109375, 0.06954574584960938, 0.08260345458984375, 0.09566116333007812, 0.1087188720703125, 0.12177658081054688, 0.13483428955078125, 0.14789199829101562, 0.16094970703125, 0.17400741577148438, 0.18706512451171875, 0.20012283325195312, 0.2131805419921875, 0.22623825073242188, 0.23929595947265625, 0.2523536682128906, 0.265411376953125, 0.2784690856933594, 0.29152679443359375, 0.3045845031738281, 0.3176422119140625, 0.3306999206542969, 0.34375762939453125, 0.3568153381347656, 0.369873046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 11.0, 9.0, 20.0, 36.0, 49.0, 47.0, 94.0, 119.0, 184.0, 297.0, 506.0, 726.0, 1169.0, 2048.0, 3841.0, 7595.0, 15257.0, 35040.0, 89827.0, 306289.0, 2993406.0, 526895.0, 125003.0, 45787.0, 19981.0, 9166.0, 4690.0, 2399.0, 1433.0, 828.0, 496.0, 315.0, 225.0, 136.0, 93.0, 91.0, 38.0, 39.0, 29.0, 23.0, 21.0, 6.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.158203125, -1.121612548828125, -1.08502197265625, -1.048431396484375, -1.0118408203125, -0.975250244140625, -0.93865966796875, -0.902069091796875, -0.865478515625, -0.828887939453125, -0.79229736328125, -0.755706787109375, -0.7191162109375, -0.682525634765625, -0.64593505859375, -0.609344482421875, -0.57275390625, -0.536163330078125, -0.49957275390625, -0.462982177734375, -0.4263916015625, -0.389801025390625, -0.35321044921875, -0.316619873046875, -0.280029296875, -0.243438720703125, -0.20684814453125, -0.170257568359375, -0.1336669921875, -0.097076416015625, -0.06048583984375, -0.023895263671875, 0.0126953125, 0.049285888671875, 0.08587646484375, 0.122467041015625, 0.1590576171875, 0.195648193359375, 0.23223876953125, 0.268829345703125, 0.305419921875, 0.342010498046875, 0.37860107421875, 0.415191650390625, 0.4517822265625, 0.488372802734375, 0.52496337890625, 0.561553955078125, 0.59814453125, 0.634735107421875, 0.67132568359375, 0.707916259765625, 0.7445068359375, 0.781097412109375, 0.81768798828125, 0.854278564453125, 0.890869140625, 0.927459716796875, 0.96405029296875, 1.000640869140625, 1.0372314453125, 1.073822021484375, 1.11041259765625, 1.147003173828125, 1.18359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 9.0, 17.0, 16.0, 39.0, 39.0, 65.0, 91.0, 159.0, 317.0, 1510.0, 1043.0, 293.0, 167.0, 82.0, 64.0, 39.0, 30.0, 20.0, 14.0, 10.0, 12.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.67236328125, -0.64990234375, -0.62744140625, -0.60498046875, -0.58251953125, -0.56005859375, -0.53759765625, -0.51513671875, -0.49267578125, -0.47021484375, -0.44775390625, -0.42529296875, -0.40283203125, -0.38037109375, -0.35791015625, -0.33544921875, -0.31298828125, -0.29052734375, -0.26806640625, -0.24560546875, -0.22314453125, -0.20068359375, -0.17822265625, -0.15576171875, -0.13330078125, -0.11083984375, -0.08837890625, -0.06591796875, -0.04345703125, -0.02099609375, 0.00146484375, 0.02392578125, 0.04638671875, 0.06884765625, 0.09130859375, 0.11376953125, 0.13623046875, 0.15869140625, 0.18115234375, 0.20361328125, 0.22607421875, 0.24853515625, 0.27099609375, 0.29345703125, 0.31591796875, 0.33837890625, 0.36083984375, 0.38330078125, 0.40576171875, 0.42822265625, 0.45068359375, 0.47314453125, 0.49560546875, 0.51806640625, 0.54052734375, 0.56298828125, 0.58544921875, 0.60791015625, 0.63037109375, 0.65283203125, 0.67529296875, 0.69775390625, 0.72021484375, 0.74267578125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 10.0, 20.0, 50.0, 107.0, 140.0, 195.0, 176.0, 140.0, 83.0, 45.0, 18.0, 6.0, 9.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.638930320739746, -7.436737537384033, -7.23454475402832, -7.032351970672607, -6.8301591873168945, -6.627966403961182, -6.425773620605469, -6.223580360412598, -6.021388053894043, -5.81919527053833, -5.617002487182617, -5.414809703826904, -5.212616920471191, -5.0104241371154785, -4.808231353759766, -4.6060380935668945, -4.403845310211182, -4.201652526855469, -3.999459743499756, -3.797266960144043, -3.59507417678833, -3.392881393432617, -3.190688371658325, -2.9884955883026123, -2.7863028049468994, -2.5841100215911865, -2.3819172382354736, -2.1797242164611816, -1.9775315523147583, -1.7753387689590454, -1.573145866394043, -1.37095308303833, -1.1687607765197754, -0.9665679931640625, -0.7643751502037048, -0.5621823072433472, -0.3599895238876343, -0.1577967405319214, 0.044396162033081055, 0.24658894538879395, 0.44878172874450684, 0.6509745121002197, 0.8531673550605774, 1.055360198020935, 1.257552981376648, 1.4597457647323608, 1.6619386672973633, 1.8641314506530762, 2.066324234008789, 2.268517017364502, 2.470709800720215, 2.6729025840759277, 2.8750953674316406, 3.0772881507873535, 3.2794811725616455, 3.4816739559173584, 3.6838667392730713, 3.886059522628784, 4.088252544403076, 4.290445327758789, 4.492638111114502, 4.694830894470215, 4.897023677825928, 5.099216461181641, 5.3014092445373535]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 14.0, 11.0, 12.0, 12.0, 8.0, 12.0, 17.0, 20.0, 21.0, 21.0, 26.0, 34.0, 50.0, 29.0, 41.0, 29.0, 49.0, 43.0, 55.0, 44.0, 34.0, 34.0, 40.0, 35.0, 49.0, 32.0, 37.0, 19.0, 24.0, 23.0, 23.0, 20.0, 13.0, 13.0, 12.0, 5.0, 4.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9029884338378906, -1.8425865173339844, -1.7821846008300781, -1.7217828035354614, -1.6613808870315552, -1.600978970527649, -1.5405771732330322, -1.480175256729126, -1.4197733402252197, -1.3593714237213135, -1.2989695072174072, -1.2385677099227905, -1.1781657934188843, -1.117763876914978, -1.0573620796203613, -0.9969601631164551, -0.9365582466125488, -0.8761563301086426, -0.8157544732093811, -0.7553526163101196, -0.6949506998062134, -0.6345487833023071, -0.5741469264030457, -0.5137450695037842, -0.45334315299987793, -0.39294126629829407, -0.3325393795967102, -0.27213749289512634, -0.21173560619354248, -0.15133371949195862, -0.09093183279037476, -0.030529946088790894, 0.02987205982208252, 0.09027394652366638, 0.15067583322525024, 0.2110777199268341, 0.27147960662841797, 0.33188149333000183, 0.3922833800315857, 0.45268526673316956, 0.5130871534347534, 0.5734890699386597, 0.6338909268379211, 0.6942927837371826, 0.7546947002410889, 0.8150966167449951, 0.8754984736442566, 0.9359003305435181, 0.9963022470474243, 1.0567041635513306, 1.1171059608459473, 1.1775078773498535, 1.2379097938537598, 1.298311710357666, 1.3587136268615723, 1.419115424156189, 1.4795173406600952, 1.5399192571640015, 1.6003210544586182, 1.6607229709625244, 1.7211248874664307, 1.781526803970337, 1.8419287204742432, 1.9023305177688599, 1.9627324342727661]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 7.0, 13.0, 15.0, 25.0, 40.0, 52.0, 81.0, 141.0, 243.0, 477.0, 831.0, 1671.0, 3406.0, 7453.0, 16919.0, 37827.0, 82196.0, 177101.0, 338716.0, 207508.0, 94275.0, 43397.0, 19403.0, 8768.0, 3992.0, 1905.0, 961.0, 439.0, 241.0, 155.0, 106.0, 60.0, 49.0, 22.0, 18.0, 7.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.470703125, -1.43157958984375, -1.3924560546875, -1.35333251953125, -1.314208984375, -1.27508544921875, -1.2359619140625, -1.19683837890625, -1.15771484375, -1.11859130859375, -1.0794677734375, -1.04034423828125, -1.001220703125, -0.96209716796875, -0.9229736328125, -0.88385009765625, -0.8447265625, -0.80560302734375, -0.7664794921875, -0.72735595703125, -0.688232421875, -0.64910888671875, -0.6099853515625, -0.57086181640625, -0.53173828125, -0.49261474609375, -0.4534912109375, -0.41436767578125, -0.375244140625, -0.33612060546875, -0.2969970703125, -0.25787353515625, -0.21875, -0.17962646484375, -0.1405029296875, -0.10137939453125, -0.062255859375, -0.02313232421875, 0.0159912109375, 0.05511474609375, 0.09423828125, 0.13336181640625, 0.1724853515625, 0.21160888671875, 0.250732421875, 0.28985595703125, 0.3289794921875, 0.36810302734375, 0.4072265625, 0.44635009765625, 0.4854736328125, 0.52459716796875, 0.563720703125, 0.60284423828125, 0.6419677734375, 0.68109130859375, 0.72021484375, 0.75933837890625, 0.7984619140625, 0.83758544921875, 0.876708984375, 0.91583251953125, 0.9549560546875, 0.99407958984375, 1.033203125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 14.0, 9.0, 21.0, 9.0, 24.0, 19.0, 30.0, 28.0, 39.0, 56.0, 48.0, 61.0, 67.0, 53.0, 64.0, 62.0, 49.0, 58.0, 54.0, 36.0, 27.0, 41.0, 31.0, 22.0, 17.0, 18.0, 13.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.470703125, -0.4572868347167969, -0.44387054443359375, -0.4304542541503906, -0.4170379638671875, -0.4036216735839844, -0.39020538330078125, -0.3767890930175781, -0.363372802734375, -0.3499565124511719, -0.33654022216796875, -0.3231239318847656, -0.3097076416015625, -0.2962913513183594, -0.28287506103515625, -0.2694587707519531, -0.25604248046875, -0.24262619018554688, -0.22920989990234375, -0.21579360961914062, -0.2023773193359375, -0.18896102905273438, -0.17554473876953125, -0.16212844848632812, -0.148712158203125, -0.13529586791992188, -0.12187957763671875, -0.10846328735351562, -0.0950469970703125, -0.08163070678710938, -0.06821441650390625, -0.054798126220703125, -0.0413818359375, -0.027965545654296875, -0.01454925537109375, -0.001132965087890625, 0.0122833251953125, 0.025699615478515625, 0.03911590576171875, 0.052532196044921875, 0.065948486328125, 0.07936477661132812, 0.09278106689453125, 0.10619735717773438, 0.1196136474609375, 0.13302993774414062, 0.14644622802734375, 0.15986251831054688, 0.17327880859375, 0.18669509887695312, 0.20011138916015625, 0.21352767944335938, 0.2269439697265625, 0.24036026000976562, 0.25377655029296875, 0.2671928405761719, 0.280609130859375, 0.2940254211425781, 0.30744171142578125, 0.3208580017089844, 0.3342742919921875, 0.3476905822753906, 0.36110687255859375, 0.3745231628417969, 0.387939453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 0.0, 8.0, 8.0, 2.0, 7.0, 21.0, 15.0, 20.0, 28.0, 36.0, 52.0, 65.0, 82.0, 126.0, 166.0, 226.0, 303.0, 495.0, 759.0, 1306.0, 2893.0, 8769.0, 33708.0, 133582.0, 533514.0, 245356.0, 62706.0, 15249.0, 4487.0, 1736.0, 969.0, 534.0, 348.0, 288.0, 170.0, 130.0, 105.0, 77.0, 58.0, 27.0, 27.0, 22.0, 25.0, 15.0, 9.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.06640625, -2.0032501220703125, -1.940093994140625, -1.8769378662109375, -1.81378173828125, -1.7506256103515625, -1.687469482421875, -1.6243133544921875, -1.5611572265625, -1.4980010986328125, -1.434844970703125, -1.3716888427734375, -1.30853271484375, -1.2453765869140625, -1.182220458984375, -1.1190643310546875, -1.055908203125, -0.9927520751953125, -0.929595947265625, -0.8664398193359375, -0.80328369140625, -0.7401275634765625, -0.676971435546875, -0.6138153076171875, -0.5506591796875, -0.4875030517578125, -0.424346923828125, -0.3611907958984375, -0.29803466796875, -0.2348785400390625, -0.171722412109375, -0.1085662841796875, -0.04541015625, 0.0177459716796875, 0.080902099609375, 0.1440582275390625, 0.20721435546875, 0.2703704833984375, 0.333526611328125, 0.3966827392578125, 0.4598388671875, 0.5229949951171875, 0.586151123046875, 0.6493072509765625, 0.71246337890625, 0.7756195068359375, 0.838775634765625, 0.9019317626953125, 0.965087890625, 1.0282440185546875, 1.091400146484375, 1.1545562744140625, 1.21771240234375, 1.2808685302734375, 1.344024658203125, 1.4071807861328125, 1.4703369140625, 1.5334930419921875, 1.596649169921875, 1.6598052978515625, 1.72296142578125, 1.7861175537109375, 1.849273681640625, 1.9124298095703125, 1.9755859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 6.0, 3.0, 9.0, 7.0, 9.0, 10.0, 8.0, 12.0, 20.0, 21.0, 26.0, 33.0, 27.0, 42.0, 43.0, 54.0, 45.0, 56.0, 43.0, 48.0, 49.0, 52.0, 51.0, 47.0, 46.0, 38.0, 32.0, 36.0, 21.0, 14.0, 13.0, 11.0, 11.0, 9.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.912109375, -1.854644775390625, -1.79718017578125, -1.739715576171875, -1.6822509765625, -1.624786376953125, -1.56732177734375, -1.509857177734375, -1.452392578125, -1.394927978515625, -1.33746337890625, -1.279998779296875, -1.2225341796875, -1.165069580078125, -1.10760498046875, -1.050140380859375, -0.99267578125, -0.935211181640625, -0.87774658203125, -0.820281982421875, -0.7628173828125, -0.705352783203125, -0.64788818359375, -0.590423583984375, -0.532958984375, -0.475494384765625, -0.41802978515625, -0.360565185546875, -0.3031005859375, -0.245635986328125, -0.18817138671875, -0.130706787109375, -0.0732421875, -0.015777587890625, 0.04168701171875, 0.099151611328125, 0.1566162109375, 0.214080810546875, 0.27154541015625, 0.329010009765625, 0.386474609375, 0.443939208984375, 0.50140380859375, 0.558868408203125, 0.6163330078125, 0.673797607421875, 0.73126220703125, 0.788726806640625, 0.84619140625, 0.903656005859375, 0.96112060546875, 1.018585205078125, 1.0760498046875, 1.133514404296875, 1.19097900390625, 1.248443603515625, 1.305908203125, 1.363372802734375, 1.42083740234375, 1.478302001953125, 1.5357666015625, 1.593231201171875, 1.65069580078125, 1.708160400390625, 1.765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 12.0, 27.0, 45.0, 64.0, 110.0, 182.0, 336.0, 752.0, 2088.0, 6958.0, 34519.0, 203908.0, 650716.0, 120274.0, 21124.0, 4571.0, 1536.0, 653.0, 266.0, 120.0, 94.0, 60.0, 30.0, 25.0, 16.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.615234375, -1.571990966796875, -1.52874755859375, -1.485504150390625, -1.4422607421875, -1.399017333984375, -1.35577392578125, -1.312530517578125, -1.269287109375, -1.226043701171875, -1.18280029296875, -1.139556884765625, -1.0963134765625, -1.053070068359375, -1.00982666015625, -0.966583251953125, -0.92333984375, -0.880096435546875, -0.83685302734375, -0.793609619140625, -0.7503662109375, -0.707122802734375, -0.66387939453125, -0.620635986328125, -0.577392578125, -0.534149169921875, -0.49090576171875, -0.447662353515625, -0.4044189453125, -0.361175537109375, -0.31793212890625, -0.274688720703125, -0.2314453125, -0.188201904296875, -0.14495849609375, -0.101715087890625, -0.0584716796875, -0.015228271484375, 0.02801513671875, 0.071258544921875, 0.114501953125, 0.157745361328125, 0.20098876953125, 0.244232177734375, 0.2874755859375, 0.330718994140625, 0.37396240234375, 0.417205810546875, 0.46044921875, 0.503692626953125, 0.54693603515625, 0.590179443359375, 0.6334228515625, 0.676666259765625, 0.71990966796875, 0.763153076171875, 0.806396484375, 0.849639892578125, 0.89288330078125, 0.936126708984375, 0.9793701171875, 1.022613525390625, 1.06585693359375, 1.109100341796875, 1.15234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 11.0, 11.0, 20.0, 24.0, 26.0, 28.0, 32.0, 40.0, 50.0, 66.0, 132.0, 138.0, 97.0, 64.0, 45.0, 41.0, 32.0, 26.0, 15.0, 22.0, 8.0, 17.0, 14.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002073049545288086, -0.00019999034702777863, -0.00019267573952674866, -0.0001853611320257187, -0.00017804652452468872, -0.00017073191702365875, -0.00016341730952262878, -0.00015610270202159882, -0.00014878809452056885, -0.00014147348701953888, -0.0001341588795185089, -0.00012684427201747894, -0.00011952966451644897, -0.000112215057015419, -0.00010490044951438904, -9.758584201335907e-05, -9.02712345123291e-05, -8.295662701129913e-05, -7.564201951026917e-05, -6.83274120092392e-05, -6.101280450820923e-05, -5.369819700717926e-05, -4.638358950614929e-05, -3.9068982005119324e-05, -3.1754374504089355e-05, -2.4439767003059387e-05, -1.712515950202942e-05, -9.81055200099945e-06, -2.4959444999694824e-06, 4.818663001060486e-06, 1.2133270502090454e-05, 1.9447878003120422e-05, 2.676248550415039e-05, 3.407709300518036e-05, 4.139170050621033e-05, 4.8706308007240295e-05, 5.6020915508270264e-05, 6.333552300930023e-05, 7.06501305103302e-05, 7.796473801136017e-05, 8.527934551239014e-05, 9.25939530134201e-05, 9.990856051445007e-05, 0.00010722316801548004, 0.00011453777551651001, 0.00012185238301753998, 0.00012916699051856995, 0.00013648159801959991, 0.00014379620552062988, 0.00015111081302165985, 0.00015842542052268982, 0.0001657400280237198, 0.00017305463552474976, 0.00018036924302577972, 0.0001876838505268097, 0.00019499845802783966, 0.00020231306552886963, 0.0002096276730298996, 0.00021694228053092957, 0.00022425688803195953, 0.0002315714955329895, 0.00023888610303401947, 0.00024620071053504944, 0.0002535153180360794, 0.0002608299255371094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 5.0, 18.0, 34.0, 58.0, 140.0, 298.0, 973.0, 6640.0, 295915.0, 730399.0, 12061.0, 1344.0, 365.0, 144.0, 80.0, 36.0, 22.0, 11.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.1158447265625, -2.005126953125, -1.8944091796875, -1.78369140625, -1.6729736328125, -1.562255859375, -1.4515380859375, -1.3408203125, -1.2301025390625, -1.119384765625, -1.0086669921875, -0.89794921875, -0.7872314453125, -0.676513671875, -0.5657958984375, -0.455078125, -0.3443603515625, -0.233642578125, -0.1229248046875, -0.01220703125, 0.0985107421875, 0.209228515625, 0.3199462890625, 0.4306640625, 0.5413818359375, 0.652099609375, 0.7628173828125, 0.87353515625, 0.9842529296875, 1.094970703125, 1.2056884765625, 1.31640625, 1.4271240234375, 1.537841796875, 1.6485595703125, 1.75927734375, 1.8699951171875, 1.980712890625, 2.0914306640625, 2.2021484375, 2.3128662109375, 2.423583984375, 2.5343017578125, 2.64501953125, 2.7557373046875, 2.866455078125, 2.9771728515625, 3.087890625, 3.1986083984375, 3.309326171875, 3.4200439453125, 3.53076171875, 3.6414794921875, 3.752197265625, 3.8629150390625, 3.9736328125, 4.0843505859375, 4.195068359375, 4.3057861328125, 4.41650390625, 4.5272216796875, 4.637939453125, 4.7486572265625, 4.859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 14.0, 17.0, 22.0, 22.0, 32.0, 43.0, 42.0, 79.0, 102.0, 133.0, 112.0, 85.0, 71.0, 52.0, 44.0, 29.0, 22.0, 17.0, 7.0, 12.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.134765625, -1.0979461669921875, -1.061126708984375, -1.0243072509765625, -0.98748779296875, -0.9506683349609375, -0.913848876953125, -0.8770294189453125, -0.8402099609375, -0.8033905029296875, -0.766571044921875, -0.7297515869140625, -0.69293212890625, -0.6561126708984375, -0.619293212890625, -0.5824737548828125, -0.545654296875, -0.5088348388671875, -0.472015380859375, -0.4351959228515625, -0.39837646484375, -0.3615570068359375, -0.324737548828125, -0.2879180908203125, -0.2510986328125, -0.2142791748046875, -0.177459716796875, -0.1406402587890625, -0.10382080078125, -0.0670013427734375, -0.030181884765625, 0.0066375732421875, 0.04345703125, 0.0802764892578125, 0.117095947265625, 0.1539154052734375, 0.19073486328125, 0.2275543212890625, 0.264373779296875, 0.3011932373046875, 0.3380126953125, 0.3748321533203125, 0.411651611328125, 0.4484710693359375, 0.48529052734375, 0.5221099853515625, 0.558929443359375, 0.5957489013671875, 0.632568359375, 0.6693878173828125, 0.706207275390625, 0.7430267333984375, 0.77984619140625, 0.8166656494140625, 0.853485107421875, 0.8903045654296875, 0.9271240234375, 0.9639434814453125, 1.000762939453125, 1.0375823974609375, 1.07440185546875, 1.1112213134765625, 1.148040771484375, 1.1848602294921875, 1.2216796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 17.0, 41.0, 73.0, 122.0, 176.0, 195.0, 168.0, 111.0, 53.0, 27.0, 7.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.097789764404297, -18.418212890625, -17.738636016845703, -17.059059143066406, -16.37948226928711, -15.699904441833496, -15.020326614379883, -14.340749740600586, -13.661172866821289, -12.981595993041992, -12.302019119262695, -11.622441291809082, -10.942864418029785, -10.263287544250488, -9.583709716796875, -8.904132843017578, -8.224555969238281, -7.544979095458984, -6.865401744842529, -6.185824394226074, -5.506247520446777, -4.8266706466674805, -4.147093296051025, -3.4675159454345703, -2.7879390716552734, -2.1083619594573975, -1.4287848472595215, -0.7492077350616455, -0.06963062286376953, 0.6099464893341064, 1.2895236015319824, 1.9691009521484375, 2.648679733276367, 3.328256845474243, 4.007833957672119, 4.687411308288574, 5.366988182067871, 6.046565055847168, 6.726142406463623, 7.405719757080078, 8.085296630859375, 8.764873504638672, 9.444450378417969, 10.124028205871582, 10.803605079650879, 11.483181953430176, 12.162759780883789, 12.842336654663086, 13.521913528442383, 14.20149040222168, 14.881067276000977, 15.56064510345459, 16.240222930908203, 16.9197998046875, 17.599376678466797, 18.278953552246094, 18.95853042602539, 19.638107299804688, 20.317684173583984, 20.99726104736328, 21.676837921142578, 22.356416702270508, 23.035993576049805, 23.7155704498291, 24.3951473236084]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 8.0, 9.0, 11.0, 17.0, 19.0, 18.0, 27.0, 24.0, 27.0, 28.0, 31.0, 36.0, 27.0, 36.0, 33.0, 35.0, 46.0, 32.0, 58.0, 41.0, 54.0, 42.0, 37.0, 38.0, 33.0, 31.0, 37.0, 17.0, 20.0, 24.0, 12.0, 18.0, 13.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.588407516479492, -8.307476043701172, -8.026544570922852, -7.745614051818848, -7.464682579040527, -7.183751106262207, -6.902820110321045, -6.621889114379883, -6.3409576416015625, -6.060026168823242, -5.77909517288208, -5.498164176940918, -5.217232704162598, -4.936301231384277, -4.655370235443115, -4.374439239501953, -4.093507766723633, -3.8125765323638916, -3.5316452980041504, -3.250714063644409, -2.969782829284668, -2.6888515949249268, -2.4079203605651855, -2.1269891262054443, -1.8460578918457031, -1.565126657485962, -1.2841954231262207, -1.0032641887664795, -0.7223329544067383, -0.44140172004699707, -0.16047048568725586, 0.12046074867248535, 0.40139102935791016, 0.6823222637176514, 0.9632534980773926, 1.2441847324371338, 1.525115966796875, 1.8060472011566162, 2.0869784355163574, 2.3679096698760986, 2.64884090423584, 2.929772138595581, 3.2107033729553223, 3.4916346073150635, 3.7725658416748047, 4.053497314453125, 4.334428310394287, 4.615359306335449, 4.8962907791137695, 5.17722225189209, 5.458153247833252, 5.739084243774414, 6.020015716552734, 6.300947189331055, 6.581878185272217, 6.862809181213379, 7.143740653991699, 7.4246721267700195, 7.705603122711182, 7.986534118652344, 8.267465591430664, 8.548397064208984, 8.829328536987305, 9.110259056091309, 9.391190528869629]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 12.0, 29.0, 37.0, 85.0, 142.0, 208.0, 393.0, 740.0, 1567.0, 3530.0, 8469.0, 23897.0, 81698.0, 496976.0, 3291564.0, 210927.0, 48169.0, 15365.0, 5733.0, 2432.0, 1101.0, 549.0, 241.0, 172.0, 92.0, 48.0, 33.0, 27.0, 14.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1494293212890625, -1.092803955078125, -1.0361785888671875, -0.97955322265625, -0.9229278564453125, -0.866302490234375, -0.8096771240234375, -0.7530517578125, -0.6964263916015625, -0.639801025390625, -0.5831756591796875, -0.52655029296875, -0.4699249267578125, -0.413299560546875, -0.3566741943359375, -0.300048828125, -0.2434234619140625, -0.186798095703125, -0.1301727294921875, -0.07354736328125, -0.0169219970703125, 0.039703369140625, 0.0963287353515625, 0.1529541015625, 0.2095794677734375, 0.266204833984375, 0.3228302001953125, 0.37945556640625, 0.4360809326171875, 0.492706298828125, 0.5493316650390625, 0.60595703125, 0.6625823974609375, 0.719207763671875, 0.7758331298828125, 0.83245849609375, 0.8890838623046875, 0.945709228515625, 1.0023345947265625, 1.0589599609375, 1.1155853271484375, 1.172210693359375, 1.2288360595703125, 1.28546142578125, 1.3420867919921875, 1.398712158203125, 1.4553375244140625, 1.511962890625, 1.5685882568359375, 1.625213623046875, 1.6818389892578125, 1.73846435546875, 1.7950897216796875, 1.851715087890625, 1.9083404541015625, 1.9649658203125, 2.0215911865234375, 2.078216552734375, 2.1348419189453125, 2.19146728515625, 2.2480926513671875, 2.304718017578125, 2.3613433837890625, 2.41796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 9.0, 7.0, 13.0, 19.0, 17.0, 18.0, 18.0, 22.0, 27.0, 38.0, 52.0, 48.0, 57.0, 63.0, 45.0, 52.0, 58.0, 58.0, 56.0, 43.0, 52.0, 40.0, 32.0, 13.0, 30.0, 25.0, 22.0, 15.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.48095703125, -0.4669036865234375, -0.452850341796875, -0.4387969970703125, -0.42474365234375, -0.4106903076171875, -0.396636962890625, -0.3825836181640625, -0.3685302734375, -0.3544769287109375, -0.340423583984375, -0.3263702392578125, -0.31231689453125, -0.2982635498046875, -0.284210205078125, -0.2701568603515625, -0.256103515625, -0.2420501708984375, -0.227996826171875, -0.2139434814453125, -0.19989013671875, -0.1858367919921875, -0.171783447265625, -0.1577301025390625, -0.1436767578125, -0.1296234130859375, -0.115570068359375, -0.1015167236328125, -0.08746337890625, -0.0734100341796875, -0.059356689453125, -0.0453033447265625, -0.03125, -0.0171966552734375, -0.003143310546875, 0.0109100341796875, 0.02496337890625, 0.0390167236328125, 0.053070068359375, 0.0671234130859375, 0.0811767578125, 0.0952301025390625, 0.109283447265625, 0.1233367919921875, 0.13739013671875, 0.1514434814453125, 0.165496826171875, 0.1795501708984375, 0.193603515625, 0.2076568603515625, 0.221710205078125, 0.2357635498046875, 0.24981689453125, 0.2638702392578125, 0.277923583984375, 0.2919769287109375, 0.3060302734375, 0.3200836181640625, 0.334136962890625, 0.3481903076171875, 0.36224365234375, 0.3762969970703125, 0.390350341796875, 0.4044036865234375, 0.41845703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 9.0, 20.0, 14.0, 25.0, 42.0, 61.0, 92.0, 168.0, 266.0, 481.0, 882.0, 1597.0, 3058.0, 6295.0, 13736.0, 32240.0, 87184.0, 302477.0, 2700713.0, 789608.0, 161127.0, 53781.0, 21490.0, 9415.0, 4506.0, 2207.0, 1188.0, 639.0, 353.0, 201.0, 119.0, 90.0, 54.0, 51.0, 26.0, 10.0, 17.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3515625, -1.3076324462890625, -1.263702392578125, -1.2197723388671875, -1.17584228515625, -1.1319122314453125, -1.087982177734375, -1.0440521240234375, -1.0001220703125, -0.9561920166015625, -0.912261962890625, -0.8683319091796875, -0.82440185546875, -0.7804718017578125, -0.736541748046875, -0.6926116943359375, -0.648681640625, -0.6047515869140625, -0.560821533203125, -0.5168914794921875, -0.47296142578125, -0.4290313720703125, -0.385101318359375, -0.3411712646484375, -0.2972412109375, -0.2533111572265625, -0.209381103515625, -0.1654510498046875, -0.12152099609375, -0.0775909423828125, -0.033660888671875, 0.0102691650390625, 0.05419921875, 0.0981292724609375, 0.142059326171875, 0.1859893798828125, 0.22991943359375, 0.2738494873046875, 0.317779541015625, 0.3617095947265625, 0.4056396484375, 0.4495697021484375, 0.493499755859375, 0.5374298095703125, 0.58135986328125, 0.6252899169921875, 0.669219970703125, 0.7131500244140625, 0.757080078125, 0.8010101318359375, 0.844940185546875, 0.8888702392578125, 0.93280029296875, 0.9767303466796875, 1.020660400390625, 1.0645904541015625, 1.1085205078125, 1.1524505615234375, 1.196380615234375, 1.2403106689453125, 1.28424072265625, 1.3281707763671875, 1.372100830078125, 1.4160308837890625, 1.4599609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 13.0, 16.0, 20.0, 40.0, 48.0, 63.0, 116.0, 156.0, 238.0, 527.0, 1504.0, 581.0, 275.0, 138.0, 109.0, 53.0, 53.0, 32.0, 25.0, 9.0, 10.0, 7.0, 4.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.037109375, -1.0061798095703125, -0.975250244140625, -0.9443206787109375, -0.91339111328125, -0.8824615478515625, -0.851531982421875, -0.8206024169921875, -0.7896728515625, -0.7587432861328125, -0.727813720703125, -0.6968841552734375, -0.66595458984375, -0.6350250244140625, -0.604095458984375, -0.5731658935546875, -0.542236328125, -0.5113067626953125, -0.480377197265625, -0.4494476318359375, -0.41851806640625, -0.3875885009765625, -0.356658935546875, -0.3257293701171875, -0.2947998046875, -0.2638702392578125, -0.232940673828125, -0.2020111083984375, -0.17108154296875, -0.1401519775390625, -0.109222412109375, -0.0782928466796875, -0.04736328125, -0.0164337158203125, 0.014495849609375, 0.0454254150390625, 0.07635498046875, 0.1072845458984375, 0.138214111328125, 0.1691436767578125, 0.2000732421875, 0.2310028076171875, 0.261932373046875, 0.2928619384765625, 0.32379150390625, 0.3547210693359375, 0.385650634765625, 0.4165802001953125, 0.447509765625, 0.4784393310546875, 0.509368896484375, 0.5402984619140625, 0.57122802734375, 0.6021575927734375, 0.633087158203125, 0.6640167236328125, 0.6949462890625, 0.7258758544921875, 0.756805419921875, 0.7877349853515625, 0.81866455078125, 0.8495941162109375, 0.880523681640625, 0.9114532470703125, 0.9423828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 23.0, 43.0, 65.0, 122.0, 161.0, 168.0, 161.0, 120.0, 76.0, 26.0, 16.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.415340423583984, -13.128097534179688, -12.84085464477539, -12.553610801696777, -12.26636791229248, -11.979125022888184, -11.691882133483887, -11.40463924407959, -11.117395401000977, -10.83015251159668, -10.542909622192383, -10.25566577911377, -9.968422889709473, -9.681180000305176, -9.393937110900879, -9.106694221496582, -8.819451332092285, -8.532208442687988, -8.244965553283691, -7.957722187042236, -7.670478820800781, -7.383235931396484, -7.0959930419921875, -6.808750152587891, -6.5215067863464355, -6.234263896942139, -5.947020530700684, -5.659777641296387, -5.37253475189209, -5.085291385650635, -4.798048496246338, -4.510805130004883, -4.223561763763428, -3.9363186359405518, -3.649075508117676, -3.361832618713379, -3.074589490890503, -2.787346363067627, -2.50010347366333, -2.212860345840454, -1.9256172180175781, -1.6383740901947021, -1.3511310815811157, -1.0638880729675293, -0.7766449451446533, -0.48940181732177734, -0.20215880870819092, 0.08508419990539551, 0.3723273277282715, 0.6595703959465027, 0.9468134641647339, 1.2340564727783203, 1.5212996006011963, 1.8085427284240723, 2.095785617828369, 2.383028745651245, 2.670271873474121, 2.957515001296997, 3.244758129119873, 3.53200101852417, 3.819244146347046, 4.106487274169922, 4.393730163574219, 4.680973052978516, 4.968216419219971]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 11.0, 7.0, 8.0, 14.0, 18.0, 27.0, 23.0, 30.0, 31.0, 33.0, 40.0, 45.0, 39.0, 42.0, 55.0, 40.0, 51.0, 52.0, 49.0, 37.0, 40.0, 42.0, 40.0, 32.0, 36.0, 26.0, 14.0, 15.0, 20.0, 18.0, 13.0, 13.0, 8.0, 5.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5559964179992676, -3.444936990737915, -3.3338775634765625, -3.222817897796631, -3.1117584705352783, -3.000699043273926, -2.889639377593994, -2.7785799503326416, -2.667520523071289, -2.5564610958099365, -2.445401668548584, -2.3343420028686523, -2.2232825756073, -2.1122231483459473, -2.0011634826660156, -1.890104055404663, -1.7790446281433105, -1.667985200881958, -1.556925654411316, -1.4458661079406738, -1.3348066806793213, -1.2237472534179688, -1.1126877069473267, -1.0016281604766846, -0.890568733215332, -0.7795092463493347, -0.6684497594833374, -0.5573902726173401, -0.4463307857513428, -0.33527129888534546, -0.22421181201934814, -0.11315232515335083, -0.002092599868774414, 0.1089668869972229, 0.22002637386322021, 0.33108586072921753, 0.44214534759521484, 0.5532048344612122, 0.6642643213272095, 0.7753238081932068, 0.8863832950592041, 0.9974427819252014, 1.1085022687911987, 1.2195618152618408, 1.3306212425231934, 1.441680669784546, 1.552740216255188, 1.66379976272583, 1.7748591899871826, 1.8859186172485352, 1.9969781637191772, 2.1080377101898193, 2.219097137451172, 2.3301565647125244, 2.441215991973877, 2.5522756576538086, 2.663335084915161, 2.7743945121765137, 2.8854541778564453, 2.996513605117798, 3.1075730323791504, 3.218632459640503, 3.3296918869018555, 3.440751552581787, 3.5518109798431396]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 13.0, 14.0, 29.0, 33.0, 67.0, 76.0, 137.0, 245.0, 427.0, 840.0, 1776.0, 3769.0, 8665.0, 20849.0, 50929.0, 121193.0, 245005.0, 289868.0, 173067.0, 76268.0, 31447.0, 12981.0, 5683.0, 2543.0, 1198.0, 598.0, 333.0, 185.0, 112.0, 79.0, 44.0, 29.0, 11.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4384765625, -1.3951873779296875, -1.351898193359375, -1.3086090087890625, -1.26531982421875, -1.2220306396484375, -1.178741455078125, -1.1354522705078125, -1.0921630859375, -1.0488739013671875, -1.005584716796875, -0.9622955322265625, -0.91900634765625, -0.8757171630859375, -0.832427978515625, -0.7891387939453125, -0.745849609375, -0.7025604248046875, -0.659271240234375, -0.6159820556640625, -0.57269287109375, -0.5294036865234375, -0.486114501953125, -0.4428253173828125, -0.3995361328125, -0.3562469482421875, -0.312957763671875, -0.2696685791015625, -0.22637939453125, -0.1830902099609375, -0.139801025390625, -0.0965118408203125, -0.05322265625, -0.0099334716796875, 0.033355712890625, 0.0766448974609375, 0.11993408203125, 0.1632232666015625, 0.206512451171875, 0.2498016357421875, 0.2930908203125, 0.3363800048828125, 0.379669189453125, 0.4229583740234375, 0.46624755859375, 0.5095367431640625, 0.552825927734375, 0.5961151123046875, 0.639404296875, 0.6826934814453125, 0.725982666015625, 0.7692718505859375, 0.81256103515625, 0.8558502197265625, 0.899139404296875, 0.9424285888671875, 0.9857177734375, 1.0290069580078125, 1.072296142578125, 1.1155853271484375, 1.15887451171875, 1.2021636962890625, 1.245452880859375, 1.2887420654296875, 1.33203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 3.0, 6.0, 13.0, 13.0, 9.0, 18.0, 22.0, 26.0, 24.0, 37.0, 37.0, 31.0, 47.0, 46.0, 40.0, 51.0, 51.0, 62.0, 59.0, 58.0, 48.0, 47.0, 46.0, 42.0, 32.0, 32.0, 22.0, 22.0, 11.0, 11.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4773597717285156, -0.46277618408203125, -0.4481925964355469, -0.4336090087890625, -0.4190254211425781, -0.40444183349609375, -0.3898582458496094, -0.375274658203125, -0.3606910705566406, -0.34610748291015625, -0.3315238952636719, -0.3169403076171875, -0.3023567199707031, -0.28777313232421875, -0.2731895446777344, -0.25860595703125, -0.24402236938476562, -0.22943878173828125, -0.21485519409179688, -0.2002716064453125, -0.18568801879882812, -0.17110443115234375, -0.15652084350585938, -0.141937255859375, -0.12735366821289062, -0.11277008056640625, -0.09818649291992188, -0.0836029052734375, -0.06901931762695312, -0.05443572998046875, -0.039852142333984375, -0.0252685546875, -0.010684967041015625, 0.00389862060546875, 0.018482208251953125, 0.0330657958984375, 0.047649383544921875, 0.06223297119140625, 0.07681655883789062, 0.091400146484375, 0.10598373413085938, 0.12056732177734375, 0.13515090942382812, 0.1497344970703125, 0.16431808471679688, 0.17890167236328125, 0.19348526000976562, 0.20806884765625, 0.22265243530273438, 0.23723602294921875, 0.2518196105957031, 0.2664031982421875, 0.2809867858886719, 0.29557037353515625, 0.3101539611816406, 0.324737548828125, 0.3393211364746094, 0.35390472412109375, 0.3684883117675781, 0.3830718994140625, 0.3976554870605469, 0.41223907470703125, 0.4268226623535156, 0.44140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 9.0, 5.0, 25.0, 25.0, 29.0, 39.0, 72.0, 87.0, 107.0, 202.0, 273.0, 433.0, 726.0, 1355.0, 3601.0, 15184.0, 92782.0, 481092.0, 372010.0, 63588.0, 11118.0, 2744.0, 1159.0, 607.0, 380.0, 274.0, 194.0, 137.0, 93.0, 49.0, 52.0, 33.0, 12.0, 17.0, 7.0, 11.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.376495361328125, -2.28814697265625, -2.199798583984375, -2.1114501953125, -2.023101806640625, -1.93475341796875, -1.846405029296875, -1.758056640625, -1.669708251953125, -1.58135986328125, -1.493011474609375, -1.4046630859375, -1.316314697265625, -1.22796630859375, -1.139617919921875, -1.05126953125, -0.962921142578125, -0.87457275390625, -0.786224365234375, -0.6978759765625, -0.609527587890625, -0.52117919921875, -0.432830810546875, -0.344482421875, -0.256134033203125, -0.16778564453125, -0.079437255859375, 0.0089111328125, 0.097259521484375, 0.18560791015625, 0.273956298828125, 0.3623046875, 0.450653076171875, 0.53900146484375, 0.627349853515625, 0.7156982421875, 0.804046630859375, 0.89239501953125, 0.980743408203125, 1.069091796875, 1.157440185546875, 1.24578857421875, 1.334136962890625, 1.4224853515625, 1.510833740234375, 1.59918212890625, 1.687530517578125, 1.77587890625, 1.864227294921875, 1.95257568359375, 2.040924072265625, 2.1292724609375, 2.217620849609375, 2.30596923828125, 2.394317626953125, 2.482666015625, 2.571014404296875, 2.65936279296875, 2.747711181640625, 2.8360595703125, 2.924407958984375, 3.01275634765625, 3.101104736328125, 3.189453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 13.0, 5.0, 9.0, 12.0, 12.0, 18.0, 17.0, 18.0, 21.0, 36.0, 26.0, 37.0, 32.0, 29.0, 35.0, 44.0, 47.0, 36.0, 46.0, 47.0, 38.0, 49.0, 41.0, 38.0, 24.0, 28.0, 31.0, 23.0, 20.0, 26.0, 16.0, 17.0, 17.0, 13.0, 16.0, 10.0, 14.0, 5.0, 3.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.017578125, -1.952178955078125, -1.88677978515625, -1.821380615234375, -1.7559814453125, -1.690582275390625, -1.62518310546875, -1.559783935546875, -1.494384765625, -1.428985595703125, -1.36358642578125, -1.298187255859375, -1.2327880859375, -1.167388916015625, -1.10198974609375, -1.036590576171875, -0.97119140625, -0.905792236328125, -0.84039306640625, -0.774993896484375, -0.7095947265625, -0.644195556640625, -0.57879638671875, -0.513397216796875, -0.447998046875, -0.382598876953125, -0.31719970703125, -0.251800537109375, -0.1864013671875, -0.121002197265625, -0.05560302734375, 0.009796142578125, 0.0751953125, 0.140594482421875, 0.20599365234375, 0.271392822265625, 0.3367919921875, 0.402191162109375, 0.46759033203125, 0.532989501953125, 0.598388671875, 0.663787841796875, 0.72918701171875, 0.794586181640625, 0.8599853515625, 0.925384521484375, 0.99078369140625, 1.056182861328125, 1.12158203125, 1.186981201171875, 1.25238037109375, 1.317779541015625, 1.3831787109375, 1.448577880859375, 1.51397705078125, 1.579376220703125, 1.644775390625, 1.710174560546875, 1.77557373046875, 1.840972900390625, 1.9063720703125, 1.971771240234375, 2.03717041015625, 2.102569580078125, 2.16796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 7.0, 6.0, 8.0, 6.0, 11.0, 15.0, 19.0, 36.0, 55.0, 82.0, 130.0, 272.0, 540.0, 1065.0, 2343.0, 6647.0, 23043.0, 97857.0, 416354.0, 381691.0, 87634.0, 20363.0, 6097.0, 2217.0, 955.0, 473.0, 251.0, 132.0, 95.0, 42.0, 31.0, 31.0, 18.0, 11.0, 9.0, 1.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9666900634765625, -0.924591064453125, -0.8824920654296875, -0.84039306640625, -0.7982940673828125, -0.756195068359375, -0.7140960693359375, -0.6719970703125, -0.6298980712890625, -0.587799072265625, -0.5457000732421875, -0.50360107421875, -0.4615020751953125, -0.419403076171875, -0.3773040771484375, -0.335205078125, -0.2931060791015625, -0.251007080078125, -0.2089080810546875, -0.16680908203125, -0.1247100830078125, -0.082611083984375, -0.0405120849609375, 0.0015869140625, 0.0436859130859375, 0.085784912109375, 0.1278839111328125, 0.16998291015625, 0.2120819091796875, 0.254180908203125, 0.2962799072265625, 0.33837890625, 0.3804779052734375, 0.422576904296875, 0.4646759033203125, 0.50677490234375, 0.5488739013671875, 0.590972900390625, 0.6330718994140625, 0.6751708984375, 0.7172698974609375, 0.759368896484375, 0.8014678955078125, 0.84356689453125, 0.8856658935546875, 0.927764892578125, 0.9698638916015625, 1.011962890625, 1.0540618896484375, 1.096160888671875, 1.1382598876953125, 1.18035888671875, 1.2224578857421875, 1.264556884765625, 1.3066558837890625, 1.3487548828125, 1.3908538818359375, 1.432952880859375, 1.4750518798828125, 1.51715087890625, 1.5592498779296875, 1.601348876953125, 1.6434478759765625, 1.685546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 2.0, 7.0, 13.0, 24.0, 25.0, 27.0, 37.0, 55.0, 60.0, 83.0, 105.0, 96.0, 104.0, 74.0, 56.0, 54.0, 37.0, 30.0, 23.0, 19.0, 16.0, 5.0, 18.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031280517578125, -0.0003044009208679199, -0.00029599666595458984, -0.00028759241104125977, -0.0002791881561279297, -0.0002707839012145996, -0.00026237964630126953, -0.00025397539138793945, -0.0002455711364746094, -0.0002371668815612793, -0.00022876262664794922, -0.00022035837173461914, -0.00021195411682128906, -0.00020354986190795898, -0.0001951456069946289, -0.00018674135208129883, -0.00017833709716796875, -0.00016993284225463867, -0.0001615285873413086, -0.00015312433242797852, -0.00014472007751464844, -0.00013631582260131836, -0.00012791156768798828, -0.0001195073127746582, -0.00011110305786132812, -0.00010269880294799805, -9.429454803466797e-05, -8.589029312133789e-05, -7.748603820800781e-05, -6.908178329467773e-05, -6.0677528381347656e-05, -5.227327346801758e-05, -4.38690185546875e-05, -3.546476364135742e-05, -2.7060508728027344e-05, -1.8656253814697266e-05, -1.0251998901367188e-05, -1.8477439880371094e-06, 6.556510925292969e-06, 1.4960765838623047e-05, 2.3365020751953125e-05, 3.17692756652832e-05, 4.017353057861328e-05, 4.857778549194336e-05, 5.698204040527344e-05, 6.538629531860352e-05, 7.37905502319336e-05, 8.219480514526367e-05, 9.059906005859375e-05, 9.900331497192383e-05, 0.0001074075698852539, 0.00011581182479858398, 0.00012421607971191406, 0.00013262033462524414, 0.00014102458953857422, 0.0001494288444519043, 0.00015783309936523438, 0.00016623735427856445, 0.00017464160919189453, 0.0001830458641052246, 0.0001914501190185547, 0.00019985437393188477, 0.00020825862884521484, 0.00021666288375854492, 0.000225067138671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 15.0, 9.0, 13.0, 20.0, 22.0, 47.0, 59.0, 85.0, 135.0, 169.0, 279.0, 510.0, 894.0, 1681.0, 3518.0, 8885.0, 27734.0, 105180.0, 403992.0, 363862.0, 91701.0, 24592.0, 8141.0, 3237.0, 1542.0, 829.0, 473.0, 294.0, 181.0, 142.0, 81.0, 53.0, 38.0, 33.0, 31.0, 16.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2265625, -1.1869354248046875, -1.147308349609375, -1.1076812744140625, -1.06805419921875, -1.0284271240234375, -0.988800048828125, -0.9491729736328125, -0.9095458984375, -0.8699188232421875, -0.830291748046875, -0.7906646728515625, -0.75103759765625, -0.7114105224609375, -0.671783447265625, -0.6321563720703125, -0.592529296875, -0.5529022216796875, -0.513275146484375, -0.4736480712890625, -0.43402099609375, -0.3943939208984375, -0.354766845703125, -0.3151397705078125, -0.2755126953125, -0.2358856201171875, -0.196258544921875, -0.1566314697265625, -0.11700439453125, -0.0773773193359375, -0.037750244140625, 0.0018768310546875, 0.04150390625, 0.0811309814453125, 0.120758056640625, 0.1603851318359375, 0.20001220703125, 0.2396392822265625, 0.279266357421875, 0.3188934326171875, 0.3585205078125, 0.3981475830078125, 0.437774658203125, 0.4774017333984375, 0.51702880859375, 0.5566558837890625, 0.596282958984375, 0.6359100341796875, 0.675537109375, 0.7151641845703125, 0.754791259765625, 0.7944183349609375, 0.83404541015625, 0.8736724853515625, 0.913299560546875, 0.9529266357421875, 0.9925537109375, 1.0321807861328125, 1.071807861328125, 1.1114349365234375, 1.15106201171875, 1.1906890869140625, 1.230316162109375, 1.2699432373046875, 1.3095703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 5.0, 6.0, 11.0, 15.0, 21.0, 20.0, 29.0, 28.0, 39.0, 48.0, 58.0, 55.0, 63.0, 63.0, 83.0, 77.0, 54.0, 59.0, 44.0, 37.0, 39.0, 27.0, 30.0, 13.0, 14.0, 16.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1119232177734375, -1.078338623046875, -1.0447540283203125, -1.01116943359375, -0.9775848388671875, -0.944000244140625, -0.9104156494140625, -0.8768310546875, -0.8432464599609375, -0.809661865234375, -0.7760772705078125, -0.74249267578125, -0.7089080810546875, -0.675323486328125, -0.6417388916015625, -0.608154296875, -0.5745697021484375, -0.540985107421875, -0.5074005126953125, -0.47381591796875, -0.4402313232421875, -0.406646728515625, -0.3730621337890625, -0.3394775390625, -0.3058929443359375, -0.272308349609375, -0.2387237548828125, -0.20513916015625, -0.1715545654296875, -0.137969970703125, -0.1043853759765625, -0.07080078125, -0.0372161865234375, -0.003631591796875, 0.0299530029296875, 0.06353759765625, 0.0971221923828125, 0.130706787109375, 0.1642913818359375, 0.1978759765625, 0.2314605712890625, 0.265045166015625, 0.2986297607421875, 0.33221435546875, 0.3657989501953125, 0.399383544921875, 0.4329681396484375, 0.466552734375, 0.5001373291015625, 0.533721923828125, 0.5673065185546875, 0.60089111328125, 0.6344757080078125, 0.668060302734375, 0.7016448974609375, 0.7352294921875, 0.7688140869140625, 0.802398681640625, 0.8359832763671875, 0.86956787109375, 0.9031524658203125, 0.936737060546875, 0.9703216552734375, 1.00390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 13.0, 28.0, 67.0, 104.0, 146.0, 165.0, 159.0, 143.0, 77.0, 43.0, 20.0, 21.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.57615852355957, -22.898099899291992, -22.22003936767578, -21.541980743408203, -20.863920211791992, -20.185861587524414, -19.507801055908203, -18.829742431640625, -18.151683807373047, -17.47362518310547, -16.795564651489258, -16.11750602722168, -15.439445495605469, -14.76138687133789, -14.083327293395996, -13.405267715454102, -12.72720718383789, -12.049147605895996, -11.371088027954102, -10.693029403686523, -10.014968872070312, -9.336910247802734, -8.65885066986084, -7.980791091918945, -7.302731513977051, -6.624671936035156, -5.946612358093262, -5.268553256988525, -4.590493679046631, -3.9124341011047363, -3.234375, -2.5563154220581055, -1.8782539367675781, -1.2001944780349731, -0.5221350193023682, 0.15592432022094727, 0.8339838981628418, 1.5120434761047363, 2.1901025772094727, 2.868162155151367, 3.5462217330932617, 4.224281311035156, 4.902340888977051, 5.580399990081787, 6.258459568023682, 6.936519145965576, 7.6145782470703125, 8.292637825012207, 8.970697402954102, 9.648756980895996, 10.32681655883789, 11.004875183105469, 11.68293571472168, 12.360994338989258, 13.039053916931152, 13.717113494873047, 14.395173072814941, 15.073232650756836, 15.75129222869873, 16.429351806640625, 17.107410430908203, 17.785470962524414, 18.463529586791992, 19.141590118408203, 19.81964874267578]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 7.0, 3.0, 4.0, 13.0, 11.0, 14.0, 8.0, 11.0, 16.0, 11.0, 26.0, 21.0, 28.0, 31.0, 36.0, 43.0, 42.0, 34.0, 37.0, 46.0, 43.0, 45.0, 48.0, 56.0, 41.0, 43.0, 44.0, 37.0, 33.0, 25.0, 20.0, 19.0, 21.0, 12.0, 11.0, 11.0, 13.0, 6.0, 10.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.2324857711792, -10.869551658630371, -10.506617546081543, -10.143683433532715, -9.78074836730957, -9.417814254760742, -9.054880142211914, -8.691946029663086, -8.329011917114258, -7.96607780456543, -7.603143692016602, -7.240209102630615, -6.877274990081787, -6.514340877532959, -6.151406288146973, -5.7884721755981445, -5.425538063049316, -5.062603950500488, -4.69966983795166, -4.336735248565674, -3.9738011360168457, -3.6108670234680176, -3.2479326725006104, -2.884998321533203, -2.522064208984375, -2.159130096435547, -1.7961957454681396, -1.433261513710022, -1.0703272819519043, -0.7073930501937866, -0.34445881843566895, 0.01847553253173828, 0.3814096450805664, 0.7443438768386841, 1.1072781085968018, 1.4702123403549194, 1.833146572113037, 2.1960806846618652, 2.5590150356292725, 2.9219493865966797, 3.284883499145508, 3.647817611694336, 4.010751724243164, 4.37368631362915, 4.7366204261779785, 5.099554538726807, 5.462489128112793, 5.825423240661621, 6.188357353210449, 6.551291465759277, 6.9142255783081055, 7.277160167694092, 7.64009428024292, 8.003028869628906, 8.365962982177734, 8.728897094726562, 9.09183120727539, 9.454765319824219, 9.817699432373047, 10.180633544921875, 10.543567657470703, 10.906502723693848, 11.269436836242676, 11.632370948791504, 11.995305061340332]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 6.0, 0.0, 2.0, 5.0, 13.0, 10.0, 13.0, 30.0, 31.0, 44.0, 83.0, 88.0, 154.0, 204.0, 349.0, 538.0, 851.0, 1534.0, 2703.0, 5881.0, 16038.0, 67660.0, 3908214.0, 148674.0, 24630.0, 8255.0, 3631.0, 1858.0, 1010.0, 592.0, 375.0, 237.0, 187.0, 110.0, 79.0, 46.0, 44.0, 32.0, 21.0, 11.0, 11.0, 9.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.949462890625, -1.87353515625, -1.797607421875, -1.7216796875, -1.645751953125, -1.56982421875, -1.493896484375, -1.41796875, -1.342041015625, -1.26611328125, -1.190185546875, -1.1142578125, -1.038330078125, -0.96240234375, -0.886474609375, -0.810546875, -0.734619140625, -0.65869140625, -0.582763671875, -0.5068359375, -0.430908203125, -0.35498046875, -0.279052734375, -0.203125, -0.127197265625, -0.05126953125, 0.024658203125, 0.1005859375, 0.176513671875, 0.25244140625, 0.328369140625, 0.404296875, 0.480224609375, 0.55615234375, 0.632080078125, 0.7080078125, 0.783935546875, 0.85986328125, 0.935791015625, 1.01171875, 1.087646484375, 1.16357421875, 1.239501953125, 1.3154296875, 1.391357421875, 1.46728515625, 1.543212890625, 1.619140625, 1.695068359375, 1.77099609375, 1.846923828125, 1.9228515625, 1.998779296875, 2.07470703125, 2.150634765625, 2.2265625, 2.302490234375, 2.37841796875, 2.454345703125, 2.5302734375, 2.606201171875, 2.68212890625, 2.758056640625, 2.833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 7.0, 12.0, 11.0, 21.0, 17.0, 24.0, 17.0, 31.0, 36.0, 37.0, 49.0, 40.0, 46.0, 52.0, 57.0, 57.0, 57.0, 70.0, 47.0, 38.0, 46.0, 41.0, 33.0, 25.0, 22.0, 15.0, 10.0, 14.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.62060546875, -0.6035995483398438, -0.5865936279296875, -0.5695877075195312, -0.552581787109375, -0.5355758666992188, -0.5185699462890625, -0.5015640258789062, -0.48455810546875, -0.46755218505859375, -0.4505462646484375, -0.43354034423828125, -0.416534423828125, -0.39952850341796875, -0.3825225830078125, -0.36551666259765625, -0.3485107421875, -0.33150482177734375, -0.3144989013671875, -0.29749298095703125, -0.280487060546875, -0.26348114013671875, -0.2464752197265625, -0.22946929931640625, -0.21246337890625, -0.19545745849609375, -0.1784515380859375, -0.16144561767578125, -0.144439697265625, -0.12743377685546875, -0.1104278564453125, -0.09342193603515625, -0.076416015625, -0.05941009521484375, -0.0424041748046875, -0.02539825439453125, -0.008392333984375, 0.00861358642578125, 0.0256195068359375, 0.04262542724609375, 0.05963134765625, 0.07663726806640625, 0.0936431884765625, 0.11064910888671875, 0.127655029296875, 0.14466094970703125, 0.1616668701171875, 0.17867279052734375, 0.1956787109375, 0.21268463134765625, 0.2296905517578125, 0.24669647216796875, 0.263702392578125, 0.28070831298828125, 0.2977142333984375, 0.31472015380859375, 0.33172607421875, 0.34873199462890625, 0.3657379150390625, 0.38274383544921875, 0.399749755859375, 0.41675567626953125, 0.4337615966796875, 0.45076751708984375, 0.4677734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 10.0, 8.0, 17.0, 23.0, 29.0, 62.0, 85.0, 132.0, 197.0, 364.0, 725.0, 1497.0, 3434.0, 9237.0, 35689.0, 3485323.0, 611064.0, 31635.0, 8481.0, 3145.0, 1408.0, 727.0, 385.0, 206.0, 123.0, 87.0, 55.0, 42.0, 23.0, 17.0, 9.0, 14.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.91339111328125, -2.8092041015625, -2.70501708984375, -2.600830078125, -2.49664306640625, -2.3924560546875, -2.28826904296875, -2.18408203125, -2.07989501953125, -1.9757080078125, -1.87152099609375, -1.767333984375, -1.66314697265625, -1.5589599609375, -1.45477294921875, -1.3505859375, -1.24639892578125, -1.1422119140625, -1.03802490234375, -0.933837890625, -0.82965087890625, -0.7254638671875, -0.62127685546875, -0.51708984375, -0.41290283203125, -0.3087158203125, -0.20452880859375, -0.100341796875, 0.00384521484375, 0.1080322265625, 0.21221923828125, 0.31640625, 0.42059326171875, 0.5247802734375, 0.62896728515625, 0.733154296875, 0.83734130859375, 0.9415283203125, 1.04571533203125, 1.14990234375, 1.25408935546875, 1.3582763671875, 1.46246337890625, 1.566650390625, 1.67083740234375, 1.7750244140625, 1.87921142578125, 1.9833984375, 2.08758544921875, 2.1917724609375, 2.29595947265625, 2.400146484375, 2.50433349609375, 2.6085205078125, 2.71270751953125, 2.81689453125, 2.92108154296875, 3.0252685546875, 3.12945556640625, 3.233642578125, 3.33782958984375, 3.4420166015625, 3.54620361328125, 3.650390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 10.0, 10.0, 23.0, 13.0, 26.0, 39.0, 73.0, 182.0, 3104.0, 338.0, 101.0, 65.0, 28.0, 15.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44287109375, -0.4249267578125, -0.406982421875, -0.3890380859375, -0.37109375, -0.3531494140625, -0.335205078125, -0.3172607421875, -0.29931640625, -0.2813720703125, -0.263427734375, -0.2454833984375, -0.2275390625, -0.2095947265625, -0.191650390625, -0.1737060546875, -0.15576171875, -0.1378173828125, -0.119873046875, -0.1019287109375, -0.083984375, -0.0660400390625, -0.048095703125, -0.0301513671875, -0.01220703125, 0.0057373046875, 0.023681640625, 0.0416259765625, 0.0595703125, 0.0775146484375, 0.095458984375, 0.1134033203125, 0.13134765625, 0.1492919921875, 0.167236328125, 0.1851806640625, 0.203125, 0.2210693359375, 0.239013671875, 0.2569580078125, 0.27490234375, 0.2928466796875, 0.310791015625, 0.3287353515625, 0.3466796875, 0.3646240234375, 0.382568359375, 0.4005126953125, 0.41845703125, 0.4364013671875, 0.454345703125, 0.4722900390625, 0.490234375, 0.5081787109375, 0.526123046875, 0.5440673828125, 0.56201171875, 0.5799560546875, 0.597900390625, 0.6158447265625, 0.6337890625, 0.6517333984375, 0.669677734375, 0.6876220703125, 0.70556640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 15.0, 23.0, 38.0, 51.0, 67.0, 85.0, 92.0, 87.0, 86.0, 93.0, 75.0, 61.0, 65.0, 36.0, 40.0, 22.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3268327713012695, -1.2658958435058594, -1.2049589157104492, -1.144021987915039, -1.0830851793289185, -1.0221482515335083, -0.9612113237380981, -0.900274395942688, -0.8393375277519226, -0.7784005999565125, -0.7174637317657471, -0.6565268039703369, -0.5955898761749268, -0.5346530079841614, -0.4737160801887512, -0.41277918219566345, -0.3518422842025757, -0.2909053862094879, -0.22996847331523895, -0.16903156042099, -0.10809466242790222, -0.04715776443481445, 0.013779163360595703, 0.07471606135368347, 0.13565295934677124, 0.196589857339859, 0.2575267553329468, 0.31846368312835693, 0.3794005811214447, 0.44033747911453247, 0.5012744069099426, 0.562211275100708, 0.6231482028961182, 0.6840851306915283, 0.7450219988822937, 0.8059589266777039, 0.8668957948684692, 0.9278327226638794, 0.9887696504592896, 1.0497065782546997, 1.1106433868408203, 1.1715803146362305, 1.2325172424316406, 1.2934541702270508, 1.3543909788131714, 1.4153279066085815, 1.4762648344039917, 1.5372017621994019, 1.598138689994812, 1.6590756177902222, 1.7200125455856323, 1.780949354171753, 1.841886281967163, 1.9028232097625732, 1.9637601375579834, 2.0246970653533936, 2.0856339931488037, 2.146570920944214, 2.207507848739624, 2.268444776535034, 2.3293817043304443, 2.3903183937072754, 2.4512553215026855, 2.5121922492980957, 2.573129177093506]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 7.0, 12.0, 9.0, 20.0, 18.0, 22.0, 31.0, 31.0, 37.0, 46.0, 39.0, 49.0, 45.0, 37.0, 38.0, 58.0, 55.0, 47.0, 34.0, 44.0, 28.0, 26.0, 37.0, 32.0, 23.0, 23.0, 24.0, 24.0, 12.0, 12.0, 14.0, 8.0, 13.0, 5.0, 3.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1505343914031982, -1.1135934591293335, -1.0766524076461792, -1.0397114753723145, -1.0027705430984497, -0.9658295512199402, -0.9288885593414307, -0.8919476270675659, -0.8550066351890564, -0.8180656433105469, -0.7811247110366821, -0.7441837191581726, -0.7072427272796631, -0.6703017950057983, -0.6333608031272888, -0.5964198112487793, -0.5594788789749146, -0.522537887096405, -0.4855969548225403, -0.44865596294403076, -0.41171500086784363, -0.3747740387916565, -0.337833046913147, -0.30089208483695984, -0.2639511227607727, -0.22701016068458557, -0.19006918370723724, -0.15312820672988892, -0.11618724465370178, -0.07924628257751465, -0.04230530560016632, -0.005364328622817993, 0.03157663345336914, 0.06851760298013687, 0.1054585725069046, 0.14239954948425293, 0.17934051156044006, 0.2162814736366272, 0.2532224655151367, 0.29016342759132385, 0.327104389667511, 0.3640453517436981, 0.40098631381988525, 0.4379273056983948, 0.4748682677745819, 0.511809229850769, 0.5487502217292786, 0.5856912136077881, 0.6226321458816528, 0.6595731377601624, 0.6965140700340271, 0.7334550619125366, 0.7703959941864014, 0.8073369860649109, 0.8442779779434204, 0.8812189102172852, 0.9181599020957947, 0.9551008939743042, 0.992041826248169, 1.0289827585220337, 1.065923810005188, 1.1028647422790527, 1.1398056745529175, 1.1767467260360718, 1.2136876583099365]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 11.0, 5.0, 20.0, 13.0, 26.0, 34.0, 78.0, 91.0, 192.0, 341.0, 654.0, 1536.0, 3506.0, 8647.0, 22349.0, 57896.0, 145612.0, 287022.0, 283748.0, 143748.0, 56804.0, 21428.0, 8372.0, 3412.0, 1515.0, 658.0, 356.0, 187.0, 109.0, 66.0, 38.0, 22.0, 13.0, 11.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.8525390625, -1.805023193359375, -1.75750732421875, -1.709991455078125, -1.6624755859375, -1.614959716796875, -1.56744384765625, -1.519927978515625, -1.472412109375, -1.424896240234375, -1.37738037109375, -1.329864501953125, -1.2823486328125, -1.234832763671875, -1.18731689453125, -1.139801025390625, -1.09228515625, -1.044769287109375, -0.99725341796875, -0.949737548828125, -0.9022216796875, -0.854705810546875, -0.80718994140625, -0.759674072265625, -0.712158203125, -0.664642333984375, -0.61712646484375, -0.569610595703125, -0.5220947265625, -0.474578857421875, -0.42706298828125, -0.379547119140625, -0.33203125, -0.284515380859375, -0.23699951171875, -0.189483642578125, -0.1419677734375, -0.094451904296875, -0.04693603515625, 0.000579833984375, 0.048095703125, 0.095611572265625, 0.14312744140625, 0.190643310546875, 0.2381591796875, 0.285675048828125, 0.33319091796875, 0.380706787109375, 0.42822265625, 0.475738525390625, 0.52325439453125, 0.570770263671875, 0.6182861328125, 0.665802001953125, 0.71331787109375, 0.760833740234375, 0.808349609375, 0.855865478515625, 0.90338134765625, 0.950897216796875, 0.9984130859375, 1.045928955078125, 1.09344482421875, 1.140960693359375, 1.1884765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 6.0, 9.0, 14.0, 14.0, 15.0, 25.0, 26.0, 27.0, 37.0, 30.0, 44.0, 57.0, 58.0, 55.0, 75.0, 63.0, 61.0, 59.0, 45.0, 35.0, 35.0, 37.0, 32.0, 31.0, 21.0, 12.0, 11.0, 10.0, 8.0, 5.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6729507446289062, -0.6540069580078125, -0.6350631713867188, -0.616119384765625, -0.5971755981445312, -0.5782318115234375, -0.5592880249023438, -0.54034423828125, -0.5214004516601562, -0.5024566650390625, -0.48351287841796875, -0.464569091796875, -0.44562530517578125, -0.4266815185546875, -0.40773773193359375, -0.3887939453125, -0.36985015869140625, -0.3509063720703125, -0.33196258544921875, -0.313018798828125, -0.29407501220703125, -0.2751312255859375, -0.25618743896484375, -0.23724365234375, -0.21829986572265625, -0.1993560791015625, -0.18041229248046875, -0.161468505859375, -0.14252471923828125, -0.1235809326171875, -0.10463714599609375, -0.085693359375, -0.06674957275390625, -0.0478057861328125, -0.02886199951171875, -0.009918212890625, 0.00902557373046875, 0.0279693603515625, 0.04691314697265625, 0.06585693359375, 0.08480072021484375, 0.1037445068359375, 0.12268829345703125, 0.141632080078125, 0.16057586669921875, 0.1795196533203125, 0.19846343994140625, 0.2174072265625, 0.23635101318359375, 0.2552947998046875, 0.27423858642578125, 0.293182373046875, 0.31212615966796875, 0.3310699462890625, 0.35001373291015625, 0.36895751953125, 0.38790130615234375, 0.4068450927734375, 0.42578887939453125, 0.444732666015625, 0.46367645263671875, 0.4826202392578125, 0.5015640258789062, 0.5205078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 14.0, 14.0, 16.0, 32.0, 38.0, 61.0, 86.0, 106.0, 160.0, 219.0, 316.0, 467.0, 781.0, 1309.0, 2999.0, 10517.0, 60934.0, 416820.0, 465301.0, 69614.0, 11840.0, 3162.0, 1396.0, 746.0, 483.0, 314.0, 225.0, 158.0, 120.0, 72.0, 53.0, 41.0, 28.0, 27.0, 20.0, 15.0, 14.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.28515625, -3.188629150390625, -3.09210205078125, -2.995574951171875, -2.8990478515625, -2.802520751953125, -2.70599365234375, -2.609466552734375, -2.512939453125, -2.416412353515625, -2.31988525390625, -2.223358154296875, -2.1268310546875, -2.030303955078125, -1.93377685546875, -1.837249755859375, -1.74072265625, -1.644195556640625, -1.54766845703125, -1.451141357421875, -1.3546142578125, -1.258087158203125, -1.16156005859375, -1.065032958984375, -0.968505859375, -0.871978759765625, -0.77545166015625, -0.678924560546875, -0.5823974609375, -0.485870361328125, -0.38934326171875, -0.292816162109375, -0.1962890625, -0.099761962890625, -0.00323486328125, 0.093292236328125, 0.1898193359375, 0.286346435546875, 0.38287353515625, 0.479400634765625, 0.575927734375, 0.672454833984375, 0.76898193359375, 0.865509033203125, 0.9620361328125, 1.058563232421875, 1.15509033203125, 1.251617431640625, 1.34814453125, 1.444671630859375, 1.54119873046875, 1.637725830078125, 1.7342529296875, 1.830780029296875, 1.92730712890625, 2.023834228515625, 2.120361328125, 2.216888427734375, 2.31341552734375, 2.409942626953125, 2.5064697265625, 2.602996826171875, 2.69952392578125, 2.796051025390625, 2.892578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 15.0, 9.0, 15.0, 11.0, 15.0, 23.0, 24.0, 26.0, 35.0, 39.0, 38.0, 51.0, 56.0, 54.0, 44.0, 51.0, 53.0, 48.0, 43.0, 40.0, 42.0, 40.0, 32.0, 32.0, 22.0, 24.0, 14.0, 16.0, 15.0, 13.0, 10.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.0595703125, -2.955078125, -2.8505859375, -2.74609375, -2.6416015625, -2.537109375, -2.4326171875, -2.328125, -2.2236328125, -2.119140625, -2.0146484375, -1.91015625, -1.8056640625, -1.701171875, -1.5966796875, -1.4921875, -1.3876953125, -1.283203125, -1.1787109375, -1.07421875, -0.9697265625, -0.865234375, -0.7607421875, -0.65625, -0.5517578125, -0.447265625, -0.3427734375, -0.23828125, -0.1337890625, -0.029296875, 0.0751953125, 0.1796875, 0.2841796875, 0.388671875, 0.4931640625, 0.59765625, 0.7021484375, 0.806640625, 0.9111328125, 1.015625, 1.1201171875, 1.224609375, 1.3291015625, 1.43359375, 1.5380859375, 1.642578125, 1.7470703125, 1.8515625, 1.9560546875, 2.060546875, 2.1650390625, 2.26953125, 2.3740234375, 2.478515625, 2.5830078125, 2.6875, 2.7919921875, 2.896484375, 3.0009765625, 3.10546875, 3.2099609375, 3.314453125, 3.4189453125, 3.5234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 7.0, 8.0, 19.0, 7.0, 36.0, 30.0, 49.0, 70.0, 129.0, 181.0, 292.0, 623.0, 1453.0, 4012.0, 14539.0, 69398.0, 404337.0, 452434.0, 77470.0, 16072.0, 4267.0, 1552.0, 659.0, 320.0, 208.0, 101.0, 76.0, 51.0, 46.0, 23.0, 23.0, 13.0, 14.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4039764404296875, -1.358734130859375, -1.3134918212890625, -1.26824951171875, -1.2230072021484375, -1.177764892578125, -1.1325225830078125, -1.0872802734375, -1.0420379638671875, -0.996795654296875, -0.9515533447265625, -0.90631103515625, -0.8610687255859375, -0.815826416015625, -0.7705841064453125, -0.725341796875, -0.6800994873046875, -0.634857177734375, -0.5896148681640625, -0.54437255859375, -0.4991302490234375, -0.453887939453125, -0.4086456298828125, -0.3634033203125, -0.3181610107421875, -0.272918701171875, -0.2276763916015625, -0.18243408203125, -0.1371917724609375, -0.091949462890625, -0.0467071533203125, -0.00146484375, 0.0437774658203125, 0.089019775390625, 0.1342620849609375, 0.17950439453125, 0.2247467041015625, 0.269989013671875, 0.3152313232421875, 0.3604736328125, 0.4057159423828125, 0.450958251953125, 0.4962005615234375, 0.54144287109375, 0.5866851806640625, 0.631927490234375, 0.6771697998046875, 0.722412109375, 0.7676544189453125, 0.812896728515625, 0.8581390380859375, 0.90338134765625, 0.9486236572265625, 0.993865966796875, 1.0391082763671875, 1.0843505859375, 1.1295928955078125, 1.174835205078125, 1.2200775146484375, 1.26531982421875, 1.3105621337890625, 1.355804443359375, 1.4010467529296875, 1.4462890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 12.0, 19.0, 13.0, 16.0, 29.0, 37.0, 56.0, 61.0, 72.0, 86.0, 77.0, 91.0, 70.0, 79.0, 49.0, 36.0, 38.0, 24.0, 32.0, 18.0, 15.0, 14.0, 8.0, 7.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000194549560546875, -0.00018706917762756348, -0.00017958879470825195, -0.00017210841178894043, -0.0001646280288696289, -0.00015714764595031738, -0.00014966726303100586, -0.00014218688011169434, -0.0001347064971923828, -0.0001272261142730713, -0.00011974573135375977, -0.00011226534843444824, -0.00010478496551513672, -9.73045825958252e-05, -8.982419967651367e-05, -8.234381675720215e-05, -7.486343383789062e-05, -6.73830509185791e-05, -5.990266799926758e-05, -5.2422285079956055e-05, -4.494190216064453e-05, -3.746151924133301e-05, -2.9981136322021484e-05, -2.250075340270996e-05, -1.5020370483398438e-05, -7.539987564086914e-06, -5.960464477539063e-08, 7.420778274536133e-06, 1.4901161193847656e-05, 2.238154411315918e-05, 2.9861927032470703e-05, 3.7342309951782227e-05, 4.482269287109375e-05, 5.2303075790405273e-05, 5.97834587097168e-05, 6.726384162902832e-05, 7.474422454833984e-05, 8.222460746765137e-05, 8.970499038696289e-05, 9.718537330627441e-05, 0.00010466575622558594, 0.00011214613914489746, 0.00011962652206420898, 0.0001271069049835205, 0.00013458728790283203, 0.00014206767082214355, 0.00014954805374145508, 0.0001570284366607666, 0.00016450881958007812, 0.00017198920249938965, 0.00017946958541870117, 0.0001869499683380127, 0.00019443035125732422, 0.00020191073417663574, 0.00020939111709594727, 0.0002168715000152588, 0.0002243518829345703, 0.00023183226585388184, 0.00023931264877319336, 0.0002467930316925049, 0.0002542734146118164, 0.00026175379753112793, 0.00026923418045043945, 0.000276714563369751, 0.0002841949462890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 17.0, 15.0, 27.0, 25.0, 62.0, 70.0, 114.0, 211.0, 388.0, 753.0, 1816.0, 5816.0, 33446.0, 379908.0, 562846.0, 51291.0, 7676.0, 2144.0, 857.0, 430.0, 248.0, 123.0, 98.0, 42.0, 30.0, 22.0, 17.0, 12.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.115234375, -2.054962158203125, -1.99468994140625, -1.934417724609375, -1.8741455078125, -1.813873291015625, -1.75360107421875, -1.693328857421875, -1.633056640625, -1.572784423828125, -1.51251220703125, -1.452239990234375, -1.3919677734375, -1.331695556640625, -1.27142333984375, -1.211151123046875, -1.15087890625, -1.090606689453125, -1.03033447265625, -0.970062255859375, -0.9097900390625, -0.849517822265625, -0.78924560546875, -0.728973388671875, -0.668701171875, -0.608428955078125, -0.54815673828125, -0.487884521484375, -0.4276123046875, -0.367340087890625, -0.30706787109375, -0.246795654296875, -0.1865234375, -0.126251220703125, -0.06597900390625, -0.005706787109375, 0.0545654296875, 0.114837646484375, 0.17510986328125, 0.235382080078125, 0.295654296875, 0.355926513671875, 0.41619873046875, 0.476470947265625, 0.5367431640625, 0.597015380859375, 0.65728759765625, 0.717559814453125, 0.77783203125, 0.838104248046875, 0.89837646484375, 0.958648681640625, 1.0189208984375, 1.079193115234375, 1.13946533203125, 1.199737548828125, 1.260009765625, 1.320281982421875, 1.38055419921875, 1.440826416015625, 1.5010986328125, 1.561370849609375, 1.62164306640625, 1.681915283203125, 1.7421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 14.0, 17.0, 26.0, 36.0, 49.0, 43.0, 72.0, 71.0, 80.0, 89.0, 93.0, 72.0, 61.0, 53.0, 36.0, 39.0, 25.0, 21.0, 15.0, 12.0, 10.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.662109375, -1.6167755126953125, -1.571441650390625, -1.5261077880859375, -1.48077392578125, -1.4354400634765625, -1.390106201171875, -1.3447723388671875, -1.2994384765625, -1.2541046142578125, -1.208770751953125, -1.1634368896484375, -1.11810302734375, -1.0727691650390625, -1.027435302734375, -0.9821014404296875, -0.936767578125, -0.8914337158203125, -0.846099853515625, -0.8007659912109375, -0.75543212890625, -0.7100982666015625, -0.664764404296875, -0.6194305419921875, -0.5740966796875, -0.5287628173828125, -0.483428955078125, -0.4380950927734375, -0.39276123046875, -0.3474273681640625, -0.302093505859375, -0.2567596435546875, -0.21142578125, -0.1660919189453125, -0.120758056640625, -0.0754241943359375, -0.03009033203125, 0.0152435302734375, 0.060577392578125, 0.1059112548828125, 0.1512451171875, 0.1965789794921875, 0.241912841796875, 0.2872467041015625, 0.33258056640625, 0.3779144287109375, 0.423248291015625, 0.4685821533203125, 0.513916015625, 0.5592498779296875, 0.604583740234375, 0.6499176025390625, 0.69525146484375, 0.7405853271484375, 0.785919189453125, 0.8312530517578125, 0.8765869140625, 0.9219207763671875, 0.967254638671875, 1.0125885009765625, 1.05792236328125, 1.1032562255859375, 1.148590087890625, 1.1939239501953125, 1.2392578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 40.0, 127.0, 253.0, 315.0, 164.0, 67.0, 17.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.206470489501953, -14.763477325439453, -13.32048511505127, -11.877492904663086, -10.434499740600586, -8.991506576538086, -7.548514366149902, -6.105522155761719, -4.662528991699219, -3.219536304473877, -1.7765436172485352, -0.33355093002319336, 1.1094417572021484, 2.5524344444274902, 3.995427131652832, 5.438419342041016, 6.881412506103516, 8.324405670166016, 9.7673978805542, 11.210390090942383, 12.653383255004883, 14.096376419067383, 15.539368629455566, 16.98236083984375, 18.42535400390625, 19.86834716796875, 21.31134033203125, 22.754331588745117, 24.197324752807617, 25.640317916870117, 27.083309173583984, 28.526302337646484, 29.96929168701172, 31.41228485107422, 32.85527801513672, 34.29827117919922, 35.74126434326172, 37.18425369262695, 38.62724685668945, 40.07024002075195, 41.51323318481445, 42.95622634887695, 44.39921951293945, 45.84221267700195, 47.28520202636719, 48.72819519042969, 50.17118835449219, 51.61418151855469, 53.05717468261719, 54.50016784667969, 55.94316101074219, 57.38615417480469, 58.82914733886719, 60.27213668823242, 61.71512985229492, 63.15812301635742, 64.60111999511719, 66.04411315917969, 67.48710632324219, 68.93009948730469, 70.37309265136719, 71.81608581542969, 73.25907897949219, 74.70207214355469, 76.14505767822266]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 7.0, 11.0, 9.0, 19.0, 11.0, 20.0, 20.0, 23.0, 22.0, 36.0, 39.0, 41.0, 43.0, 57.0, 44.0, 61.0, 47.0, 50.0, 43.0, 53.0, 44.0, 40.0, 36.0, 27.0, 26.0, 25.0, 25.0, 20.0, 26.0, 14.0, 8.0, 6.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.999813079833984, -16.508935928344727, -16.018056869506836, -15.527179718017578, -15.036301612854004, -14.54542350769043, -14.054546356201172, -13.563668251037598, -13.072790145874023, -12.58191204071045, -12.091034889221191, -11.600156784057617, -11.109278678894043, -10.618400573730469, -10.127523422241211, -9.636645317077637, -9.145768165588379, -8.654890060424805, -8.164012908935547, -7.673134803771973, -7.182256698608398, -6.691379070281982, -6.200501441955566, -5.709623336791992, -5.218745708465576, -4.72786808013916, -4.236989974975586, -3.74611234664917, -3.255234479904175, -2.7643566131591797, -2.2734789848327637, -1.7826011180877686, -1.2917232513427734, -0.8008454442024231, -0.30996763706207275, 0.1809101104736328, 0.6717879772186279, 1.162665843963623, 1.653543472290039, 2.144421339035034, 2.6352992057800293, 3.1261770725250244, 3.6170549392700195, 4.1079325675964355, 4.598810195922852, 5.089688301086426, 5.580565929412842, 6.071443557739258, 6.562321662902832, 7.053199291229248, 7.544077396392822, 8.034955024719238, 8.525833129882812, 9.01671028137207, 9.507588386535645, 9.998466491699219, 10.489343643188477, 10.98022174835205, 11.471098899841309, 11.961977005004883, 12.452855110168457, 12.943733215332031, 13.434610366821289, 13.925488471984863, 14.416366577148438]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 2.0, 8.0, 10.0, 15.0, 31.0, 30.0, 63.0, 102.0, 111.0, 221.0, 351.0, 603.0, 1168.0, 2464.0, 5984.0, 19345.0, 147975.0, 3948504.0, 48670.0, 10969.0, 3912.0, 1757.0, 818.0, 444.0, 280.0, 147.0, 123.0, 66.0, 26.0, 31.0, 9.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.74609375, -2.6553955078125, -2.564697265625, -2.4739990234375, -2.38330078125, -2.2926025390625, -2.201904296875, -2.1112060546875, -2.0205078125, -1.9298095703125, -1.839111328125, -1.7484130859375, -1.65771484375, -1.5670166015625, -1.476318359375, -1.3856201171875, -1.294921875, -1.2042236328125, -1.113525390625, -1.0228271484375, -0.93212890625, -0.8414306640625, -0.750732421875, -0.6600341796875, -0.5693359375, -0.4786376953125, -0.387939453125, -0.2972412109375, -0.20654296875, -0.1158447265625, -0.025146484375, 0.0655517578125, 0.15625, 0.2469482421875, 0.337646484375, 0.4283447265625, 0.51904296875, 0.6097412109375, 0.700439453125, 0.7911376953125, 0.8818359375, 0.9725341796875, 1.063232421875, 1.1539306640625, 1.24462890625, 1.3353271484375, 1.426025390625, 1.5167236328125, 1.607421875, 1.6981201171875, 1.788818359375, 1.8795166015625, 1.97021484375, 2.0609130859375, 2.151611328125, 2.2423095703125, 2.3330078125, 2.4237060546875, 2.514404296875, 2.6051025390625, 2.69580078125, 2.7864990234375, 2.877197265625, 2.9678955078125, 3.05859375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 5.0, 5.0, 14.0, 9.0, 12.0, 11.0, 13.0, 16.0, 22.0, 34.0, 34.0, 45.0, 49.0, 79.0, 73.0, 57.0, 65.0, 70.0, 73.0, 56.0, 53.0, 52.0, 35.0, 23.0, 19.0, 16.0, 14.0, 9.0, 10.0, 4.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92236328125, -0.8979415893554688, -0.8735198974609375, -0.8490982055664062, -0.824676513671875, -0.8002548217773438, -0.7758331298828125, -0.7514114379882812, -0.72698974609375, -0.7025680541992188, -0.6781463623046875, -0.6537246704101562, -0.629302978515625, -0.6048812866210938, -0.5804595947265625, -0.5560379028320312, -0.5316162109375, -0.5071945190429688, -0.4827728271484375, -0.45835113525390625, -0.433929443359375, -0.40950775146484375, -0.3850860595703125, -0.36066436767578125, -0.33624267578125, -0.31182098388671875, -0.2873992919921875, -0.26297760009765625, -0.238555908203125, -0.21413421630859375, -0.1897125244140625, -0.16529083251953125, -0.140869140625, -0.11644744873046875, -0.0920257568359375, -0.06760406494140625, -0.043182373046875, -0.01876068115234375, 0.0056610107421875, 0.03008270263671875, 0.05450439453125, 0.07892608642578125, 0.1033477783203125, 0.12776947021484375, 0.152191162109375, 0.17661285400390625, 0.2010345458984375, 0.22545623779296875, 0.2498779296875, 0.27429962158203125, 0.2987213134765625, 0.32314300537109375, 0.347564697265625, 0.37198638916015625, 0.3964080810546875, 0.42082977294921875, 0.44525146484375, 0.46967315673828125, 0.4940948486328125, 0.5185165405273438, 0.542938232421875, 0.5673599243164062, 0.5917816162109375, 0.6162033081054688, 0.640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 8.0, 5.0, 9.0, 7.0, 9.0, 14.0, 10.0, 23.0, 21.0, 48.0, 70.0, 82.0, 101.0, 154.0, 239.0, 375.0, 633.0, 1124.0, 2258.0, 4673.0, 10614.0, 32282.0, 185008.0, 3813200.0, 103163.0, 23651.0, 8250.0, 3745.0, 1854.0, 988.0, 576.0, 343.0, 209.0, 118.0, 100.0, 86.0, 61.0, 39.0, 31.0, 26.0, 24.0, 12.0, 12.0, 8.0, 10.0, 6.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.31488037109375, -2.2410888671875, -2.16729736328125, -2.093505859375, -2.01971435546875, -1.9459228515625, -1.87213134765625, -1.79833984375, -1.72454833984375, -1.6507568359375, -1.57696533203125, -1.503173828125, -1.42938232421875, -1.3555908203125, -1.28179931640625, -1.2080078125, -1.13421630859375, -1.0604248046875, -0.98663330078125, -0.912841796875, -0.83905029296875, -0.7652587890625, -0.69146728515625, -0.61767578125, -0.54388427734375, -0.4700927734375, -0.39630126953125, -0.322509765625, -0.24871826171875, -0.1749267578125, -0.10113525390625, -0.02734375, 0.04644775390625, 0.1202392578125, 0.19403076171875, 0.267822265625, 0.34161376953125, 0.4154052734375, 0.48919677734375, 0.56298828125, 0.63677978515625, 0.7105712890625, 0.78436279296875, 0.858154296875, 0.93194580078125, 1.0057373046875, 1.07952880859375, 1.1533203125, 1.22711181640625, 1.3009033203125, 1.37469482421875, 1.448486328125, 1.52227783203125, 1.5960693359375, 1.66986083984375, 1.74365234375, 1.81744384765625, 1.8912353515625, 1.96502685546875, 2.038818359375, 2.11260986328125, 2.1864013671875, 2.26019287109375, 2.333984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 8.0, 2.0, 5.0, 6.0, 12.0, 29.0, 26.0, 49.0, 90.0, 174.0, 924.0, 2409.0, 143.0, 70.0, 38.0, 30.0, 14.0, 9.0, 5.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7744140625, -0.75506591796875, -0.7357177734375, -0.71636962890625, -0.697021484375, -0.67767333984375, -0.6583251953125, -0.63897705078125, -0.61962890625, -0.60028076171875, -0.5809326171875, -0.56158447265625, -0.542236328125, -0.52288818359375, -0.5035400390625, -0.48419189453125, -0.46484375, -0.44549560546875, -0.4261474609375, -0.40679931640625, -0.387451171875, -0.36810302734375, -0.3487548828125, -0.32940673828125, -0.31005859375, -0.29071044921875, -0.2713623046875, -0.25201416015625, -0.232666015625, -0.21331787109375, -0.1939697265625, -0.17462158203125, -0.1552734375, -0.13592529296875, -0.1165771484375, -0.09722900390625, -0.077880859375, -0.05853271484375, -0.0391845703125, -0.01983642578125, -0.00048828125, 0.01885986328125, 0.0382080078125, 0.05755615234375, 0.076904296875, 0.09625244140625, 0.1156005859375, 0.13494873046875, 0.154296875, 0.17364501953125, 0.1929931640625, 0.21234130859375, 0.231689453125, 0.25103759765625, 0.2703857421875, 0.28973388671875, 0.30908203125, 0.32843017578125, 0.3477783203125, 0.36712646484375, 0.386474609375, 0.40582275390625, 0.4251708984375, 0.44451904296875, 0.4638671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 6.0, 12.0, 24.0, 39.0, 52.0, 88.0, 89.0, 123.0, 143.0, 114.0, 101.0, 82.0, 52.0, 30.0, 20.0, 9.0, 7.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.143301010131836, -5.041082859039307, -4.938864231109619, -4.83664608001709, -4.734427452087402, -4.632209300994873, -4.529991149902344, -4.427772521972656, -4.325554370880127, -4.223336219787598, -4.12111759185791, -4.018899440765381, -3.9166810512542725, -3.814462661743164, -3.7122442722320557, -3.6100258827209473, -3.507807731628418, -3.4055893421173096, -3.303370952606201, -3.201152801513672, -3.0989344120025635, -2.996716022491455, -2.8944976329803467, -2.7922792434692383, -2.69006085395813, -2.5878424644470215, -2.485624074935913, -2.383405923843384, -2.2811875343322754, -2.178969144821167, -2.0767507553100586, -1.9745324850082397, -1.872314214706421, -1.7700958251953125, -1.6678775548934937, -1.5656591653823853, -1.4634408950805664, -1.361222505569458, -1.2590041160583496, -1.1567858457565308, -1.054567575454712, -0.9523492455482483, -0.8501309156417847, -0.7479125261306763, -0.6456942558288574, -0.543475866317749, -0.4412575364112854, -0.3390392065048218, -0.23682081699371338, -0.13460248708724976, -0.03238414227962494, 0.06983420252799988, 0.1720525324344635, 0.2742708921432495, 0.37648922204971313, 0.47870755195617676, 0.5809258818626404, 0.683144211769104, 0.7853625416755676, 0.8875808715820312, 0.9897992610931396, 1.092017650604248, 1.194235920906067, 1.2964541912078857, 1.3986725807189941]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 5.0, 11.0, 13.0, 10.0, 10.0, 11.0, 18.0, 26.0, 20.0, 32.0, 44.0, 38.0, 45.0, 42.0, 34.0, 44.0, 41.0, 41.0, 42.0, 37.0, 45.0, 39.0, 33.0, 38.0, 33.0, 36.0, 25.0, 27.0, 27.0, 20.0, 24.0, 19.0, 16.0, 10.0, 7.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.382106065750122, -1.3313755989074707, -1.2806451320648193, -1.229914665222168, -1.1791841983795166, -1.1284537315368652, -1.0777232646942139, -1.0269927978515625, -0.9762623906135559, -0.9255319237709045, -0.8748014569282532, -0.8240710496902466, -0.7733405828475952, -0.7226101160049438, -0.6718796491622925, -0.6211491823196411, -0.5704187154769897, -0.5196882486343384, -0.468957781791687, -0.41822734475135803, -0.36749687790870667, -0.3167664110660553, -0.2660359740257263, -0.21530550718307495, -0.16457504034042358, -0.11384458094835281, -0.06311412155628204, -0.01238366961479187, 0.0383467972278595, 0.08907726407051086, 0.13980770111083984, 0.1905381679534912, 0.24126863479614258, 0.29199910163879395, 0.3427295684814453, 0.3934600055217743, 0.44419047236442566, 0.494920939207077, 0.545651376247406, 0.5963818430900574, 0.6471123099327087, 0.6978427767753601, 0.7485732436180115, 0.7993036508560181, 0.8500341176986694, 0.9007645845413208, 0.9514950513839722, 1.0022255182266235, 1.052955985069275, 1.1036864519119263, 1.1544169187545776, 1.205147385597229, 1.2558778524398804, 1.3066083192825317, 1.3573386669158936, 1.408069133758545, 1.4587996006011963, 1.5095300674438477, 1.560260534286499, 1.6109910011291504, 1.6617214679718018, 1.7124519348144531, 1.7631824016571045, 1.8139128684997559, 1.8646433353424072]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 21.0, 20.0, 28.0, 50.0, 77.0, 113.0, 165.0, 296.0, 455.0, 723.0, 1244.0, 2395.0, 4315.0, 8394.0, 17226.0, 35427.0, 73117.0, 141707.0, 225872.0, 232150.0, 150757.0, 78511.0, 37778.0, 18334.0, 8951.0, 4587.0, 2462.0, 1362.0, 721.0, 479.0, 281.0, 183.0, 115.0, 70.0, 56.0, 30.0, 14.0, 15.0, 15.0, 9.0, 9.0, 6.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78564453125, -0.7565994262695312, -0.7275543212890625, -0.6985092163085938, -0.669464111328125, -0.6404190063476562, -0.6113739013671875, -0.5823287963867188, -0.55328369140625, -0.5242385864257812, -0.4951934814453125, -0.46614837646484375, -0.437103271484375, -0.40805816650390625, -0.3790130615234375, -0.34996795654296875, -0.3209228515625, -0.29187774658203125, -0.2628326416015625, -0.23378753662109375, -0.204742431640625, -0.17569732666015625, -0.1466522216796875, -0.11760711669921875, -0.08856201171875, -0.05951690673828125, -0.0304718017578125, -0.00142669677734375, 0.027618408203125, 0.05666351318359375, 0.0857086181640625, 0.11475372314453125, 0.143798828125, 0.17284393310546875, 0.2018890380859375, 0.23093414306640625, 0.259979248046875, 0.28902435302734375, 0.3180694580078125, 0.34711456298828125, 0.37615966796875, 0.40520477294921875, 0.4342498779296875, 0.46329498291015625, 0.492340087890625, 0.5213851928710938, 0.5504302978515625, 0.5794754028320312, 0.6085205078125, 0.6375656127929688, 0.6666107177734375, 0.6956558227539062, 0.724700927734375, 0.7537460327148438, 0.7827911376953125, 0.8118362426757812, 0.84088134765625, 0.8699264526367188, 0.8989715576171875, 0.9280166625976562, 0.957061767578125, 0.9861068725585938, 1.0151519775390625, 1.0441970825195312, 1.0732421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 8.0, 11.0, 12.0, 14.0, 17.0, 23.0, 27.0, 22.0, 30.0, 43.0, 42.0, 60.0, 60.0, 63.0, 72.0, 75.0, 65.0, 63.0, 48.0, 53.0, 40.0, 36.0, 20.0, 12.0, 14.0, 15.0, 12.0, 8.0, 3.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.00390625, -0.9789276123046875, -0.953948974609375, -0.9289703369140625, -0.90399169921875, -0.8790130615234375, -0.854034423828125, -0.8290557861328125, -0.8040771484375, -0.7790985107421875, -0.754119873046875, -0.7291412353515625, -0.70416259765625, -0.6791839599609375, -0.654205322265625, -0.6292266845703125, -0.604248046875, -0.5792694091796875, -0.554290771484375, -0.5293121337890625, -0.50433349609375, -0.4793548583984375, -0.454376220703125, -0.4293975830078125, -0.4044189453125, -0.3794403076171875, -0.354461669921875, -0.3294830322265625, -0.30450439453125, -0.2795257568359375, -0.254547119140625, -0.2295684814453125, -0.20458984375, -0.1796112060546875, -0.154632568359375, -0.1296539306640625, -0.10467529296875, -0.0796966552734375, -0.054718017578125, -0.0297393798828125, -0.0047607421875, 0.0202178955078125, 0.045196533203125, 0.0701751708984375, 0.09515380859375, 0.1201324462890625, 0.145111083984375, 0.1700897216796875, 0.195068359375, 0.2200469970703125, 0.245025634765625, 0.2700042724609375, 0.29498291015625, 0.3199615478515625, 0.344940185546875, 0.3699188232421875, 0.3948974609375, 0.4198760986328125, 0.444854736328125, 0.4698333740234375, 0.49481201171875, 0.5197906494140625, 0.544769287109375, 0.5697479248046875, 0.5947265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 27.0, 25.0, 54.0, 79.0, 107.0, 191.0, 302.0, 453.0, 874.0, 1647.0, 4692.0, 34239.0, 565038.0, 409218.0, 24319.0, 3930.0, 1420.0, 743.0, 393.0, 262.0, 172.0, 106.0, 67.0, 48.0, 30.0, 18.0, 20.0, 16.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.548828125, -3.43768310546875, -3.3265380859375, -3.21539306640625, -3.104248046875, -2.99310302734375, -2.8819580078125, -2.77081298828125, -2.65966796875, -2.54852294921875, -2.4373779296875, -2.32623291015625, -2.215087890625, -2.10394287109375, -1.9927978515625, -1.88165283203125, -1.7705078125, -1.65936279296875, -1.5482177734375, -1.43707275390625, -1.325927734375, -1.21478271484375, -1.1036376953125, -0.99249267578125, -0.88134765625, -0.77020263671875, -0.6590576171875, -0.54791259765625, -0.436767578125, -0.32562255859375, -0.2144775390625, -0.10333251953125, 0.0078125, 0.11895751953125, 0.2301025390625, 0.34124755859375, 0.452392578125, 0.56353759765625, 0.6746826171875, 0.78582763671875, 0.89697265625, 1.00811767578125, 1.1192626953125, 1.23040771484375, 1.341552734375, 1.45269775390625, 1.5638427734375, 1.67498779296875, 1.7861328125, 1.89727783203125, 2.0084228515625, 2.11956787109375, 2.230712890625, 2.34185791015625, 2.4530029296875, 2.56414794921875, 2.67529296875, 2.78643798828125, 2.8975830078125, 3.00872802734375, 3.119873046875, 3.23101806640625, 3.3421630859375, 3.45330810546875, 3.564453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 12.0, 19.0, 16.0, 16.0, 24.0, 23.0, 31.0, 37.0, 55.0, 46.0, 47.0, 59.0, 42.0, 48.0, 49.0, 52.0, 53.0, 39.0, 48.0, 54.0, 40.0, 25.0, 21.0, 27.0, 10.0, 12.0, 8.0, 12.0, 8.0, 11.0, 8.0, 2.0, 3.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46484375, -3.353057861328125, -3.24127197265625, -3.129486083984375, -3.0177001953125, -2.905914306640625, -2.79412841796875, -2.682342529296875, -2.570556640625, -2.458770751953125, -2.34698486328125, -2.235198974609375, -2.1234130859375, -2.011627197265625, -1.89984130859375, -1.788055419921875, -1.67626953125, -1.564483642578125, -1.45269775390625, -1.340911865234375, -1.2291259765625, -1.117340087890625, -1.00555419921875, -0.893768310546875, -0.781982421875, -0.670196533203125, -0.55841064453125, -0.446624755859375, -0.3348388671875, -0.223052978515625, -0.11126708984375, 0.000518798828125, 0.1123046875, 0.224090576171875, 0.33587646484375, 0.447662353515625, 0.5594482421875, 0.671234130859375, 0.78302001953125, 0.894805908203125, 1.006591796875, 1.118377685546875, 1.23016357421875, 1.341949462890625, 1.4537353515625, 1.565521240234375, 1.67730712890625, 1.789093017578125, 1.90087890625, 2.012664794921875, 2.12445068359375, 2.236236572265625, 2.3480224609375, 2.459808349609375, 2.57159423828125, 2.683380126953125, 2.795166015625, 2.906951904296875, 3.01873779296875, 3.130523681640625, 3.2423095703125, 3.354095458984375, 3.46588134765625, 3.577667236328125, 3.689453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 3.0, 5.0, 13.0, 11.0, 14.0, 19.0, 33.0, 62.0, 72.0, 142.0, 254.0, 413.0, 955.0, 3179.0, 20751.0, 467024.0, 527129.0, 23033.0, 3310.0, 1021.0, 436.0, 230.0, 140.0, 85.0, 45.0, 32.0, 31.0, 15.0, 22.0, 12.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.849609375, -1.783599853515625, -1.71759033203125, -1.651580810546875, -1.5855712890625, -1.519561767578125, -1.45355224609375, -1.387542724609375, -1.321533203125, -1.255523681640625, -1.18951416015625, -1.123504638671875, -1.0574951171875, -0.991485595703125, -0.92547607421875, -0.859466552734375, -0.79345703125, -0.727447509765625, -0.66143798828125, -0.595428466796875, -0.5294189453125, -0.463409423828125, -0.39739990234375, -0.331390380859375, -0.265380859375, -0.199371337890625, -0.13336181640625, -0.067352294921875, -0.0013427734375, 0.064666748046875, 0.13067626953125, 0.196685791015625, 0.2626953125, 0.328704833984375, 0.39471435546875, 0.460723876953125, 0.5267333984375, 0.592742919921875, 0.65875244140625, 0.724761962890625, 0.790771484375, 0.856781005859375, 0.92279052734375, 0.988800048828125, 1.0548095703125, 1.120819091796875, 1.18682861328125, 1.252838134765625, 1.31884765625, 1.384857177734375, 1.45086669921875, 1.516876220703125, 1.5828857421875, 1.648895263671875, 1.71490478515625, 1.780914306640625, 1.846923828125, 1.912933349609375, 1.97894287109375, 2.044952392578125, 2.1109619140625, 2.176971435546875, 2.24298095703125, 2.308990478515625, 2.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 12.0, 12.0, 14.0, 12.0, 19.0, 30.0, 36.0, 32.0, 48.0, 46.0, 50.0, 87.0, 89.0, 73.0, 88.0, 78.0, 59.0, 36.0, 45.0, 29.0, 28.0, 18.0, 15.0, 12.0, 6.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018835067749023438, -0.00018247216939926147, -0.00017659366130828857, -0.00017071515321731567, -0.00016483664512634277, -0.00015895813703536987, -0.00015307962894439697, -0.00014720112085342407, -0.00014132261276245117, -0.00013544410467147827, -0.00012956559658050537, -0.00012368708848953247, -0.00011780858039855957, -0.00011193007230758667, -0.00010605156421661377, -0.00010017305612564087, -9.429454803466797e-05, -8.841603994369507e-05, -8.253753185272217e-05, -7.665902376174927e-05, -7.078051567077637e-05, -6.490200757980347e-05, -5.9023499488830566e-05, -5.3144991397857666e-05, -4.7266483306884766e-05, -4.1387975215911865e-05, -3.5509467124938965e-05, -2.9630959033966064e-05, -2.3752450942993164e-05, -1.7873942852020264e-05, -1.1995434761047363e-05, -6.116926670074463e-06, -2.384185791015625e-07, 5.640089511871338e-06, 1.1518597602844238e-05, 1.739710569381714e-05, 2.327561378479004e-05, 2.915412187576294e-05, 3.503262996673584e-05, 4.091113805770874e-05, 4.678964614868164e-05, 5.266815423965454e-05, 5.854666233062744e-05, 6.442517042160034e-05, 7.030367851257324e-05, 7.618218660354614e-05, 8.206069469451904e-05, 8.793920278549194e-05, 9.381771087646484e-05, 9.969621896743774e-05, 0.00010557472705841064, 0.00011145323514938354, 0.00011733174324035645, 0.00012321025133132935, 0.00012908875942230225, 0.00013496726751327515, 0.00014084577560424805, 0.00014672428369522095, 0.00015260279178619385, 0.00015848129987716675, 0.00016435980796813965, 0.00017023831605911255, 0.00017611682415008545, 0.00018199533224105835, 0.00018787384033203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 12.0, 18.0, 22.0, 36.0, 66.0, 96.0, 181.0, 409.0, 1023.0, 3811.0, 45000.0, 911474.0, 79392.0, 4867.0, 1191.0, 437.0, 204.0, 94.0, 77.0, 46.0, 24.0, 23.0, 14.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.69921875, -3.605743408203125, -3.51226806640625, -3.418792724609375, -3.3253173828125, -3.231842041015625, -3.13836669921875, -3.044891357421875, -2.951416015625, -2.857940673828125, -2.76446533203125, -2.670989990234375, -2.5775146484375, -2.484039306640625, -2.39056396484375, -2.297088623046875, -2.20361328125, -2.110137939453125, -2.01666259765625, -1.923187255859375, -1.8297119140625, -1.736236572265625, -1.64276123046875, -1.549285888671875, -1.455810546875, -1.362335205078125, -1.26885986328125, -1.175384521484375, -1.0819091796875, -0.988433837890625, -0.89495849609375, -0.801483154296875, -0.7080078125, -0.614532470703125, -0.52105712890625, -0.427581787109375, -0.3341064453125, -0.240631103515625, -0.14715576171875, -0.053680419921875, 0.039794921875, 0.133270263671875, 0.22674560546875, 0.320220947265625, 0.4136962890625, 0.507171630859375, 0.60064697265625, 0.694122314453125, 0.78759765625, 0.881072998046875, 0.97454833984375, 1.068023681640625, 1.1614990234375, 1.254974365234375, 1.34844970703125, 1.441925048828125, 1.535400390625, 1.628875732421875, 1.72235107421875, 1.815826416015625, 1.9093017578125, 2.002777099609375, 2.09625244140625, 2.189727783203125, 2.283203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 12.0, 17.0, 35.0, 31.0, 40.0, 43.0, 58.0, 73.0, 90.0, 85.0, 81.0, 81.0, 78.0, 65.0, 46.0, 30.0, 28.0, 16.0, 10.0, 11.0, 12.0, 12.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.234375, -1.1913909912109375, -1.148406982421875, -1.1054229736328125, -1.06243896484375, -1.0194549560546875, -0.976470947265625, -0.9334869384765625, -0.8905029296875, -0.8475189208984375, -0.804534912109375, -0.7615509033203125, -0.71856689453125, -0.6755828857421875, -0.632598876953125, -0.5896148681640625, -0.546630859375, -0.5036468505859375, -0.460662841796875, -0.4176788330078125, -0.37469482421875, -0.3317108154296875, -0.288726806640625, -0.2457427978515625, -0.2027587890625, -0.1597747802734375, -0.116790771484375, -0.0738067626953125, -0.03082275390625, 0.0121612548828125, 0.055145263671875, 0.0981292724609375, 0.14111328125, 0.1840972900390625, 0.227081298828125, 0.2700653076171875, 0.31304931640625, 0.3560333251953125, 0.399017333984375, 0.4420013427734375, 0.4849853515625, 0.5279693603515625, 0.570953369140625, 0.6139373779296875, 0.65692138671875, 0.6999053955078125, 0.742889404296875, 0.7858734130859375, 0.828857421875, 0.8718414306640625, 0.914825439453125, 0.9578094482421875, 1.00079345703125, 1.0437774658203125, 1.086761474609375, 1.1297454833984375, 1.1727294921875, 1.2157135009765625, 1.258697509765625, 1.3016815185546875, 1.34466552734375, 1.3876495361328125, 1.430633544921875, 1.4736175537109375, 1.5166015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 42.0, 149.0, 354.0, 301.0, 108.0, 26.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015113830566406, -20.432607650756836, -18.850101470947266, -17.267597198486328, -15.685091018676758, -14.102584838867188, -12.520078659057617, -10.937573432922363, -9.355067253112793, -7.772561550140381, -6.190055847167969, -4.607549667358398, -3.0250439643859863, -1.4425382614135742, 0.1399679183959961, 1.72247314453125, 3.3049793243408203, 4.887485027313232, 6.4699907302856445, 8.052496910095215, 9.635002136230469, 11.217508316040039, 12.80001449584961, 14.382519721984863, 15.965025901794434, 17.547531127929688, 19.130037307739258, 20.712543487548828, 22.2950496673584, 23.87755584716797, 25.460060119628906, 27.042566299438477, 28.625072479248047, 30.207578659057617, 31.790084838867188, 33.372589111328125, 34.95509719848633, 36.537601470947266, 38.12010955810547, 39.702613830566406, 41.285118103027344, 42.86762237548828, 44.450130462646484, 46.03263473510742, 47.615142822265625, 49.19764709472656, 50.7801513671875, 52.3626594543457, 53.945167541503906, 55.527671813964844, 57.11017990112305, 58.692684173583984, 60.27519226074219, 61.857696533203125, 63.44020080566406, 65.022705078125, 66.60520935058594, 68.18771362304688, 69.77021789550781, 71.35272979736328, 72.93523406982422, 74.51773834228516, 76.1002426147461, 77.68274688720703, 79.2652587890625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 7.0, 10.0, 11.0, 6.0, 21.0, 7.0, 31.0, 20.0, 34.0, 29.0, 30.0, 47.0, 44.0, 45.0, 36.0, 32.0, 50.0, 46.0, 56.0, 39.0, 28.0, 36.0, 37.0, 35.0, 39.0, 37.0, 25.0, 20.0, 15.0, 26.0, 18.0, 13.0, 19.0, 7.0, 9.0, 8.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.968815803527832, -12.532960891723633, -12.097105979919434, -11.661251068115234, -11.225396156311035, -10.789541244506836, -10.35368537902832, -9.917831420898438, -9.481975555419922, -9.046120643615723, -8.610265731811523, -8.174410820007324, -7.738555908203125, -7.302700996398926, -6.866845607757568, -6.430990695953369, -5.995136260986328, -5.559281349182129, -5.12342643737793, -4.6875715255737305, -4.251716613769531, -3.815861463546753, -3.3800063133239746, -2.9441514015197754, -2.508296489715576, -2.072441577911377, -1.6365865468978882, -1.2007315158843994, -0.7648766040802002, -0.329021692276001, 0.10683345794677734, 0.5426883697509766, 0.9785423278808594, 1.4143972396850586, 1.8502522706985474, 2.286107301712036, 2.7219622135162354, 3.1578171253204346, 3.593672275543213, 4.029527187347412, 4.465382099151611, 4.9012370109558105, 5.33709192276001, 5.772947311401367, 6.208802223205566, 6.644657135009766, 7.080512046813965, 7.516366958618164, 7.952221870422363, 8.388076782226562, 8.823931694030762, 9.259786605834961, 9.69564151763916, 10.13149642944336, 10.567352294921875, 11.003206253051758, 11.439062118530273, 11.874917030334473, 12.310771942138672, 12.746626853942871, 13.18248176574707, 13.61833667755127, 14.054191589355469, 14.490047454833984, 14.925901412963867]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 12.0, 14.0, 28.0, 20.0, 42.0, 54.0, 94.0, 98.0, 175.0, 250.0, 444.0, 770.0, 1452.0, 2877.0, 8056.0, 35642.0, 4042361.0, 81358.0, 12247.0, 4059.0, 1826.0, 954.0, 510.0, 328.0, 186.0, 124.0, 77.0, 54.0, 48.0, 31.0, 17.0, 13.0, 12.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.827728271484375, -2.73553466796875, -2.643341064453125, -2.5511474609375, -2.458953857421875, -2.36676025390625, -2.274566650390625, -2.182373046875, -2.090179443359375, -1.99798583984375, -1.905792236328125, -1.8135986328125, -1.721405029296875, -1.62921142578125, -1.537017822265625, -1.44482421875, -1.352630615234375, -1.26043701171875, -1.168243408203125, -1.0760498046875, -0.983856201171875, -0.89166259765625, -0.799468994140625, -0.707275390625, -0.615081787109375, -0.52288818359375, -0.430694580078125, -0.3385009765625, -0.246307373046875, -0.15411376953125, -0.061920166015625, 0.0302734375, 0.122467041015625, 0.21466064453125, 0.306854248046875, 0.3990478515625, 0.491241455078125, 0.58343505859375, 0.675628662109375, 0.767822265625, 0.860015869140625, 0.95220947265625, 1.044403076171875, 1.1365966796875, 1.228790283203125, 1.32098388671875, 1.413177490234375, 1.50537109375, 1.597564697265625, 1.68975830078125, 1.781951904296875, 1.8741455078125, 1.966339111328125, 2.05853271484375, 2.150726318359375, 2.242919921875, 2.335113525390625, 2.42730712890625, 2.519500732421875, 2.6116943359375, 2.703887939453125, 2.79608154296875, 2.888275146484375, 2.98046875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 8.0, 10.0, 13.0, 15.0, 15.0, 13.0, 24.0, 14.0, 32.0, 43.0, 62.0, 45.0, 67.0, 86.0, 83.0, 60.0, 79.0, 68.0, 58.0, 46.0, 36.0, 25.0, 28.0, 19.0, 13.0, 6.0, 7.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8623046875, -0.83306884765625, -0.8038330078125, -0.77459716796875, -0.745361328125, -0.71612548828125, -0.6868896484375, -0.65765380859375, -0.62841796875, -0.59918212890625, -0.5699462890625, -0.54071044921875, -0.511474609375, -0.48223876953125, -0.4530029296875, -0.42376708984375, -0.39453125, -0.36529541015625, -0.3360595703125, -0.30682373046875, -0.277587890625, -0.24835205078125, -0.2191162109375, -0.18988037109375, -0.16064453125, -0.13140869140625, -0.1021728515625, -0.07293701171875, -0.043701171875, -0.01446533203125, 0.0147705078125, 0.04400634765625, 0.0732421875, 0.10247802734375, 0.1317138671875, 0.16094970703125, 0.190185546875, 0.21942138671875, 0.2486572265625, 0.27789306640625, 0.30712890625, 0.33636474609375, 0.3656005859375, 0.39483642578125, 0.424072265625, 0.45330810546875, 0.4825439453125, 0.51177978515625, 0.541015625, 0.57025146484375, 0.5994873046875, 0.62872314453125, 0.657958984375, 0.68719482421875, 0.7164306640625, 0.74566650390625, 0.77490234375, 0.80413818359375, 0.8333740234375, 0.86260986328125, 0.891845703125, 0.92108154296875, 0.9503173828125, 0.97955322265625, 1.0087890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 18.0, 35.0, 44.0, 58.0, 95.0, 145.0, 263.0, 433.0, 804.0, 1670.0, 4066.0, 15333.0, 293901.0, 3847668.0, 20714.0, 4924.0, 1901.0, 972.0, 501.0, 281.0, 163.0, 96.0, 62.0, 50.0, 23.0, 11.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2265625, -3.107421875, -2.98828125, -2.869140625, -2.75, -2.630859375, -2.51171875, -2.392578125, -2.2734375, -2.154296875, -2.03515625, -1.916015625, -1.796875, -1.677734375, -1.55859375, -1.439453125, -1.3203125, -1.201171875, -1.08203125, -0.962890625, -0.84375, -0.724609375, -0.60546875, -0.486328125, -0.3671875, -0.248046875, -0.12890625, -0.009765625, 0.109375, 0.228515625, 0.34765625, 0.466796875, 0.5859375, 0.705078125, 0.82421875, 0.943359375, 1.0625, 1.181640625, 1.30078125, 1.419921875, 1.5390625, 1.658203125, 1.77734375, 1.896484375, 2.015625, 2.134765625, 2.25390625, 2.373046875, 2.4921875, 2.611328125, 2.73046875, 2.849609375, 2.96875, 3.087890625, 3.20703125, 3.326171875, 3.4453125, 3.564453125, 3.68359375, 3.802734375, 3.921875, 4.041015625, 4.16015625, 4.279296875, 4.3984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 19.0, 31.0, 46.0, 106.0, 732.0, 2872.0, 94.0, 62.0, 34.0, 13.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64892578125, -0.6292800903320312, -0.6096343994140625, -0.5899887084960938, -0.570343017578125, -0.5506973266601562, -0.5310516357421875, -0.5114059448242188, -0.49176025390625, -0.47211456298828125, -0.4524688720703125, -0.43282318115234375, -0.413177490234375, -0.39353179931640625, -0.3738861083984375, -0.35424041748046875, -0.3345947265625, -0.31494903564453125, -0.2953033447265625, -0.27565765380859375, -0.256011962890625, -0.23636627197265625, -0.2167205810546875, -0.19707489013671875, -0.17742919921875, -0.15778350830078125, -0.1381378173828125, -0.11849212646484375, -0.098846435546875, -0.07920074462890625, -0.0595550537109375, -0.03990936279296875, -0.020263671875, -0.00061798095703125, 0.0190277099609375, 0.03867340087890625, 0.058319091796875, 0.07796478271484375, 0.0976104736328125, 0.11725616455078125, 0.13690185546875, 0.15654754638671875, 0.1761932373046875, 0.19583892822265625, 0.215484619140625, 0.23513031005859375, 0.2547760009765625, 0.27442169189453125, 0.2940673828125, 0.31371307373046875, 0.3333587646484375, 0.35300445556640625, 0.372650146484375, 0.39229583740234375, 0.4119415283203125, 0.43158721923828125, 0.45123291015625, 0.47087860107421875, 0.4905242919921875, 0.5101699829101562, 0.529815673828125, 0.5494613647460938, 0.5691070556640625, 0.5887527465820312, 0.6083984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 10.0, 16.0, 17.0, 15.0, 33.0, 56.0, 52.0, 79.0, 88.0, 90.0, 85.0, 95.0, 88.0, 64.0, 58.0, 34.0, 32.0, 25.0, 14.0, 6.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9634976387023926, -1.9067236185073853, -1.8499497175216675, -1.7931756973266602, -1.7364016771316528, -1.679627776145935, -1.6228537559509277, -1.56607985496521, -1.5093058347702026, -1.4525318145751953, -1.3957579135894775, -1.3389838933944702, -1.282209873199463, -1.2254359722137451, -1.1686619520187378, -1.1118879318237305, -1.0551140308380127, -0.9983400702476501, -0.9415660500526428, -0.8847920894622803, -0.8280181288719177, -0.7712441682815552, -0.7144701480865479, -0.6576961874961853, -0.6009221076965332, -0.5441481471061707, -0.4873741567134857, -0.4306001663208008, -0.37382620573043823, -0.3170522153377533, -0.26027822494506836, -0.2035042643547058, -0.14673030376434326, -0.08995632827281952, -0.03318234533071518, 0.02359163761138916, 0.0803656131029129, 0.13713958859443665, 0.19391357898712158, 0.25068753957748413, 0.30746152997016907, 0.364235520362854, 0.42100948095321655, 0.4777834713459015, 0.5345574617385864, 0.591331422328949, 0.6481053829193115, 0.7048794031143188, 0.7616533637046814, 0.818427324295044, 0.8752013444900513, 0.9319753050804138, 0.9887492656707764, 1.0455232858657837, 1.102297306060791, 1.1590712070465088, 1.2158452272415161, 1.2726192474365234, 1.3293931484222412, 1.3861671686172485, 1.4429411888122559, 1.4997150897979736, 1.556489109992981, 1.6132631301879883, 1.670037031173706]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 8.0, 13.0, 9.0, 18.0, 32.0, 21.0, 22.0, 28.0, 26.0, 40.0, 32.0, 43.0, 52.0, 49.0, 59.0, 52.0, 50.0, 44.0, 47.0, 43.0, 38.0, 37.0, 36.0, 22.0, 29.0, 19.0, 20.0, 15.0, 10.0, 12.0, 13.0, 19.0, 5.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2582471370697021, -1.2196928262710571, -1.1811383962631226, -1.1425840854644775, -1.104029655456543, -1.065475344657898, -1.0269209146499634, -0.9883666038513184, -0.9498122334480286, -0.9112578630447388, -0.872703492641449, -0.8341491222381592, -0.7955948114395142, -0.7570403814315796, -0.7184860706329346, -0.6799317002296448, -0.641377329826355, -0.6028229594230652, -0.5642685890197754, -0.5257142186164856, -0.4871598780155182, -0.4486055076122284, -0.410051167011261, -0.3714967966079712, -0.3329424262046814, -0.2943880558013916, -0.2558336853981018, -0.2172793447971344, -0.1787249743938446, -0.1401706039905548, -0.10161624848842621, -0.06306189298629761, -0.024507522583007812, 0.014046840369701385, 0.052601203322410583, 0.09115556627511978, 0.12970992922782898, 0.16826429963111877, 0.20681865513324738, 0.24537301063537598, 0.28392738103866577, 0.32248175144195557, 0.36103612184524536, 0.39959046244621277, 0.43814483284950256, 0.47669920325279236, 0.5152535438537598, 0.5538079142570496, 0.5923622846603394, 0.6309166550636292, 0.669471025466919, 0.7080253958702087, 0.7465797662734985, 0.7851340770721436, 0.8236884474754333, 0.8622428178787231, 0.9007971882820129, 0.9393515586853027, 0.9779059290885925, 1.0164602994918823, 1.0550146102905273, 1.093569040298462, 1.132123351097107, 1.170677661895752, 1.2092320919036865]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 11.0, 9.0, 20.0, 23.0, 26.0, 40.0, 80.0, 93.0, 205.0, 354.0, 646.0, 1442.0, 3127.0, 7621.0, 21459.0, 63312.0, 187565.0, 391144.0, 242390.0, 83445.0, 27945.0, 10013.0, 3910.0, 1803.0, 815.0, 457.0, 203.0, 139.0, 98.0, 48.0, 34.0, 27.0, 14.0, 10.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.447265625, -1.4029083251953125, -1.358551025390625, -1.3141937255859375, -1.26983642578125, -1.2254791259765625, -1.181121826171875, -1.1367645263671875, -1.0924072265625, -1.0480499267578125, -1.003692626953125, -0.9593353271484375, -0.91497802734375, -0.8706207275390625, -0.826263427734375, -0.7819061279296875, -0.737548828125, -0.6931915283203125, -0.648834228515625, -0.6044769287109375, -0.56011962890625, -0.5157623291015625, -0.471405029296875, -0.4270477294921875, -0.3826904296875, -0.3383331298828125, -0.293975830078125, -0.2496185302734375, -0.20526123046875, -0.1609039306640625, -0.116546630859375, -0.0721893310546875, -0.02783203125, 0.0165252685546875, 0.060882568359375, 0.1052398681640625, 0.14959716796875, 0.1939544677734375, 0.238311767578125, 0.2826690673828125, 0.3270263671875, 0.3713836669921875, 0.415740966796875, 0.4600982666015625, 0.50445556640625, 0.5488128662109375, 0.593170166015625, 0.6375274658203125, 0.681884765625, 0.7262420654296875, 0.770599365234375, 0.8149566650390625, 0.85931396484375, 0.9036712646484375, 0.948028564453125, 0.9923858642578125, 1.0367431640625, 1.0811004638671875, 1.125457763671875, 1.1698150634765625, 1.21417236328125, 1.2585296630859375, 1.302886962890625, 1.3472442626953125, 1.3916015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 10.0, 14.0, 15.0, 17.0, 17.0, 36.0, 33.0, 38.0, 44.0, 64.0, 72.0, 66.0, 74.0, 69.0, 69.0, 59.0, 54.0, 51.0, 48.0, 28.0, 21.0, 16.0, 19.0, 5.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.870452880859375, -0.84100341796875, -0.811553955078125, -0.7821044921875, -0.752655029296875, -0.72320556640625, -0.693756103515625, -0.664306640625, -0.634857177734375, -0.60540771484375, -0.575958251953125, -0.5465087890625, -0.517059326171875, -0.48760986328125, -0.458160400390625, -0.4287109375, -0.399261474609375, -0.36981201171875, -0.340362548828125, -0.3109130859375, -0.281463623046875, -0.25201416015625, -0.222564697265625, -0.193115234375, -0.163665771484375, -0.13421630859375, -0.104766845703125, -0.0753173828125, -0.045867919921875, -0.01641845703125, 0.013031005859375, 0.04248046875, 0.071929931640625, 0.10137939453125, 0.130828857421875, 0.1602783203125, 0.189727783203125, 0.21917724609375, 0.248626708984375, 0.278076171875, 0.307525634765625, 0.33697509765625, 0.366424560546875, 0.3958740234375, 0.425323486328125, 0.45477294921875, 0.484222412109375, 0.513671875, 0.543121337890625, 0.57257080078125, 0.602020263671875, 0.6314697265625, 0.660919189453125, 0.69036865234375, 0.719818115234375, 0.749267578125, 0.778717041015625, 0.80816650390625, 0.837615966796875, 0.8670654296875, 0.896514892578125, 0.92596435546875, 0.955413818359375, 0.98486328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 15.0, 20.0, 53.0, 104.0, 246.0, 672.0, 2359.0, 66825.0, 966939.0, 9192.0, 1319.0, 419.0, 182.0, 72.0, 53.0, 21.0, 15.0, 7.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1640625, -8.91156005859375, -8.6590576171875, -8.40655517578125, -8.154052734375, -7.90155029296875, -7.6490478515625, -7.39654541015625, -7.14404296875, -6.89154052734375, -6.6390380859375, -6.38653564453125, -6.134033203125, -5.88153076171875, -5.6290283203125, -5.37652587890625, -5.1240234375, -4.87152099609375, -4.6190185546875, -4.36651611328125, -4.114013671875, -3.86151123046875, -3.6090087890625, -3.35650634765625, -3.10400390625, -2.85150146484375, -2.5989990234375, -2.34649658203125, -2.093994140625, -1.84149169921875, -1.5889892578125, -1.33648681640625, -1.083984375, -0.83148193359375, -0.5789794921875, -0.32647705078125, -0.073974609375, 0.17852783203125, 0.4310302734375, 0.68353271484375, 0.93603515625, 1.18853759765625, 1.4410400390625, 1.69354248046875, 1.946044921875, 2.19854736328125, 2.4510498046875, 2.70355224609375, 2.9560546875, 3.20855712890625, 3.4610595703125, 3.71356201171875, 3.966064453125, 4.21856689453125, 4.4710693359375, 4.72357177734375, 4.97607421875, 5.22857666015625, 5.4810791015625, 5.73358154296875, 5.986083984375, 6.23858642578125, 6.4910888671875, 6.74359130859375, 6.99609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 10.0, 19.0, 26.0, 35.0, 38.0, 62.0, 59.0, 57.0, 72.0, 72.0, 88.0, 83.0, 63.0, 65.0, 58.0, 45.0, 26.0, 25.0, 19.0, 11.0, 9.0, 9.0, 12.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.84716796875, -3.6748046875, -3.50244140625, -3.330078125, -3.15771484375, -2.9853515625, -2.81298828125, -2.640625, -2.46826171875, -2.2958984375, -2.12353515625, -1.951171875, -1.77880859375, -1.6064453125, -1.43408203125, -1.26171875, -1.08935546875, -0.9169921875, -0.74462890625, -0.572265625, -0.39990234375, -0.2275390625, -0.05517578125, 0.1171875, 0.28955078125, 0.4619140625, 0.63427734375, 0.806640625, 0.97900390625, 1.1513671875, 1.32373046875, 1.49609375, 1.66845703125, 1.8408203125, 2.01318359375, 2.185546875, 2.35791015625, 2.5302734375, 2.70263671875, 2.875, 3.04736328125, 3.2197265625, 3.39208984375, 3.564453125, 3.73681640625, 3.9091796875, 4.08154296875, 4.25390625, 4.42626953125, 4.5986328125, 4.77099609375, 4.943359375, 5.11572265625, 5.2880859375, 5.46044921875, 5.6328125, 5.80517578125, 5.9775390625, 6.14990234375, 6.322265625, 6.49462890625, 6.6669921875, 6.83935546875, 7.01171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 14.0, 5.0, 10.0, 21.0, 31.0, 48.0, 63.0, 106.0, 222.0, 432.0, 1261.0, 5983.0, 172377.0, 845480.0, 18983.0, 2140.0, 650.0, 291.0, 154.0, 94.0, 58.0, 34.0, 30.0, 18.0, 7.0, 6.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.406280517578125, -2.31451416015625, -2.222747802734375, -2.1309814453125, -2.039215087890625, -1.94744873046875, -1.855682373046875, -1.763916015625, -1.672149658203125, -1.58038330078125, -1.488616943359375, -1.3968505859375, -1.305084228515625, -1.21331787109375, -1.121551513671875, -1.02978515625, -0.938018798828125, -0.84625244140625, -0.754486083984375, -0.6627197265625, -0.570953369140625, -0.47918701171875, -0.387420654296875, -0.295654296875, -0.203887939453125, -0.11212158203125, -0.020355224609375, 0.0714111328125, 0.163177490234375, 0.25494384765625, 0.346710205078125, 0.4384765625, 0.530242919921875, 0.62200927734375, 0.713775634765625, 0.8055419921875, 0.897308349609375, 0.98907470703125, 1.080841064453125, 1.172607421875, 1.264373779296875, 1.35614013671875, 1.447906494140625, 1.5396728515625, 1.631439208984375, 1.72320556640625, 1.814971923828125, 1.90673828125, 1.998504638671875, 2.09027099609375, 2.182037353515625, 2.2738037109375, 2.365570068359375, 2.45733642578125, 2.549102783203125, 2.640869140625, 2.732635498046875, 2.82440185546875, 2.916168212890625, 3.0079345703125, 3.099700927734375, 3.19146728515625, 3.283233642578125, 3.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 12.0, 11.0, 14.0, 27.0, 29.0, 37.0, 44.0, 55.0, 65.0, 102.0, 109.0, 89.0, 79.0, 65.0, 45.0, 44.0, 26.0, 18.0, 23.0, 20.0, 10.0, 10.0, 5.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00023055076599121094, -0.00022425130009651184, -0.00021795183420181274, -0.00021165236830711365, -0.00020535290241241455, -0.00019905343651771545, -0.00019275397062301636, -0.00018645450472831726, -0.00018015503883361816, -0.00017385557293891907, -0.00016755610704421997, -0.00016125664114952087, -0.00015495717525482178, -0.00014865770936012268, -0.00014235824346542358, -0.0001360587775707245, -0.0001297593116760254, -0.0001234598457813263, -0.0001171603798866272, -0.0001108609139919281, -0.000104561448097229, -9.826198220252991e-05, -9.196251630783081e-05, -8.566305041313171e-05, -7.936358451843262e-05, -7.306411862373352e-05, -6.676465272903442e-05, -6.046518683433533e-05, -5.416572093963623e-05, -4.7866255044937134e-05, -4.156678915023804e-05, -3.526732325553894e-05, -2.8967857360839844e-05, -2.2668391466140747e-05, -1.636892557144165e-05, -1.0069459676742554e-05, -3.769993782043457e-06, 2.5294721126556396e-06, 8.828938007354736e-06, 1.5128403902053833e-05, 2.142786979675293e-05, 2.7727335691452026e-05, 3.402680158615112e-05, 4.032626748085022e-05, 4.6625733375549316e-05, 5.292519927024841e-05, 5.922466516494751e-05, 6.55241310596466e-05, 7.18235969543457e-05, 7.81230628490448e-05, 8.44225287437439e-05, 9.072199463844299e-05, 9.702146053314209e-05, 0.00010332092642784119, 0.00010962039232254028, 0.00011591985821723938, 0.00012221932411193848, 0.00012851879000663757, 0.00013481825590133667, 0.00014111772179603577, 0.00014741718769073486, 0.00015371665358543396, 0.00016001611948013306, 0.00016631558537483215, 0.00017261505126953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 8.0, 10.0, 10.0, 29.0, 39.0, 45.0, 67.0, 135.0, 285.0, 578.0, 1366.0, 4407.0, 35598.0, 776840.0, 213318.0, 11530.0, 2423.0, 924.0, 409.0, 212.0, 108.0, 61.0, 39.0, 25.0, 22.0, 23.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.405120849609375, -2.33172607421875, -2.258331298828125, -2.1849365234375, -2.111541748046875, -2.03814697265625, -1.964752197265625, -1.891357421875, -1.817962646484375, -1.74456787109375, -1.671173095703125, -1.5977783203125, -1.524383544921875, -1.45098876953125, -1.377593994140625, -1.30419921875, -1.230804443359375, -1.15740966796875, -1.084014892578125, -1.0106201171875, -0.937225341796875, -0.86383056640625, -0.790435791015625, -0.717041015625, -0.643646240234375, -0.57025146484375, -0.496856689453125, -0.4234619140625, -0.350067138671875, -0.27667236328125, -0.203277587890625, -0.1298828125, -0.056488037109375, 0.01690673828125, 0.090301513671875, 0.1636962890625, 0.237091064453125, 0.31048583984375, 0.383880615234375, 0.457275390625, 0.530670166015625, 0.60406494140625, 0.677459716796875, 0.7508544921875, 0.824249267578125, 0.89764404296875, 0.971038818359375, 1.04443359375, 1.117828369140625, 1.19122314453125, 1.264617919921875, 1.3380126953125, 1.411407470703125, 1.48480224609375, 1.558197021484375, 1.631591796875, 1.704986572265625, 1.77838134765625, 1.851776123046875, 1.9251708984375, 1.998565673828125, 2.07196044921875, 2.145355224609375, 2.21875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 15.0, 12.0, 26.0, 26.0, 55.0, 60.0, 101.0, 109.0, 120.0, 121.0, 88.0, 68.0, 47.0, 31.0, 30.0, 19.0, 14.0, 9.0, 6.0, 5.0, 10.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8759918212890625, -1.807647705078125, -1.7393035888671875, -1.67095947265625, -1.6026153564453125, -1.534271240234375, -1.4659271240234375, -1.3975830078125, -1.3292388916015625, -1.260894775390625, -1.1925506591796875, -1.12420654296875, -1.0558624267578125, -0.987518310546875, -0.9191741943359375, -0.850830078125, -0.7824859619140625, -0.714141845703125, -0.6457977294921875, -0.57745361328125, -0.5091094970703125, -0.440765380859375, -0.3724212646484375, -0.3040771484375, -0.2357330322265625, -0.167388916015625, -0.0990447998046875, -0.03070068359375, 0.0376434326171875, 0.105987548828125, 0.1743316650390625, 0.24267578125, 0.3110198974609375, 0.379364013671875, 0.4477081298828125, 0.51605224609375, 0.5843963623046875, 0.652740478515625, 0.7210845947265625, 0.7894287109375, 0.8577728271484375, 0.926116943359375, 0.9944610595703125, 1.06280517578125, 1.1311492919921875, 1.199493408203125, 1.2678375244140625, 1.336181640625, 1.4045257568359375, 1.472869873046875, 1.5412139892578125, 1.60955810546875, 1.6779022216796875, 1.746246337890625, 1.8145904541015625, 1.8829345703125, 1.9512786865234375, 2.019622802734375, 2.0879669189453125, 2.15631103515625, 2.2246551513671875, 2.292999267578125, 2.3613433837890625, 2.4296875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 12.0, 53.0, 235.0, 423.0, 213.0, 43.0, 12.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.392494201660156, -32.712867736816406, -31.033245086669922, -29.353618621826172, -27.673995971679688, -25.994369506835938, -24.31474494934082, -22.635120391845703, -20.955495834350586, -19.27587127685547, -17.59624671936035, -15.916621208190918, -14.2369966506958, -12.557372093200684, -10.87774658203125, -9.198122024536133, -7.518497467041016, -5.838872909545898, -4.159247875213623, -2.4796228408813477, -0.7999982833862305, 0.8796262741088867, 2.5592517852783203, 4.2388763427734375, 5.918500900268555, 7.598125457763672, 9.277750015258789, 10.957375526428223, 12.63700008392334, 14.316624641418457, 15.99625015258789, 17.675874710083008, 19.355499267578125, 21.035123825073242, 22.71474838256836, 24.39437484741211, 26.073997497558594, 27.753623962402344, 29.43324851989746, 31.112873077392578, 32.79249572753906, 34.47212219238281, 36.1517448425293, 37.83137130737305, 39.51099395751953, 41.19062042236328, 42.87024688720703, 44.549869537353516, 46.229496002197266, 47.909122467041016, 49.5887451171875, 51.26837158203125, 52.947994232177734, 54.627620697021484, 56.30724334716797, 57.98686981201172, 59.66649627685547, 61.34612274169922, 63.0257453918457, 64.70536804199219, 66.38499450683594, 68.06462097167969, 69.74424743652344, 71.42387390136719, 73.1034927368164]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 8.0, 10.0, 6.0, 13.0, 14.0, 15.0, 19.0, 29.0, 22.0, 22.0, 21.0, 27.0, 41.0, 40.0, 44.0, 46.0, 37.0, 51.0, 47.0, 48.0, 42.0, 40.0, 40.0, 35.0, 35.0, 31.0, 32.0, 24.0, 15.0, 16.0, 15.0, 16.0, 9.0, 8.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.982881546020508, -12.583287239074707, -12.183693885803223, -11.784099578857422, -11.384506225585938, -10.984911918640137, -10.585317611694336, -10.185724258422852, -9.78612995147705, -9.38653564453125, -8.986942291259766, -8.587347984313965, -8.187753677368164, -7.78816032409668, -7.388566017150879, -6.988972187042236, -6.589378356933594, -6.189784526824951, -5.790190696716309, -5.390596389770508, -4.991002559661865, -4.591408729553223, -4.191814422607422, -3.7922205924987793, -3.3926267623901367, -2.993032932281494, -2.5934388637542725, -2.193844795227051, -1.7942509651184082, -1.394657015800476, -0.995063066482544, -0.5954689979553223, -0.1958761215209961, 0.20371782779693604, 0.6033117771148682, 1.0029057264328003, 1.4024996757507324, 1.8020936250686646, 2.2016875743865967, 2.6012816429138184, 3.000875473022461, 3.4004693031311035, 3.800063371658325, 4.199657440185547, 4.5992512702941895, 4.998845100402832, 5.398439407348633, 5.798033237457275, 6.197627067565918, 6.5972208976745605, 6.996814727783203, 7.396409034729004, 7.7960028648376465, 8.195596694946289, 8.59519100189209, 8.99478530883789, 9.394378662109375, 9.793972969055176, 10.19356632232666, 10.593160629272461, 10.992753982543945, 11.392348289489746, 11.791942596435547, 12.191535949707031, 12.591130256652832]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 9.0, 14.0, 14.0, 15.0, 25.0, 32.0, 42.0, 72.0, 85.0, 138.0, 186.0, 300.0, 378.0, 656.0, 1095.0, 1896.0, 4033.0, 9992.0, 33704.0, 295228.0, 3757550.0, 61888.0, 15139.0, 5579.0, 2492.0, 1389.0, 762.0, 498.0, 329.0, 238.0, 144.0, 103.0, 69.0, 47.0, 39.0, 30.0, 15.0, 15.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.14453125, -2.077911376953125, -2.01129150390625, -1.944671630859375, -1.8780517578125, -1.811431884765625, -1.74481201171875, -1.678192138671875, -1.611572265625, -1.544952392578125, -1.47833251953125, -1.411712646484375, -1.3450927734375, -1.278472900390625, -1.21185302734375, -1.145233154296875, -1.07861328125, -1.011993408203125, -0.94537353515625, -0.878753662109375, -0.8121337890625, -0.745513916015625, -0.67889404296875, -0.612274169921875, -0.545654296875, -0.479034423828125, -0.41241455078125, -0.345794677734375, -0.2791748046875, -0.212554931640625, -0.14593505859375, -0.079315185546875, -0.0126953125, 0.053924560546875, 0.12054443359375, 0.187164306640625, 0.2537841796875, 0.320404052734375, 0.38702392578125, 0.453643798828125, 0.520263671875, 0.586883544921875, 0.65350341796875, 0.720123291015625, 0.7867431640625, 0.853363037109375, 0.91998291015625, 0.986602783203125, 1.05322265625, 1.119842529296875, 1.18646240234375, 1.253082275390625, 1.3197021484375, 1.386322021484375, 1.45294189453125, 1.519561767578125, 1.586181640625, 1.652801513671875, 1.71942138671875, 1.786041259765625, 1.8526611328125, 1.919281005859375, 1.98590087890625, 2.052520751953125, 2.119140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 7.0, 12.0, 17.0, 11.0, 19.0, 27.0, 29.0, 45.0, 54.0, 50.0, 51.0, 61.0, 54.0, 65.0, 65.0, 62.0, 63.0, 53.0, 43.0, 50.0, 36.0, 21.0, 14.0, 19.0, 11.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8300933837890625, -0.805206298828125, -0.7803192138671875, -0.75543212890625, -0.7305450439453125, -0.705657958984375, -0.6807708740234375, -0.6558837890625, -0.6309967041015625, -0.606109619140625, -0.5812225341796875, -0.55633544921875, -0.5314483642578125, -0.506561279296875, -0.4816741943359375, -0.456787109375, -0.4319000244140625, -0.407012939453125, -0.3821258544921875, -0.35723876953125, -0.3323516845703125, -0.307464599609375, -0.2825775146484375, -0.2576904296875, -0.2328033447265625, -0.207916259765625, -0.1830291748046875, -0.15814208984375, -0.1332550048828125, -0.108367919921875, -0.0834808349609375, -0.05859375, -0.0337066650390625, -0.008819580078125, 0.0160675048828125, 0.04095458984375, 0.0658416748046875, 0.090728759765625, 0.1156158447265625, 0.1405029296875, 0.1653900146484375, 0.190277099609375, 0.2151641845703125, 0.24005126953125, 0.2649383544921875, 0.289825439453125, 0.3147125244140625, 0.339599609375, 0.3644866943359375, 0.389373779296875, 0.4142608642578125, 0.43914794921875, 0.4640350341796875, 0.488922119140625, 0.5138092041015625, 0.5386962890625, 0.5635833740234375, 0.588470458984375, 0.6133575439453125, 0.63824462890625, 0.6631317138671875, 0.688018798828125, 0.7129058837890625, 0.73779296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 11.0, 8.0, 7.0, 7.0, 19.0, 22.0, 17.0, 41.0, 77.0, 126.0, 202.0, 321.0, 604.0, 1146.0, 2357.0, 6205.0, 24501.0, 412099.0, 3689529.0, 42300.0, 8559.0, 2962.0, 1432.0, 751.0, 373.0, 201.0, 126.0, 94.0, 69.0, 38.0, 29.0, 17.0, 4.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.445068359375, -2.35498046875, -2.264892578125, -2.1748046875, -2.084716796875, -1.99462890625, -1.904541015625, -1.814453125, -1.724365234375, -1.63427734375, -1.544189453125, -1.4541015625, -1.364013671875, -1.27392578125, -1.183837890625, -1.09375, -1.003662109375, -0.91357421875, -0.823486328125, -0.7333984375, -0.643310546875, -0.55322265625, -0.463134765625, -0.373046875, -0.282958984375, -0.19287109375, -0.102783203125, -0.0126953125, 0.077392578125, 0.16748046875, 0.257568359375, 0.34765625, 0.437744140625, 0.52783203125, 0.617919921875, 0.7080078125, 0.798095703125, 0.88818359375, 0.978271484375, 1.068359375, 1.158447265625, 1.24853515625, 1.338623046875, 1.4287109375, 1.518798828125, 1.60888671875, 1.698974609375, 1.7890625, 1.879150390625, 1.96923828125, 2.059326171875, 2.1494140625, 2.239501953125, 2.32958984375, 2.419677734375, 2.509765625, 2.599853515625, 2.68994140625, 2.780029296875, 2.8701171875, 2.960205078125, 3.05029296875, 3.140380859375, 3.23046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 11.0, 19.0, 39.0, 45.0, 112.0, 337.0, 2780.0, 404.0, 148.0, 63.0, 31.0, 25.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.244140625, -1.2091598510742188, -1.1741790771484375, -1.1391983032226562, -1.104217529296875, -1.0692367553710938, -1.0342559814453125, -0.9992752075195312, -0.96429443359375, -0.9293136596679688, -0.8943328857421875, -0.8593521118164062, -0.824371337890625, -0.7893905639648438, -0.7544097900390625, -0.7194290161132812, -0.6844482421875, -0.6494674682617188, -0.6144866943359375, -0.5795059204101562, -0.544525146484375, -0.5095443725585938, -0.4745635986328125, -0.43958282470703125, -0.40460205078125, -0.36962127685546875, -0.3346405029296875, -0.29965972900390625, -0.264678955078125, -0.22969818115234375, -0.1947174072265625, -0.15973663330078125, -0.124755859375, -0.08977508544921875, -0.0547943115234375, -0.01981353759765625, 0.015167236328125, 0.05014801025390625, 0.0851287841796875, 0.12010955810546875, 0.15509033203125, 0.19007110595703125, 0.2250518798828125, 0.26003265380859375, 0.295013427734375, 0.32999420166015625, 0.3649749755859375, 0.39995574951171875, 0.4349365234375, 0.46991729736328125, 0.5048980712890625, 0.5398788452148438, 0.574859619140625, 0.6098403930664062, 0.6448211669921875, 0.6798019409179688, 0.71478271484375, 0.7497634887695312, 0.7847442626953125, 0.8197250366210938, 0.854705810546875, 0.8896865844726562, 0.9246673583984375, 0.9596481323242188, 0.99462890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 14.0, 19.0, 34.0, 59.0, 98.0, 121.0, 142.0, 141.0, 114.0, 91.0, 51.0, 27.0, 25.0, 17.0, 12.0, 6.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.239797592163086, -3.081843852996826, -2.9238898754119873, -2.7659361362457275, -2.6079823970794678, -2.450028419494629, -2.292074680328369, -2.1341209411621094, -1.97616708278656, -1.8182132244110107, -1.660259485244751, -1.5023056268692017, -1.3443517684936523, -1.1863980293273926, -1.0284441709518433, -0.8704904317855835, -0.7125365734100342, -0.5545827746391296, -0.3966289460659027, -0.23867511749267578, -0.08072131872177124, 0.0772324800491333, 0.23518633842468262, 0.3931400775909424, 0.5510939359664917, 0.7090477347373962, 0.8670015335083008, 1.02495539188385, 1.1829092502593994, 1.3408629894256592, 1.4988168478012085, 1.6567705869674683, 1.8147244453430176, 1.972678303718567, 2.130632162094116, 2.288585901260376, 2.4465396404266357, 2.6044936180114746, 2.7624473571777344, 2.920401096343994, 3.078354835510254, 3.2363085746765137, 3.3942625522613525, 3.5522162914276123, 3.710170030593872, 3.868124008178711, 4.026077747344971, 4.1840314865112305, 4.341985702514648, 4.499939441680908, 4.657893180847168, 4.815847396850586, 4.973801136016846, 5.1317548751831055, 5.289708614349365, 5.447662353515625, 5.605616092681885, 5.7635698318481445, 5.921523571014404, 6.079477310180664, 6.237431526184082, 6.395385265350342, 6.553339004516602, 6.711292743682861, 6.869246482849121]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 2.0, 8.0, 13.0, 10.0, 11.0, 18.0, 27.0, 21.0, 28.0, 26.0, 33.0, 31.0, 30.0, 47.0, 45.0, 40.0, 34.0, 35.0, 44.0, 46.0, 45.0, 38.0, 38.0, 39.0, 35.0, 17.0, 29.0, 29.0, 20.0, 20.0, 23.0, 16.0, 18.0, 9.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3008830547332764, -2.2314326763153076, -2.161982297897339, -2.09253191947937, -2.0230817794799805, -1.9536312818527222, -1.884181022644043, -1.8147306442260742, -1.7452802658081055, -1.6758298873901367, -1.606379508972168, -1.5369292497634888, -1.46747887134552, -1.3980284929275513, -1.328578233718872, -1.2591278553009033, -1.1896774768829346, -1.1202270984649658, -1.050776720046997, -0.9813264608383179, -0.9118760824203491, -0.8424257040023804, -0.7729753851890564, -0.7035250663757324, -0.6340746879577637, -0.5646243095397949, -0.49517399072647095, -0.4257236421108246, -0.3562732934951782, -0.28682294487953186, -0.2173725962638855, -0.14792224764823914, -0.07847213745117188, -0.009021788835525513, 0.06042855978012085, 0.1298789083957672, 0.19932925701141357, 0.26877960562705994, 0.3382299542427063, 0.40768030285835266, 0.477130651473999, 0.5465810298919678, 0.6160313487052917, 0.6854816675186157, 0.7549320459365845, 0.8243824243545532, 0.8938327431678772, 0.9632830619812012, 1.03273344039917, 1.1021838188171387, 1.1716341972351074, 1.2410844564437866, 1.3105348348617554, 1.3799852132797241, 1.4494354724884033, 1.518885850906372, 1.5883362293243408, 1.6577866077423096, 1.7272369861602783, 1.7966872453689575, 1.8661376237869263, 1.935588002204895, 2.005038261413574, 2.074488639831543, 2.1439390182495117]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 15.0, 10.0, 12.0, 27.0, 64.0, 108.0, 257.0, 573.0, 1624.0, 5555.0, 23885.0, 124793.0, 564689.0, 264138.0, 48346.0, 10055.0, 2713.0, 908.0, 372.0, 169.0, 98.0, 52.0, 28.0, 17.0, 12.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.455078125, -2.372467041015625, -2.28985595703125, -2.207244873046875, -2.1246337890625, -2.042022705078125, -1.95941162109375, -1.876800537109375, -1.794189453125, -1.711578369140625, -1.62896728515625, -1.546356201171875, -1.4637451171875, -1.381134033203125, -1.29852294921875, -1.215911865234375, -1.13330078125, -1.050689697265625, -0.96807861328125, -0.885467529296875, -0.8028564453125, -0.720245361328125, -0.63763427734375, -0.555023193359375, -0.472412109375, -0.389801025390625, -0.30718994140625, -0.224578857421875, -0.1419677734375, -0.059356689453125, 0.02325439453125, 0.105865478515625, 0.1884765625, 0.271087646484375, 0.35369873046875, 0.436309814453125, 0.5189208984375, 0.601531982421875, 0.68414306640625, 0.766754150390625, 0.849365234375, 0.931976318359375, 1.01458740234375, 1.097198486328125, 1.1798095703125, 1.262420654296875, 1.34503173828125, 1.427642822265625, 1.51025390625, 1.592864990234375, 1.67547607421875, 1.758087158203125, 1.8406982421875, 1.923309326171875, 2.00592041015625, 2.088531494140625, 2.171142578125, 2.253753662109375, 2.33636474609375, 2.418975830078125, 2.5015869140625, 2.584197998046875, 2.66680908203125, 2.749420166015625, 2.83203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 14.0, 7.0, 18.0, 27.0, 35.0, 32.0, 27.0, 43.0, 58.0, 65.0, 53.0, 50.0, 51.0, 67.0, 58.0, 53.0, 58.0, 37.0, 38.0, 33.0, 22.0, 28.0, 14.0, 19.0, 18.0, 10.0, 4.0, 1.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8361892700195312, -0.8125152587890625, -0.7888412475585938, -0.765167236328125, -0.7414932250976562, -0.7178192138671875, -0.6941452026367188, -0.67047119140625, -0.6467971801757812, -0.6231231689453125, -0.5994491577148438, -0.575775146484375, -0.5521011352539062, -0.5284271240234375, -0.5047531127929688, -0.4810791015625, -0.45740509033203125, -0.4337310791015625, -0.41005706787109375, -0.386383056640625, -0.36270904541015625, -0.3390350341796875, -0.31536102294921875, -0.29168701171875, -0.26801300048828125, -0.2443389892578125, -0.22066497802734375, -0.196990966796875, -0.17331695556640625, -0.1496429443359375, -0.12596893310546875, -0.102294921875, -0.07862091064453125, -0.0549468994140625, -0.03127288818359375, -0.007598876953125, 0.01607513427734375, 0.0397491455078125, 0.06342315673828125, 0.08709716796875, 0.11077117919921875, 0.1344451904296875, 0.15811920166015625, 0.181793212890625, 0.20546722412109375, 0.2291412353515625, 0.25281524658203125, 0.2764892578125, 0.30016326904296875, 0.3238372802734375, 0.34751129150390625, 0.371185302734375, 0.39485931396484375, 0.4185333251953125, 0.44220733642578125, 0.46588134765625, 0.48955535888671875, 0.5132293701171875, 0.5369033813476562, 0.560577392578125, 0.5842514038085938, 0.6079254150390625, 0.6315994262695312, 0.6552734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 9.0, 15.0, 27.0, 55.0, 81.0, 181.0, 476.0, 1748.0, 22689.0, 1003416.0, 17350.0, 1595.0, 464.0, 181.0, 100.0, 45.0, 25.0, 17.0, 14.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4002685546875, -8.105224609375, -7.8101806640625, -7.51513671875, -7.2200927734375, -6.925048828125, -6.6300048828125, -6.3349609375, -6.0399169921875, -5.744873046875, -5.4498291015625, -5.15478515625, -4.8597412109375, -4.564697265625, -4.2696533203125, -3.974609375, -3.6795654296875, -3.384521484375, -3.0894775390625, -2.79443359375, -2.4993896484375, -2.204345703125, -1.9093017578125, -1.6142578125, -1.3192138671875, -1.024169921875, -0.7291259765625, -0.43408203125, -0.1390380859375, 0.156005859375, 0.4510498046875, 0.74609375, 1.0411376953125, 1.336181640625, 1.6312255859375, 1.92626953125, 2.2213134765625, 2.516357421875, 2.8114013671875, 3.1064453125, 3.4014892578125, 3.696533203125, 3.9915771484375, 4.28662109375, 4.5816650390625, 4.876708984375, 5.1717529296875, 5.466796875, 5.7618408203125, 6.056884765625, 6.3519287109375, 6.64697265625, 6.9420166015625, 7.237060546875, 7.5321044921875, 7.8271484375, 8.1221923828125, 8.417236328125, 8.7122802734375, 9.00732421875, 9.3023681640625, 9.597412109375, 9.8924560546875, 10.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 19.0, 14.0, 15.0, 29.0, 35.0, 39.0, 35.0, 66.0, 59.0, 78.0, 77.0, 65.0, 63.0, 57.0, 47.0, 44.0, 51.0, 38.0, 36.0, 29.0, 22.0, 16.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.753570556640625, -3.63018798828125, -3.506805419921875, -3.3834228515625, -3.260040283203125, -3.13665771484375, -3.013275146484375, -2.889892578125, -2.766510009765625, -2.64312744140625, -2.519744873046875, -2.3963623046875, -2.272979736328125, -2.14959716796875, -2.026214599609375, -1.90283203125, -1.779449462890625, -1.65606689453125, -1.532684326171875, -1.4093017578125, -1.285919189453125, -1.16253662109375, -1.039154052734375, -0.915771484375, -0.792388916015625, -0.66900634765625, -0.545623779296875, -0.4222412109375, -0.298858642578125, -0.17547607421875, -0.052093505859375, 0.0712890625, 0.194671630859375, 0.31805419921875, 0.441436767578125, 0.5648193359375, 0.688201904296875, 0.81158447265625, 0.934967041015625, 1.058349609375, 1.181732177734375, 1.30511474609375, 1.428497314453125, 1.5518798828125, 1.675262451171875, 1.79864501953125, 1.922027587890625, 2.04541015625, 2.168792724609375, 2.29217529296875, 2.415557861328125, 2.5389404296875, 2.662322998046875, 2.78570556640625, 2.909088134765625, 3.032470703125, 3.155853271484375, 3.27923583984375, 3.402618408203125, 3.5260009765625, 3.649383544921875, 3.77276611328125, 3.896148681640625, 4.01953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 11.0, 20.0, 19.0, 25.0, 43.0, 70.0, 98.0, 188.0, 281.0, 489.0, 1016.0, 2504.0, 8414.0, 42242.0, 342789.0, 569288.0, 63948.0, 11338.0, 3165.0, 1191.0, 556.0, 310.0, 166.0, 101.0, 79.0, 51.0, 38.0, 26.0, 23.0, 14.0, 9.0, 9.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.5283203125, -1.4911422729492188, -1.4539642333984375, -1.4167861938476562, -1.379608154296875, -1.3424301147460938, -1.3052520751953125, -1.2680740356445312, -1.23089599609375, -1.1937179565429688, -1.1565399169921875, -1.1193618774414062, -1.082183837890625, -1.0450057983398438, -1.0078277587890625, -0.9706497192382812, -0.9334716796875, -0.8962936401367188, -0.8591156005859375, -0.8219375610351562, -0.784759521484375, -0.7475814819335938, -0.7104034423828125, -0.6732254028320312, -0.63604736328125, -0.5988693237304688, -0.5616912841796875, -0.5245132446289062, -0.487335205078125, -0.45015716552734375, -0.4129791259765625, -0.37580108642578125, -0.338623046875, -0.30144500732421875, -0.2642669677734375, -0.22708892822265625, -0.189910888671875, -0.15273284912109375, -0.1155548095703125, -0.07837677001953125, -0.04119873046875, -0.00402069091796875, 0.0331573486328125, 0.07033538818359375, 0.107513427734375, 0.14469146728515625, 0.1818695068359375, 0.21904754638671875, 0.2562255859375, 0.29340362548828125, 0.3305816650390625, 0.36775970458984375, 0.404937744140625, 0.44211578369140625, 0.4792938232421875, 0.5164718627929688, 0.55364990234375, 0.5908279418945312, 0.6280059814453125, 0.6651840209960938, 0.702362060546875, 0.7395401000976562, 0.7767181396484375, 0.8138961791992188, 0.85107421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 11.0, 20.0, 16.0, 18.0, 24.0, 28.0, 35.0, 44.0, 48.0, 71.0, 123.0, 137.0, 105.0, 48.0, 50.0, 37.0, 34.0, 23.0, 23.0, 22.0, 19.0, 13.0, 8.0, 11.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.00021397322416305542, -0.00020645558834075928, -0.00019893795251846313, -0.000191420316696167, -0.00018390268087387085, -0.0001763850450515747, -0.00016886740922927856, -0.00016134977340698242, -0.00015383213758468628, -0.00014631450176239014, -0.000138796865940094, -0.00013127923011779785, -0.0001237615942955017, -0.00011624395847320557, -0.00010872632265090942, -0.00010120868682861328, -9.369105100631714e-05, -8.6173415184021e-05, -7.865577936172485e-05, -7.113814353942871e-05, -6.362050771713257e-05, -5.6102871894836426e-05, -4.858523607254028e-05, -4.106760025024414e-05, -3.3549964427948e-05, -2.6032328605651855e-05, -1.8514692783355713e-05, -1.099705696105957e-05, -3.4794211387634277e-06, 4.038214683532715e-06, 1.1555850505828857e-05, 1.9073486328125e-05, 2.6591122150421143e-05, 3.4108757972717285e-05, 4.162639379501343e-05, 4.914402961730957e-05, 5.666166543960571e-05, 6.417930126190186e-05, 7.1696937084198e-05, 7.921457290649414e-05, 8.673220872879028e-05, 9.424984455108643e-05, 0.00010176748037338257, 0.00010928511619567871, 0.00011680275201797485, 0.000124320387840271, 0.00013183802366256714, 0.00013935565948486328, 0.00014687329530715942, 0.00015439093112945557, 0.0001619085669517517, 0.00016942620277404785, 0.000176943838596344, 0.00018446147441864014, 0.00019197911024093628, 0.00019949674606323242, 0.00020701438188552856, 0.0002145320177078247, 0.00022204965353012085, 0.000229567289352417, 0.00023708492517471313, 0.0002446025609970093, 0.0002521201968193054, 0.00025963783264160156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 9.0, 10.0, 20.0, 32.0, 49.0, 72.0, 131.0, 208.0, 348.0, 700.0, 1546.0, 4698.0, 25189.0, 286649.0, 660356.0, 56071.0, 8143.0, 2218.0, 971.0, 443.0, 240.0, 142.0, 99.0, 59.0, 31.0, 28.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.2458343505859375, -1.201629638671875, -1.1574249267578125, -1.11322021484375, -1.0690155029296875, -1.024810791015625, -0.9806060791015625, -0.9364013671875, -0.8921966552734375, -0.847991943359375, -0.8037872314453125, -0.75958251953125, -0.7153778076171875, -0.671173095703125, -0.6269683837890625, -0.582763671875, -0.5385589599609375, -0.494354248046875, -0.4501495361328125, -0.40594482421875, -0.3617401123046875, -0.317535400390625, -0.2733306884765625, -0.2291259765625, -0.1849212646484375, -0.140716552734375, -0.0965118408203125, -0.05230712890625, -0.0081024169921875, 0.036102294921875, 0.0803070068359375, 0.12451171875, 0.1687164306640625, 0.212921142578125, 0.2571258544921875, 0.30133056640625, 0.3455352783203125, 0.389739990234375, 0.4339447021484375, 0.4781494140625, 0.5223541259765625, 0.566558837890625, 0.6107635498046875, 0.65496826171875, 0.6991729736328125, 0.743377685546875, 0.7875823974609375, 0.831787109375, 0.8759918212890625, 0.920196533203125, 0.9644012451171875, 1.00860595703125, 1.0528106689453125, 1.097015380859375, 1.1412200927734375, 1.1854248046875, 1.2296295166015625, 1.273834228515625, 1.3180389404296875, 1.36224365234375, 1.4064483642578125, 1.450653076171875, 1.4948577880859375, 1.5390625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 8.0, 7.0, 11.0, 16.0, 17.0, 19.0, 21.0, 36.0, 54.0, 51.0, 73.0, 111.0, 94.0, 78.0, 93.0, 72.0, 65.0, 47.0, 37.0, 21.0, 21.0, 16.0, 9.0, 8.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2294921875, -1.194244384765625, -1.15899658203125, -1.123748779296875, -1.0885009765625, -1.053253173828125, -1.01800537109375, -0.982757568359375, -0.947509765625, -0.912261962890625, -0.87701416015625, -0.841766357421875, -0.8065185546875, -0.771270751953125, -0.73602294921875, -0.700775146484375, -0.66552734375, -0.630279541015625, -0.59503173828125, -0.559783935546875, -0.5245361328125, -0.489288330078125, -0.45404052734375, -0.418792724609375, -0.383544921875, -0.348297119140625, -0.31304931640625, -0.277801513671875, -0.2425537109375, -0.207305908203125, -0.17205810546875, -0.136810302734375, -0.1015625, -0.066314697265625, -0.03106689453125, 0.004180908203125, 0.0394287109375, 0.074676513671875, 0.10992431640625, 0.145172119140625, 0.180419921875, 0.215667724609375, 0.25091552734375, 0.286163330078125, 0.3214111328125, 0.356658935546875, 0.39190673828125, 0.427154541015625, 0.46240234375, 0.497650146484375, 0.53289794921875, 0.568145751953125, 0.6033935546875, 0.638641357421875, 0.67388916015625, 0.709136962890625, 0.744384765625, 0.779632568359375, 0.81488037109375, 0.850128173828125, 0.8853759765625, 0.920623779296875, 0.95587158203125, 0.991119384765625, 1.0263671875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 13.0, 17.0, 35.0, 69.0, 104.0, 148.0, 161.0, 170.0, 97.0, 75.0, 36.0, 24.0, 9.0, 12.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.929759979248047, -22.264568328857422, -21.59937858581543, -20.934186935424805, -20.26899528503418, -19.603803634643555, -18.938613891601562, -18.273422241210938, -17.608230590820312, -16.943038940429688, -16.277849197387695, -15.61265754699707, -14.947465896606445, -14.282275199890137, -13.617084503173828, -12.951892852783203, -12.286702156066895, -11.621511459350586, -10.956319808959961, -10.291129112243652, -9.625937461853027, -8.960746765136719, -8.295555114746094, -7.630364418029785, -6.965173244476318, -6.299982070922852, -5.634790897369385, -4.969599723815918, -4.304409027099609, -3.6392176151275635, -2.974026679992676, -2.308835506439209, -1.6436443328857422, -0.9784532189369202, -0.31326210498809814, 0.3519289493560791, 1.017120122909546, 1.6823112964630127, 2.3475022315979004, 3.012693405151367, 3.677884578704834, 4.343075752258301, 5.008266925811768, 5.673458099365234, 6.338648796081543, 7.003840446472168, 7.669031143188477, 8.334222793579102, 8.99941349029541, 9.664604187011719, 10.329795837402344, 10.994986534118652, 11.660178184509277, 12.325368881225586, 12.990560531616211, 13.65575122833252, 14.320941925048828, 14.986132621765137, 15.651324272155762, 16.31651496887207, 16.981706619262695, 17.64689826965332, 18.312088012695312, 18.977279663085938, 19.642471313476562]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 11.0, 13.0, 15.0, 26.0, 21.0, 23.0, 18.0, 32.0, 32.0, 38.0, 48.0, 33.0, 46.0, 46.0, 51.0, 55.0, 71.0, 47.0, 37.0, 45.0, 45.0, 33.0, 27.0, 24.0, 32.0, 23.0, 19.0, 18.0, 14.0, 5.0, 9.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-13.828222274780273, -13.415547370910645, -13.0028715133667, -12.59019660949707, -12.177520751953125, -11.764845848083496, -11.352170944213867, -10.939495086669922, -10.526819229125977, -10.114144325256348, -9.701468467712402, -9.288793563842773, -8.876117706298828, -8.4634428024292, -8.05076789855957, -7.638092041015625, -7.225417137145996, -6.812741756439209, -6.400066375732422, -5.987391471862793, -5.574715614318848, -5.162040710449219, -4.749365329742432, -4.3366899490356445, -3.9240145683288574, -3.5113391876220703, -3.098663806915283, -2.685988664627075, -2.273313283920288, -1.860637903213501, -1.447962760925293, -1.0352873802185059, -0.6226119995117188, -0.20993667840957642, 0.20273864269256592, 0.6154139041900635, 1.0280892848968506, 1.4407646656036377, 1.8534398078918457, 2.266115188598633, 2.67879056930542, 3.091465950012207, 3.504141330718994, 3.916816473007202, 4.32949161529541, 4.7421674728393555, 5.154842376708984, 5.5675177574157715, 5.980193138122559, 6.392868518829346, 6.805543899536133, 7.218218803405762, 7.630894660949707, 8.043569564819336, 8.456245422363281, 8.86892032623291, 9.281595230102539, 9.694270133972168, 10.106945991516113, 10.519620895385742, 10.932296752929688, 11.344971656799316, 11.757646560668945, 12.17032241821289, 12.582998275756836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 7.0, 8.0, 14.0, 14.0, 25.0, 47.0, 43.0, 70.0, 112.0, 133.0, 195.0, 260.0, 421.0, 598.0, 909.0, 1350.0, 1976.0, 3130.0, 5141.0, 8970.0, 16343.0, 33122.0, 77504.0, 235910.0, 1132262.0, 2054868.0, 410295.0, 115654.0, 45366.0, 21129.0, 11221.0, 6371.0, 3685.0, 2358.0, 1538.0, 1037.0, 675.0, 456.0, 293.0, 238.0, 150.0, 124.0, 83.0, 44.0, 41.0, 31.0, 18.0, 7.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.75537109375, -0.7319107055664062, -0.7084503173828125, -0.6849899291992188, -0.661529541015625, -0.6380691528320312, -0.6146087646484375, -0.5911483764648438, -0.56768798828125, -0.5442276000976562, -0.5207672119140625, -0.49730682373046875, -0.473846435546875, -0.45038604736328125, -0.4269256591796875, -0.40346527099609375, -0.3800048828125, -0.35654449462890625, -0.3330841064453125, -0.30962371826171875, -0.286163330078125, -0.26270294189453125, -0.2392425537109375, -0.21578216552734375, -0.19232177734375, -0.16886138916015625, -0.1454010009765625, -0.12194061279296875, -0.098480224609375, -0.07501983642578125, -0.0515594482421875, -0.02809906005859375, -0.004638671875, 0.01882171630859375, 0.0422821044921875, 0.06574249267578125, 0.089202880859375, 0.11266326904296875, 0.1361236572265625, 0.15958404541015625, 0.18304443359375, 0.20650482177734375, 0.2299652099609375, 0.25342559814453125, 0.276885986328125, 0.30034637451171875, 0.3238067626953125, 0.34726715087890625, 0.3707275390625, 0.39418792724609375, 0.4176483154296875, 0.44110870361328125, 0.464569091796875, 0.48802947998046875, 0.5114898681640625, 0.5349502563476562, 0.55841064453125, 0.5818710327148438, 0.6053314208984375, 0.6287918090820312, 0.652252197265625, 0.6757125854492188, 0.6991729736328125, 0.7226333618164062, 0.74609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 12.0, 14.0, 19.0, 29.0, 25.0, 59.0, 39.0, 48.0, 68.0, 65.0, 70.0, 74.0, 85.0, 69.0, 46.0, 59.0, 44.0, 35.0, 26.0, 26.0, 16.0, 12.0, 10.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330078125, -0.8062744140625, -0.779541015625, -0.7528076171875, -0.72607421875, -0.6993408203125, -0.672607421875, -0.6458740234375, -0.619140625, -0.5924072265625, -0.565673828125, -0.5389404296875, -0.51220703125, -0.4854736328125, -0.458740234375, -0.4320068359375, -0.4052734375, -0.3785400390625, -0.351806640625, -0.3250732421875, -0.29833984375, -0.2716064453125, -0.244873046875, -0.2181396484375, -0.19140625, -0.1646728515625, -0.137939453125, -0.1112060546875, -0.08447265625, -0.0577392578125, -0.031005859375, -0.0042724609375, 0.0224609375, 0.0491943359375, 0.075927734375, 0.1026611328125, 0.12939453125, 0.1561279296875, 0.182861328125, 0.2095947265625, 0.236328125, 0.2630615234375, 0.289794921875, 0.3165283203125, 0.34326171875, 0.3699951171875, 0.396728515625, 0.4234619140625, 0.4501953125, 0.4769287109375, 0.503662109375, 0.5303955078125, 0.55712890625, 0.5838623046875, 0.610595703125, 0.6373291015625, 0.6640625, 0.6907958984375, 0.717529296875, 0.7442626953125, 0.77099609375, 0.7977294921875, 0.824462890625, 0.8511962890625, 0.8779296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 8.0, 20.0, 21.0, 34.0, 56.0, 73.0, 116.0, 239.0, 468.0, 977.0, 2542.0, 7242.0, 27044.0, 148895.0, 2803044.0, 1091945.0, 84611.0, 18094.0, 5238.0, 1835.0, 813.0, 390.0, 193.0, 134.0, 71.0, 45.0, 34.0, 17.0, 23.0, 8.0, 8.0, 6.0, 9.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.816986083984375, -1.75994873046875, -1.702911376953125, -1.6458740234375, -1.588836669921875, -1.53179931640625, -1.474761962890625, -1.417724609375, -1.360687255859375, -1.30364990234375, -1.246612548828125, -1.1895751953125, -1.132537841796875, -1.07550048828125, -1.018463134765625, -0.96142578125, -0.904388427734375, -0.84735107421875, -0.790313720703125, -0.7332763671875, -0.676239013671875, -0.61920166015625, -0.562164306640625, -0.505126953125, -0.448089599609375, -0.39105224609375, -0.334014892578125, -0.2769775390625, -0.219940185546875, -0.16290283203125, -0.105865478515625, -0.048828125, 0.008209228515625, 0.06524658203125, 0.122283935546875, 0.1793212890625, 0.236358642578125, 0.29339599609375, 0.350433349609375, 0.407470703125, 0.464508056640625, 0.52154541015625, 0.578582763671875, 0.6356201171875, 0.692657470703125, 0.74969482421875, 0.806732177734375, 0.86376953125, 0.920806884765625, 0.97784423828125, 1.034881591796875, 1.0919189453125, 1.148956298828125, 1.20599365234375, 1.263031005859375, 1.320068359375, 1.377105712890625, 1.43414306640625, 1.491180419921875, 1.5482177734375, 1.605255126953125, 1.66229248046875, 1.719329833984375, 1.7763671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 1.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 18.0, 16.0, 26.0, 47.0, 56.0, 85.0, 132.0, 197.0, 341.0, 632.0, 879.0, 634.0, 333.0, 218.0, 134.0, 84.0, 48.0, 38.0, 26.0, 20.0, 14.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4012908935546875, -1.348480224609375, -1.2956695556640625, -1.24285888671875, -1.1900482177734375, -1.137237548828125, -1.0844268798828125, -1.0316162109375, -0.9788055419921875, -0.925994873046875, -0.8731842041015625, -0.82037353515625, -0.7675628662109375, -0.714752197265625, -0.6619415283203125, -0.609130859375, -0.5563201904296875, -0.503509521484375, -0.4506988525390625, -0.39788818359375, -0.3450775146484375, -0.292266845703125, -0.2394561767578125, -0.1866455078125, -0.1338348388671875, -0.081024169921875, -0.0282135009765625, 0.02459716796875, 0.0774078369140625, 0.130218505859375, 0.1830291748046875, 0.23583984375, 0.2886505126953125, 0.341461181640625, 0.3942718505859375, 0.44708251953125, 0.4998931884765625, 0.552703857421875, 0.6055145263671875, 0.6583251953125, 0.7111358642578125, 0.763946533203125, 0.8167572021484375, 0.86956787109375, 0.9223785400390625, 0.975189208984375, 1.0279998779296875, 1.080810546875, 1.1336212158203125, 1.186431884765625, 1.2392425537109375, 1.29205322265625, 1.3448638916015625, 1.397674560546875, 1.4504852294921875, 1.5032958984375, 1.5561065673828125, 1.608917236328125, 1.6617279052734375, 1.71453857421875, 1.7673492431640625, 1.820159912109375, 1.8729705810546875, 1.92578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 5.0, 13.0, 36.0, 108.0, 235.0, 286.0, 178.0, 70.0, 26.0, 15.0, 9.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.974903106689453, -10.144695281982422, -9.314488410949707, -8.484281539916992, -7.654073715209961, -6.823866367340088, -5.993659019470215, -5.163451671600342, -4.333244323730469, -3.5030369758605957, -2.6728296279907227, -1.8426222801208496, -1.0124149322509766, -0.18220758438110352, 0.6479997634887695, 1.4782071113586426, 2.3084144592285156, 3.1386218070983887, 3.9688291549682617, 4.799036502838135, 5.629243850708008, 6.459451198577881, 7.289658546447754, 8.119865417480469, 8.9500732421875, 9.780281066894531, 10.610487937927246, 11.440694808959961, 12.270902633666992, 13.101110458374023, 13.931317329406738, 14.761524200439453, 15.591732025146484, 16.421939849853516, 17.252147674560547, 18.082353591918945, 18.912561416625977, 19.742769241333008, 20.572975158691406, 21.403182983398438, 22.23339080810547, 23.0635986328125, 23.89380645751953, 24.72401237487793, 25.55422019958496, 26.384428024291992, 27.21463394165039, 28.044841766357422, 28.875049591064453, 29.705257415771484, 30.535465240478516, 31.365671157836914, 32.19587707519531, 33.026084899902344, 33.856292724609375, 34.686500549316406, 35.51670837402344, 36.34691619873047, 37.1771240234375, 38.00733184814453, 38.83753967285156, 39.66774368286133, 40.49795150756836, 41.32815933227539, 42.15836715698242]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 10.0, 14.0, 12.0, 17.0, 19.0, 21.0, 19.0, 27.0, 19.0, 32.0, 45.0, 39.0, 47.0, 47.0, 50.0, 42.0, 36.0, 49.0, 56.0, 46.0, 35.0, 41.0, 42.0, 29.0, 32.0, 30.0, 27.0, 17.0, 17.0, 17.0, 13.0, 13.0, 13.0, 4.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.859951972961426, -6.618941783905029, -6.377931594848633, -6.136921405792236, -5.89591121673584, -5.654901504516602, -5.413890838623047, -5.172881126403809, -4.931870937347412, -4.690860748291016, -4.449850559234619, -4.208840370178223, -3.9678304195404053, -3.726820230484009, -3.4858100414276123, -3.244800090789795, -3.0037896633148193, -2.762779474258423, -2.5217692852020264, -2.280759334564209, -2.0397491455078125, -1.798738956451416, -1.5577287673950195, -1.3167186975479126, -1.0757085084915161, -0.8346983790397644, -0.5936882495880127, -0.3526780605316162, -0.1116679310798645, 0.1293421983718872, 0.3703523874282837, 0.6113624572753906, 0.8523726463317871, 1.0933828353881836, 1.3343929052352905, 1.575403094291687, 1.816413164138794, 2.0574233531951904, 2.298433542251587, 2.5394434928894043, 2.780453681945801, 3.0214638710021973, 3.2624740600585938, 3.5034842491149902, 3.7444941997528076, 3.985504388809204, 4.22651481628418, 4.467524528503418, 4.708535194396973, 4.949545383453369, 5.190555572509766, 5.431565761566162, 5.672575950622559, 5.913585662841797, 6.154596328735352, 6.39560604095459, 6.636616230010986, 6.877626419067383, 7.118636608123779, 7.359646797180176, 7.600656986236572, 7.841667175292969, 8.082676887512207, 8.323687553405762, 8.564697265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 1.0, 7.0, 13.0, 18.0, 53.0, 52.0, 112.0, 205.0, 344.0, 597.0, 1215.0, 2679.0, 6001.0, 14944.0, 41770.0, 144947.0, 549599.0, 201530.0, 52833.0, 18195.0, 7321.0, 2965.0, 1435.0, 765.0, 393.0, 215.0, 128.0, 72.0, 45.0, 34.0, 21.0, 17.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4708709716796875, -1.413421630859375, -1.3559722900390625, -1.29852294921875, -1.2410736083984375, -1.183624267578125, -1.1261749267578125, -1.0687255859375, -1.0112762451171875, -0.953826904296875, -0.8963775634765625, -0.83892822265625, -0.7814788818359375, -0.724029541015625, -0.6665802001953125, -0.609130859375, -0.5516815185546875, -0.494232177734375, -0.4367828369140625, -0.37933349609375, -0.3218841552734375, -0.264434814453125, -0.2069854736328125, -0.1495361328125, -0.0920867919921875, -0.034637451171875, 0.0228118896484375, 0.08026123046875, 0.1377105712890625, 0.195159912109375, 0.2526092529296875, 0.31005859375, 0.3675079345703125, 0.424957275390625, 0.4824066162109375, 0.53985595703125, 0.5973052978515625, 0.654754638671875, 0.7122039794921875, 0.7696533203125, 0.8271026611328125, 0.884552001953125, 0.9420013427734375, 0.99945068359375, 1.0569000244140625, 1.114349365234375, 1.1717987060546875, 1.229248046875, 1.2866973876953125, 1.344146728515625, 1.4015960693359375, 1.45904541015625, 1.5164947509765625, 1.573944091796875, 1.6313934326171875, 1.6888427734375, 1.7462921142578125, 1.803741455078125, 1.8611907958984375, 1.91864013671875, 1.9760894775390625, 2.033538818359375, 2.0909881591796875, 2.1484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 9.0, 10.0, 10.0, 22.0, 15.0, 21.0, 22.0, 33.0, 34.0, 30.0, 44.0, 37.0, 33.0, 62.0, 49.0, 52.0, 46.0, 42.0, 55.0, 52.0, 47.0, 40.0, 32.0, 28.0, 28.0, 25.0, 13.0, 17.0, 15.0, 18.0, 10.0, 13.0, 5.0, 5.0, 3.0, 2.0, 3.0, 7.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67724609375, -0.6573562622070312, -0.6374664306640625, -0.6175765991210938, -0.597686767578125, -0.5777969360351562, -0.5579071044921875, -0.5380172729492188, -0.51812744140625, -0.49823760986328125, -0.4783477783203125, -0.45845794677734375, -0.438568115234375, -0.41867828369140625, -0.3987884521484375, -0.37889862060546875, -0.3590087890625, -0.33911895751953125, -0.3192291259765625, -0.29933929443359375, -0.279449462890625, -0.25955963134765625, -0.2396697998046875, -0.21977996826171875, -0.19989013671875, -0.18000030517578125, -0.1601104736328125, -0.14022064208984375, -0.120330810546875, -0.10044097900390625, -0.0805511474609375, -0.06066131591796875, -0.040771484375, -0.02088165283203125, -0.0009918212890625, 0.01889801025390625, 0.038787841796875, 0.05867767333984375, 0.0785675048828125, 0.09845733642578125, 0.11834716796875, 0.13823699951171875, 0.1581268310546875, 0.17801666259765625, 0.197906494140625, 0.21779632568359375, 0.2376861572265625, 0.25757598876953125, 0.2774658203125, 0.29735565185546875, 0.3172454833984375, 0.33713531494140625, 0.357025146484375, 0.37691497802734375, 0.3968048095703125, 0.41669464111328125, 0.43658447265625, 0.45647430419921875, 0.4763641357421875, 0.49625396728515625, 0.516143798828125, 0.5360336303710938, 0.5559234619140625, 0.5758132934570312, 0.595703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 6.0, 13.0, 19.0, 20.0, 36.0, 57.0, 118.0, 208.0, 466.0, 1408.0, 7093.0, 552672.0, 477241.0, 6860.0, 1326.0, 479.0, 213.0, 112.0, 66.0, 30.0, 27.0, 14.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.628173828125, -7.39697265625, -7.165771484375, -6.9345703125, -6.703369140625, -6.47216796875, -6.240966796875, -6.009765625, -5.778564453125, -5.54736328125, -5.316162109375, -5.0849609375, -4.853759765625, -4.62255859375, -4.391357421875, -4.16015625, -3.928955078125, -3.69775390625, -3.466552734375, -3.2353515625, -3.004150390625, -2.77294921875, -2.541748046875, -2.310546875, -2.079345703125, -1.84814453125, -1.616943359375, -1.3857421875, -1.154541015625, -0.92333984375, -0.692138671875, -0.4609375, -0.229736328125, 0.00146484375, 0.232666015625, 0.4638671875, 0.695068359375, 0.92626953125, 1.157470703125, 1.388671875, 1.619873046875, 1.85107421875, 2.082275390625, 2.3134765625, 2.544677734375, 2.77587890625, 3.007080078125, 3.23828125, 3.469482421875, 3.70068359375, 3.931884765625, 4.1630859375, 4.394287109375, 4.62548828125, 4.856689453125, 5.087890625, 5.319091796875, 5.55029296875, 5.781494140625, 6.0126953125, 6.243896484375, 6.47509765625, 6.706298828125, 6.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 4.0, 7.0, 11.0, 9.0, 12.0, 17.0, 20.0, 24.0, 35.0, 29.0, 35.0, 41.0, 47.0, 33.0, 50.0, 74.0, 54.0, 60.0, 56.0, 46.0, 59.0, 35.0, 31.0, 28.0, 38.0, 31.0, 23.0, 24.0, 17.0, 8.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.80859375, -3.7078857421875, -3.607177734375, -3.5064697265625, -3.40576171875, -3.3050537109375, -3.204345703125, -3.1036376953125, -3.0029296875, -2.9022216796875, -2.801513671875, -2.7008056640625, -2.60009765625, -2.4993896484375, -2.398681640625, -2.2979736328125, -2.197265625, -2.0965576171875, -1.995849609375, -1.8951416015625, -1.79443359375, -1.6937255859375, -1.593017578125, -1.4923095703125, -1.3916015625, -1.2908935546875, -1.190185546875, -1.0894775390625, -0.98876953125, -0.8880615234375, -0.787353515625, -0.6866455078125, -0.5859375, -0.4852294921875, -0.384521484375, -0.2838134765625, -0.18310546875, -0.0823974609375, 0.018310546875, 0.1190185546875, 0.2197265625, 0.3204345703125, 0.421142578125, 0.5218505859375, 0.62255859375, 0.7232666015625, 0.823974609375, 0.9246826171875, 1.025390625, 1.1260986328125, 1.226806640625, 1.3275146484375, 1.42822265625, 1.5289306640625, 1.629638671875, 1.7303466796875, 1.8310546875, 1.9317626953125, 2.032470703125, 2.1331787109375, 2.23388671875, 2.3345947265625, 2.435302734375, 2.5360107421875, 2.63671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 5.0, 10.0, 7.0, 21.0, 27.0, 46.0, 69.0, 146.0, 340.0, 1105.0, 4832.0, 49834.0, 908080.0, 75512.0, 6416.0, 1283.0, 401.0, 183.0, 92.0, 41.0, 25.0, 28.0, 13.0, 6.0, 10.0, 6.0, 3.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.91015625, -2.83660888671875, -2.7630615234375, -2.68951416015625, -2.615966796875, -2.54241943359375, -2.4688720703125, -2.39532470703125, -2.32177734375, -2.24822998046875, -2.1746826171875, -2.10113525390625, -2.027587890625, -1.95404052734375, -1.8804931640625, -1.80694580078125, -1.7333984375, -1.65985107421875, -1.5863037109375, -1.51275634765625, -1.439208984375, -1.36566162109375, -1.2921142578125, -1.21856689453125, -1.14501953125, -1.07147216796875, -0.9979248046875, -0.92437744140625, -0.850830078125, -0.77728271484375, -0.7037353515625, -0.63018798828125, -0.556640625, -0.48309326171875, -0.4095458984375, -0.33599853515625, -0.262451171875, -0.18890380859375, -0.1153564453125, -0.04180908203125, 0.03173828125, 0.10528564453125, 0.1788330078125, 0.25238037109375, 0.325927734375, 0.39947509765625, 0.4730224609375, 0.54656982421875, 0.6201171875, 0.69366455078125, 0.7672119140625, 0.84075927734375, 0.914306640625, 0.98785400390625, 1.0614013671875, 1.13494873046875, 1.20849609375, 1.28204345703125, 1.3555908203125, 1.42913818359375, 1.502685546875, 1.57623291015625, 1.6497802734375, 1.72332763671875, 1.796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 11.0, 6.0, 11.0, 23.0, 20.0, 44.0, 63.0, 121.0, 315.0, 172.0, 64.0, 39.0, 41.0, 28.0, 16.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004794597625732422, -0.0004647783935070038, -0.0004500970244407654, -0.000435415655374527, -0.0004207342863082886, -0.00040605291724205017, -0.00039137154817581177, -0.00037669017910957336, -0.00036200881004333496, -0.00034732744097709656, -0.00033264607191085815, -0.00031796470284461975, -0.00030328333377838135, -0.00028860196471214294, -0.00027392059564590454, -0.00025923922657966614, -0.00024455785751342773, -0.00022987648844718933, -0.00021519511938095093, -0.00020051375031471252, -0.00018583238124847412, -0.00017115101218223572, -0.00015646964311599731, -0.0001417882740497589, -0.0001271069049835205, -0.0001124255359172821, -9.77441668510437e-05, -8.30627977848053e-05, -6.83814287185669e-05, -5.370005965232849e-05, -3.901869058609009e-05, -2.4337321519851685e-05, -9.655952453613281e-06, 5.025416612625122e-06, 1.9706785678863525e-05, 3.438815474510193e-05, 4.906952381134033e-05, 6.375089287757874e-05, 7.843226194381714e-05, 9.311363101005554e-05, 0.00010779500007629395, 0.00012247636914253235, 0.00013715773820877075, 0.00015183910727500916, 0.00016652047634124756, 0.00018120184540748596, 0.00019588321447372437, 0.00021056458353996277, 0.00022524595260620117, 0.00023992732167243958, 0.000254608690738678, 0.0002692900598049164, 0.0002839714288711548, 0.0002986527979373932, 0.0003133341670036316, 0.00032801553606987, 0.0003426969051361084, 0.0003573782742023468, 0.0003720596432685852, 0.0003867410123348236, 0.000401422381401062, 0.0004161037504673004, 0.0004307851195335388, 0.0004454664885997772, 0.0004601478576660156]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 14.0, 8.0, 21.0, 27.0, 24.0, 51.0, 83.0, 105.0, 216.0, 390.0, 801.0, 1993.0, 6864.0, 42237.0, 722885.0, 245059.0, 20395.0, 4396.0, 1517.0, 617.0, 327.0, 197.0, 96.0, 65.0, 45.0, 39.0, 18.0, 13.0, 14.0, 6.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5986328125, -1.54840087890625, -1.4981689453125, -1.44793701171875, -1.397705078125, -1.34747314453125, -1.2972412109375, -1.24700927734375, -1.19677734375, -1.14654541015625, -1.0963134765625, -1.04608154296875, -0.995849609375, -0.94561767578125, -0.8953857421875, -0.84515380859375, -0.794921875, -0.74468994140625, -0.6944580078125, -0.64422607421875, -0.593994140625, -0.54376220703125, -0.4935302734375, -0.44329833984375, -0.39306640625, -0.34283447265625, -0.2926025390625, -0.24237060546875, -0.192138671875, -0.14190673828125, -0.0916748046875, -0.04144287109375, 0.0087890625, 0.05902099609375, 0.1092529296875, 0.15948486328125, 0.209716796875, 0.25994873046875, 0.3101806640625, 0.36041259765625, 0.41064453125, 0.46087646484375, 0.5111083984375, 0.56134033203125, 0.611572265625, 0.66180419921875, 0.7120361328125, 0.76226806640625, 0.8125, 0.86273193359375, 0.9129638671875, 0.96319580078125, 1.013427734375, 1.06365966796875, 1.1138916015625, 1.16412353515625, 1.21435546875, 1.26458740234375, 1.3148193359375, 1.36505126953125, 1.415283203125, 1.46551513671875, 1.5157470703125, 1.56597900390625, 1.6162109375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 4.0, 3.0, 10.0, 14.0, 23.0, 34.0, 33.0, 53.0, 55.0, 90.0, 132.0, 144.0, 105.0, 81.0, 56.0, 36.0, 33.0, 21.0, 9.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2060699462890625, -1.163116455078125, -1.1201629638671875, -1.07720947265625, -1.0342559814453125, -0.991302490234375, -0.9483489990234375, -0.9053955078125, -0.8624420166015625, -0.819488525390625, -0.7765350341796875, -0.73358154296875, -0.6906280517578125, -0.647674560546875, -0.6047210693359375, -0.561767578125, -0.5188140869140625, -0.475860595703125, -0.4329071044921875, -0.38995361328125, -0.3470001220703125, -0.304046630859375, -0.2610931396484375, -0.2181396484375, -0.1751861572265625, -0.132232666015625, -0.0892791748046875, -0.04632568359375, -0.0033721923828125, 0.039581298828125, 0.0825347900390625, 0.12548828125, 0.1684417724609375, 0.211395263671875, 0.2543487548828125, 0.29730224609375, 0.3402557373046875, 0.383209228515625, 0.4261627197265625, 0.4691162109375, 0.5120697021484375, 0.555023193359375, 0.5979766845703125, 0.64093017578125, 0.6838836669921875, 0.726837158203125, 0.7697906494140625, 0.812744140625, 0.8556976318359375, 0.898651123046875, 0.9416046142578125, 0.98455810546875, 1.0275115966796875, 1.070465087890625, 1.1134185791015625, 1.1563720703125, 1.1993255615234375, 1.242279052734375, 1.2852325439453125, 1.32818603515625, 1.3711395263671875, 1.414093017578125, 1.4570465087890625, 1.5]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 2.0, 5.0, 19.0, 37.0, 62.0, 146.0, 232.0, 195.0, 150.0, 68.0, 31.0, 14.0, 7.0, 10.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.755178451538086, -13.96750545501709, -13.17983341217041, -12.392160415649414, -11.604488372802734, -10.816815376281738, -10.029142379760742, -9.241470336914062, -8.453797340393066, -7.6661248207092285, -6.878452301025391, -6.0907793045043945, -5.303106784820557, -4.515434265136719, -3.7277612686157227, -2.9400887489318848, -2.152416229248047, -1.3647435903549194, -0.577070951461792, 0.210601806640625, 0.9982743263244629, 1.7859468460083008, 2.573619842529297, 3.3612923622131348, 4.148964881896973, 4.9366374015808105, 5.724309921264648, 6.5119829177856445, 7.299655437469482, 8.08732795715332, 8.875000953674316, 9.662673950195312, 10.45034408569336, 11.238017082214355, 12.025689125061035, 12.813362121582031, 13.601034164428711, 14.388707160949707, 15.176380157470703, 15.964052200317383, 16.751724243164062, 17.539396286010742, 18.327070236206055, 19.114742279052734, 19.902414321899414, 20.690086364746094, 21.477760314941406, 22.265432357788086, 23.0531063079834, 23.840778350830078, 24.62845230102539, 25.41612434387207, 26.20379638671875, 26.991470336914062, 27.779142379760742, 28.566814422607422, 29.354488372802734, 30.142160415649414, 30.929834365844727, 31.717506408691406, 32.50518035888672, 33.292850494384766, 34.08052444458008, 34.86819839477539, 35.65586853027344]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 9.0, 13.0, 14.0, 9.0, 22.0, 25.0, 27.0, 28.0, 41.0, 29.0, 39.0, 47.0, 36.0, 53.0, 57.0, 67.0, 51.0, 55.0, 44.0, 45.0, 43.0, 33.0, 22.0, 28.0, 20.0, 22.0, 22.0, 16.0, 13.0, 16.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.940229415893555, -11.576400756835938, -11.21257209777832, -10.848743438720703, -10.484914779663086, -10.121086120605469, -9.757257461547852, -9.393428802490234, -9.029600143432617, -8.665771484375, -8.301942825317383, -7.938114166259766, -7.574285507202148, -7.210456848144531, -6.846628189086914, -6.482799530029297, -6.118971347808838, -5.755142688751221, -5.3913140296936035, -5.027485370635986, -4.663656711578369, -4.299828052520752, -3.935999631881714, -3.5721709728240967, -3.2083423137664795, -2.8445136547088623, -2.480684995651245, -2.116856575012207, -1.7530277967453003, -1.389199137687683, -1.0253705978393555, -0.6615419387817383, -0.2977132797241211, 0.0661153495311737, 0.4299439787864685, 0.7937725782394409, 1.157601237297058, 1.5214298963546753, 1.885258436203003, 2.24908709526062, 2.6129157543182373, 2.9767444133758545, 3.3405730724334717, 3.7044014930725098, 4.068230152130127, 4.432058811187744, 4.795887470245361, 5.1597161293029785, 5.523544788360596, 5.887373447418213, 6.25120210647583, 6.615030765533447, 6.9788594245910645, 7.342688083648682, 7.706516265869141, 8.070344924926758, 8.434173583984375, 8.798002243041992, 9.16183090209961, 9.525659561157227, 9.889488220214844, 10.253316879272461, 10.617145538330078, 10.980974197387695, 11.344802856445312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 9.0, 13.0, 14.0, 28.0, 47.0, 52.0, 104.0, 226.0, 818.0, 22559.0, 4139402.0, 29655.0, 869.0, 209.0, 100.0, 48.0, 45.0, 28.0, 18.0, 16.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.9129638671875, -4.712646484375, -4.5123291015625, -4.31201171875, -4.1116943359375, -3.911376953125, -3.7110595703125, -3.5107421875, -3.3104248046875, -3.110107421875, -2.9097900390625, -2.70947265625, -2.5091552734375, -2.308837890625, -2.1085205078125, -1.908203125, -1.7078857421875, -1.507568359375, -1.3072509765625, -1.10693359375, -0.9066162109375, -0.706298828125, -0.5059814453125, -0.3056640625, -0.1053466796875, 0.094970703125, 0.2952880859375, 0.49560546875, 0.6959228515625, 0.896240234375, 1.0965576171875, 1.296875, 1.4971923828125, 1.697509765625, 1.8978271484375, 2.09814453125, 2.2984619140625, 2.498779296875, 2.6990966796875, 2.8994140625, 3.0997314453125, 3.300048828125, 3.5003662109375, 3.70068359375, 3.9010009765625, 4.101318359375, 4.3016357421875, 4.501953125, 4.7022705078125, 4.902587890625, 5.1029052734375, 5.30322265625, 5.5035400390625, 5.703857421875, 5.9041748046875, 6.1044921875, 6.3048095703125, 6.505126953125, 6.7054443359375, 6.90576171875, 7.1060791015625, 7.306396484375, 7.5067138671875, 7.70703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 12.0, 14.0, 20.0, 18.0, 27.0, 35.0, 29.0, 51.0, 53.0, 58.0, 65.0, 77.0, 74.0, 77.0, 64.0, 67.0, 52.0, 50.0, 30.0, 32.0, 25.0, 17.0, 12.0, 14.0, 11.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1552734375, -1.12725830078125, -1.0992431640625, -1.07122802734375, -1.043212890625, -1.01519775390625, -0.9871826171875, -0.95916748046875, -0.93115234375, -0.90313720703125, -0.8751220703125, -0.84710693359375, -0.819091796875, -0.79107666015625, -0.7630615234375, -0.73504638671875, -0.70703125, -0.67901611328125, -0.6510009765625, -0.62298583984375, -0.594970703125, -0.56695556640625, -0.5389404296875, -0.51092529296875, -0.48291015625, -0.45489501953125, -0.4268798828125, -0.39886474609375, -0.370849609375, -0.34283447265625, -0.3148193359375, -0.28680419921875, -0.2587890625, -0.23077392578125, -0.2027587890625, -0.17474365234375, -0.146728515625, -0.11871337890625, -0.0906982421875, -0.06268310546875, -0.03466796875, -0.00665283203125, 0.0213623046875, 0.04937744140625, 0.077392578125, 0.10540771484375, 0.1334228515625, 0.16143798828125, 0.189453125, 0.21746826171875, 0.2454833984375, 0.27349853515625, 0.301513671875, 0.32952880859375, 0.3575439453125, 0.38555908203125, 0.41357421875, 0.44158935546875, 0.4696044921875, 0.49761962890625, 0.525634765625, 0.55364990234375, 0.5816650390625, 0.60968017578125, 0.6376953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 3.0, 10.0, 13.0, 19.0, 15.0, 40.0, 37.0, 77.0, 117.0, 145.0, 268.0, 511.0, 908.0, 1694.0, 3597.0, 8757.0, 22782.0, 74264.0, 418929.0, 2938698.0, 590646.0, 90557.0, 25883.0, 9273.0, 3692.0, 1576.0, 756.0, 419.0, 222.0, 121.0, 76.0, 43.0, 40.0, 25.0, 17.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4501953125, -1.4082489013671875, -1.366302490234375, -1.3243560791015625, -1.28240966796875, -1.2404632568359375, -1.198516845703125, -1.1565704345703125, -1.1146240234375, -1.0726776123046875, -1.030731201171875, -0.9887847900390625, -0.94683837890625, -0.9048919677734375, -0.862945556640625, -0.8209991455078125, -0.779052734375, -0.7371063232421875, -0.695159912109375, -0.6532135009765625, -0.61126708984375, -0.5693206787109375, -0.527374267578125, -0.4854278564453125, -0.4434814453125, -0.4015350341796875, -0.359588623046875, -0.3176422119140625, -0.27569580078125, -0.2337493896484375, -0.191802978515625, -0.1498565673828125, -0.10791015625, -0.0659637451171875, -0.024017333984375, 0.0179290771484375, 0.05987548828125, 0.1018218994140625, 0.143768310546875, 0.1857147216796875, 0.2276611328125, 0.2696075439453125, 0.311553955078125, 0.3535003662109375, 0.39544677734375, 0.4373931884765625, 0.479339599609375, 0.5212860107421875, 0.563232421875, 0.6051788330078125, 0.647125244140625, 0.6890716552734375, 0.73101806640625, 0.7729644775390625, 0.814910888671875, 0.8568572998046875, 0.8988037109375, 0.9407501220703125, 0.982696533203125, 1.0246429443359375, 1.06658935546875, 1.1085357666015625, 1.150482177734375, 1.1924285888671875, 1.234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 13.0, 5.0, 12.0, 15.0, 22.0, 28.0, 47.0, 62.0, 85.0, 138.0, 241.0, 412.0, 695.0, 801.0, 590.0, 309.0, 185.0, 120.0, 79.0, 40.0, 42.0, 23.0, 20.0, 18.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.9755859375, -1.9277496337890625, -1.879913330078125, -1.8320770263671875, -1.78424072265625, -1.7364044189453125, -1.688568115234375, -1.6407318115234375, -1.5928955078125, -1.5450592041015625, -1.497222900390625, -1.4493865966796875, -1.40155029296875, -1.3537139892578125, -1.305877685546875, -1.2580413818359375, -1.210205078125, -1.1623687744140625, -1.114532470703125, -1.0666961669921875, -1.01885986328125, -0.9710235595703125, -0.923187255859375, -0.8753509521484375, -0.8275146484375, -0.7796783447265625, -0.731842041015625, -0.6840057373046875, -0.63616943359375, -0.5883331298828125, -0.540496826171875, -0.4926605224609375, -0.44482421875, -0.3969879150390625, -0.349151611328125, -0.3013153076171875, -0.25347900390625, -0.2056427001953125, -0.157806396484375, -0.1099700927734375, -0.0621337890625, -0.0142974853515625, 0.033538818359375, 0.0813751220703125, 0.12921142578125, 0.1770477294921875, 0.224884033203125, 0.2727203369140625, 0.320556640625, 0.3683929443359375, 0.416229248046875, 0.4640655517578125, 0.51190185546875, 0.5597381591796875, 0.607574462890625, 0.6554107666015625, 0.7032470703125, 0.7510833740234375, 0.798919677734375, 0.8467559814453125, 0.89459228515625, 0.9424285888671875, 0.990264892578125, 1.0381011962890625, 1.0859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 15.0, 51.0, 84.0, 193.0, 232.0, 191.0, 109.0, 57.0, 16.0, 6.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.047576904296875, -15.441932678222656, -14.836287498474121, -14.230642318725586, -13.624998092651367, -13.019353866577148, -12.413708686828613, -11.808063507080078, -11.20241928100586, -10.59677505493164, -9.991129875183105, -9.38548469543457, -8.779840469360352, -8.174196243286133, -7.568551063537598, -6.962906360626221, -6.357261657714844, -5.751616954803467, -5.14597225189209, -4.540327548980713, -3.934682846069336, -3.329038143157959, -2.723393440246582, -2.117748737335205, -1.5121040344238281, -0.9064593315124512, -0.3008146286010742, 0.30483007431030273, 0.9104747772216797, 1.5161194801330566, 2.1217641830444336, 2.7274088859558105, 3.3330535888671875, 3.9386982917785645, 4.544342994689941, 5.149987697601318, 5.755632400512695, 6.361277103424072, 6.966921806335449, 7.572566509246826, 8.178211212158203, 8.783855438232422, 9.389500617980957, 9.995145797729492, 10.600790023803711, 11.20643424987793, 11.812079429626465, 12.417724609375, 13.023368835449219, 13.629013061523438, 14.234658241271973, 14.840303421020508, 15.445947647094727, 16.051591873168945, 16.657238006591797, 17.262882232666016, 17.868526458740234, 18.474170684814453, 19.079814910888672, 19.685461044311523, 20.291105270385742, 20.89674949645996, 21.502395629882812, 22.10803985595703, 22.71368408203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 13.0, 8.0, 10.0, 15.0, 11.0, 17.0, 19.0, 28.0, 43.0, 33.0, 52.0, 35.0, 45.0, 48.0, 62.0, 66.0, 49.0, 56.0, 57.0, 34.0, 47.0, 43.0, 35.0, 30.0, 22.0, 26.0, 28.0, 14.0, 14.0, 16.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.916929244995117, -10.637404441833496, -10.357879638671875, -10.078353881835938, -9.798829078674316, -9.519304275512695, -9.239779472351074, -8.960254669189453, -8.680729866027832, -8.401205062866211, -8.12168025970459, -7.8421549797058105, -7.5626301765441895, -7.28310489654541, -7.003580093383789, -6.724055290222168, -6.444530010223389, -6.165005207061768, -5.885479927062988, -5.605955123901367, -5.326430320739746, -5.046905517578125, -4.767380237579346, -4.487855434417725, -4.208330154418945, -3.928805112838745, -3.649280309677124, -3.369755268096924, -3.0902304649353027, -2.8107054233551025, -2.5311803817749023, -2.2516555786132812, -1.9721307754516602, -1.6926058530807495, -1.4130809307098389, -1.1335558891296387, -0.854030966758728, -0.5745060443878174, -0.2949810028076172, -0.015456080436706543, 0.2640688419342041, 0.5435937643051147, 0.8231187462806702, 1.1026437282562256, 1.3821686506271362, 1.6616935729980469, 1.941218614578247, 2.2207436561584473, 2.5002684593200684, 2.7797935009002686, 3.0593183040618896, 3.33884334564209, 3.618368148803711, 3.897893190383911, 4.177418231964111, 4.456943035125732, 4.736468315124512, 5.015993118286133, 5.295518398284912, 5.575043201446533, 5.854568004608154, 6.134093284606934, 6.413618087768555, 6.693142890930176, 6.972667694091797]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 8.0, 3.0, 10.0, 10.0, 13.0, 9.0, 20.0, 30.0, 37.0, 65.0, 74.0, 121.0, 201.0, 320.0, 504.0, 778.0, 1467.0, 2499.0, 5045.0, 10663.0, 25166.0, 70875.0, 283482.0, 460373.0, 119792.0, 37640.0, 14904.0, 6586.0, 3332.0, 1781.0, 1048.0, 580.0, 340.0, 248.0, 144.0, 112.0, 82.0, 54.0, 40.0, 27.0, 25.0, 14.0, 8.0, 5.0, 10.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2138671875, -1.16925048828125, -1.1246337890625, -1.08001708984375, -1.035400390625, -0.99078369140625, -0.9461669921875, -0.90155029296875, -0.85693359375, -0.81231689453125, -0.7677001953125, -0.72308349609375, -0.678466796875, -0.63385009765625, -0.5892333984375, -0.54461669921875, -0.5, -0.45538330078125, -0.4107666015625, -0.36614990234375, -0.321533203125, -0.27691650390625, -0.2322998046875, -0.18768310546875, -0.14306640625, -0.09844970703125, -0.0538330078125, -0.00921630859375, 0.035400390625, 0.08001708984375, 0.1246337890625, 0.16925048828125, 0.2138671875, 0.25848388671875, 0.3031005859375, 0.34771728515625, 0.392333984375, 0.43695068359375, 0.4815673828125, 0.52618408203125, 0.57080078125, 0.61541748046875, 0.6600341796875, 0.70465087890625, 0.749267578125, 0.79388427734375, 0.8385009765625, 0.88311767578125, 0.927734375, 0.97235107421875, 1.0169677734375, 1.06158447265625, 1.106201171875, 1.15081787109375, 1.1954345703125, 1.24005126953125, 1.28466796875, 1.32928466796875, 1.3739013671875, 1.41851806640625, 1.463134765625, 1.50775146484375, 1.5523681640625, 1.59698486328125, 1.6416015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 12.0, 10.0, 17.0, 18.0, 19.0, 24.0, 31.0, 38.0, 37.0, 47.0, 46.0, 64.0, 63.0, 54.0, 72.0, 52.0, 64.0, 64.0, 46.0, 44.0, 28.0, 37.0, 21.0, 20.0, 14.0, 12.0, 13.0, 11.0, 5.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.98583984375, -0.9606170654296875, -0.935394287109375, -0.9101715087890625, -0.88494873046875, -0.8597259521484375, -0.834503173828125, -0.8092803955078125, -0.7840576171875, -0.7588348388671875, -0.733612060546875, -0.7083892822265625, -0.68316650390625, -0.6579437255859375, -0.632720947265625, -0.6074981689453125, -0.582275390625, -0.5570526123046875, -0.531829833984375, -0.5066070556640625, -0.48138427734375, -0.4561614990234375, -0.430938720703125, -0.4057159423828125, -0.3804931640625, -0.3552703857421875, -0.330047607421875, -0.3048248291015625, -0.27960205078125, -0.2543792724609375, -0.229156494140625, -0.2039337158203125, -0.1787109375, -0.1534881591796875, -0.128265380859375, -0.1030426025390625, -0.07781982421875, -0.0525970458984375, -0.027374267578125, -0.0021514892578125, 0.0230712890625, 0.0482940673828125, 0.073516845703125, 0.0987396240234375, 0.12396240234375, 0.1491851806640625, 0.174407958984375, 0.1996307373046875, 0.224853515625, 0.2500762939453125, 0.275299072265625, 0.3005218505859375, 0.32574462890625, 0.3509674072265625, 0.376190185546875, 0.4014129638671875, 0.4266357421875, 0.4518585205078125, 0.477081298828125, 0.5023040771484375, 0.52752685546875, 0.5527496337890625, 0.577972412109375, 0.6031951904296875, 0.62841796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 5.0, 12.0, 13.0, 26.0, 42.0, 72.0, 114.0, 182.0, 308.0, 646.0, 1587.0, 4992.0, 25557.0, 394245.0, 582283.0, 29559.0, 5588.0, 1751.0, 731.0, 353.0, 195.0, 89.0, 71.0, 42.0, 31.0, 16.0, 15.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.81390380859375, -2.7098388671875, -2.60577392578125, -2.501708984375, -2.39764404296875, -2.2935791015625, -2.18951416015625, -2.08544921875, -1.98138427734375, -1.8773193359375, -1.77325439453125, -1.669189453125, -1.56512451171875, -1.4610595703125, -1.35699462890625, -1.2529296875, -1.14886474609375, -1.0447998046875, -0.94073486328125, -0.836669921875, -0.73260498046875, -0.6285400390625, -0.52447509765625, -0.42041015625, -0.31634521484375, -0.2122802734375, -0.10821533203125, -0.004150390625, 0.09991455078125, 0.2039794921875, 0.30804443359375, 0.412109375, 0.51617431640625, 0.6202392578125, 0.72430419921875, 0.828369140625, 0.93243408203125, 1.0364990234375, 1.14056396484375, 1.24462890625, 1.34869384765625, 1.4527587890625, 1.55682373046875, 1.660888671875, 1.76495361328125, 1.8690185546875, 1.97308349609375, 2.0771484375, 2.18121337890625, 2.2852783203125, 2.38934326171875, 2.493408203125, 2.59747314453125, 2.7015380859375, 2.80560302734375, 2.90966796875, 3.01373291015625, 3.1177978515625, 3.22186279296875, 3.325927734375, 3.42999267578125, 3.5340576171875, 3.63812255859375, 3.7421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 7.0, 13.0, 10.0, 18.0, 12.0, 15.0, 23.0, 26.0, 20.0, 37.0, 31.0, 43.0, 47.0, 42.0, 37.0, 46.0, 44.0, 48.0, 54.0, 41.0, 49.0, 54.0, 42.0, 33.0, 32.0, 22.0, 29.0, 16.0, 13.0, 13.0, 15.0, 10.0, 12.0, 10.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.96875, -2.88690185546875, -2.8050537109375, -2.72320556640625, -2.641357421875, -2.55950927734375, -2.4776611328125, -2.39581298828125, -2.31396484375, -2.23211669921875, -2.1502685546875, -2.06842041015625, -1.986572265625, -1.90472412109375, -1.8228759765625, -1.74102783203125, -1.6591796875, -1.57733154296875, -1.4954833984375, -1.41363525390625, -1.331787109375, -1.24993896484375, -1.1680908203125, -1.08624267578125, -1.00439453125, -0.92254638671875, -0.8406982421875, -0.75885009765625, -0.677001953125, -0.59515380859375, -0.5133056640625, -0.43145751953125, -0.349609375, -0.26776123046875, -0.1859130859375, -0.10406494140625, -0.022216796875, 0.05963134765625, 0.1414794921875, 0.22332763671875, 0.30517578125, 0.38702392578125, 0.4688720703125, 0.55072021484375, 0.632568359375, 0.71441650390625, 0.7962646484375, 0.87811279296875, 0.9599609375, 1.04180908203125, 1.1236572265625, 1.20550537109375, 1.287353515625, 1.36920166015625, 1.4510498046875, 1.53289794921875, 1.61474609375, 1.69659423828125, 1.7784423828125, 1.86029052734375, 1.942138671875, 2.02398681640625, 2.1058349609375, 2.18768310546875, 2.26953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 10.0, 8.0, 11.0, 12.0, 22.0, 34.0, 51.0, 76.0, 137.0, 335.0, 1019.0, 4699.0, 39688.0, 830633.0, 157752.0, 11058.0, 2000.0, 525.0, 203.0, 98.0, 60.0, 33.0, 18.0, 22.0, 14.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.02734375, -1.96539306640625, -1.9034423828125, -1.84149169921875, -1.779541015625, -1.71759033203125, -1.6556396484375, -1.59368896484375, -1.53173828125, -1.46978759765625, -1.4078369140625, -1.34588623046875, -1.283935546875, -1.22198486328125, -1.1600341796875, -1.09808349609375, -1.0361328125, -0.97418212890625, -0.9122314453125, -0.85028076171875, -0.788330078125, -0.72637939453125, -0.6644287109375, -0.60247802734375, -0.54052734375, -0.47857666015625, -0.4166259765625, -0.35467529296875, -0.292724609375, -0.23077392578125, -0.1688232421875, -0.10687255859375, -0.044921875, 0.01702880859375, 0.0789794921875, 0.14093017578125, 0.202880859375, 0.26483154296875, 0.3267822265625, 0.38873291015625, 0.45068359375, 0.51263427734375, 0.5745849609375, 0.63653564453125, 0.698486328125, 0.76043701171875, 0.8223876953125, 0.88433837890625, 0.9462890625, 1.00823974609375, 1.0701904296875, 1.13214111328125, 1.194091796875, 1.25604248046875, 1.3179931640625, 1.37994384765625, 1.44189453125, 1.50384521484375, 1.5657958984375, 1.62774658203125, 1.689697265625, 1.75164794921875, 1.8135986328125, 1.87554931640625, 1.9375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 12.0, 20.0, 38.0, 40.0, 84.0, 206.0, 321.0, 129.0, 55.0, 32.0, 17.0, 12.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034356117248535156, -0.00032738223671913147, -0.0003112033009529114, -0.0002950243651866913, -0.0002788454294204712, -0.0002626664936542511, -0.000246487557888031, -0.0002303086221218109, -0.00021412968635559082, -0.00019795075058937073, -0.00018177181482315063, -0.00016559287905693054, -0.00014941394329071045, -0.00013323500752449036, -0.00011705607175827026, -0.00010087713599205017, -8.469820022583008e-05, -6.851926445960999e-05, -5.234032869338989e-05, -3.61613929271698e-05, -1.9982457160949707e-05, -3.8035213947296143e-06, 1.2375414371490479e-05, 2.855435013771057e-05, 4.4733285903930664e-05, 6.091222167015076e-05, 7.709115743637085e-05, 9.327009320259094e-05, 0.00010944902896881104, 0.00012562796473503113, 0.00014180690050125122, 0.0001579858362674713, 0.0001741647720336914, 0.0001903437077999115, 0.0002065226435661316, 0.00022270157933235168, 0.00023888051509857178, 0.00025505945086479187, 0.00027123838663101196, 0.00028741732239723206, 0.00030359625816345215, 0.00031977519392967224, 0.00033595412969589233, 0.0003521330654621124, 0.0003683120012283325, 0.0003844909369945526, 0.0004006698727607727, 0.0004168488085269928, 0.0004330277442932129, 0.000449206680059433, 0.0004653856158256531, 0.00048156455159187317, 0.0004977434873580933, 0.0005139224231243134, 0.0005301013588905334, 0.0005462802946567535, 0.0005624592304229736, 0.0005786381661891937, 0.0005948171019554138, 0.0006109960377216339, 0.000627174973487854, 0.0006433539092540741, 0.0006595328450202942, 0.0006757117807865143, 0.0006918907165527344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 4.0, 19.0, 14.0, 32.0, 57.0, 70.0, 128.0, 248.0, 477.0, 1076.0, 2567.0, 7646.0, 32759.0, 240377.0, 661993.0, 79172.0, 14585.0, 4243.0, 1550.0, 703.0, 364.0, 186.0, 120.0, 60.0, 38.0, 20.0, 9.0, 6.0, 9.0, 5.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.844085693359375, -0.80926513671875, -0.774444580078125, -0.7396240234375, -0.704803466796875, -0.66998291015625, -0.635162353515625, -0.600341796875, -0.565521240234375, -0.53070068359375, -0.495880126953125, -0.4610595703125, -0.426239013671875, -0.39141845703125, -0.356597900390625, -0.32177734375, -0.286956787109375, -0.25213623046875, -0.217315673828125, -0.1824951171875, -0.147674560546875, -0.11285400390625, -0.078033447265625, -0.043212890625, -0.008392333984375, 0.02642822265625, 0.061248779296875, 0.0960693359375, 0.130889892578125, 0.16571044921875, 0.200531005859375, 0.2353515625, 0.270172119140625, 0.30499267578125, 0.339813232421875, 0.3746337890625, 0.409454345703125, 0.44427490234375, 0.479095458984375, 0.513916015625, 0.548736572265625, 0.58355712890625, 0.618377685546875, 0.6531982421875, 0.688018798828125, 0.72283935546875, 0.757659912109375, 0.79248046875, 0.827301025390625, 0.86212158203125, 0.896942138671875, 0.9317626953125, 0.966583251953125, 1.00140380859375, 1.036224365234375, 1.071044921875, 1.105865478515625, 1.14068603515625, 1.175506591796875, 1.2103271484375, 1.245147705078125, 1.27996826171875, 1.314788818359375, 1.349609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 14.0, 11.0, 9.0, 24.0, 30.0, 36.0, 51.0, 45.0, 78.0, 93.0, 96.0, 104.0, 78.0, 77.0, 61.0, 40.0, 32.0, 34.0, 11.0, 15.0, 14.0, 4.0, 10.0, 9.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2193756103515625, -1.189727783203125, -1.1600799560546875, -1.13043212890625, -1.1007843017578125, -1.071136474609375, -1.0414886474609375, -1.0118408203125, -0.9821929931640625, -0.952545166015625, -0.9228973388671875, -0.89324951171875, -0.8636016845703125, -0.833953857421875, -0.8043060302734375, -0.774658203125, -0.7450103759765625, -0.715362548828125, -0.6857147216796875, -0.65606689453125, -0.6264190673828125, -0.596771240234375, -0.5671234130859375, -0.5374755859375, -0.5078277587890625, -0.478179931640625, -0.4485321044921875, -0.41888427734375, -0.3892364501953125, -0.359588623046875, -0.3299407958984375, -0.30029296875, -0.2706451416015625, -0.240997314453125, -0.2113494873046875, -0.18170166015625, -0.1520538330078125, -0.122406005859375, -0.0927581787109375, -0.0631103515625, -0.0334625244140625, -0.003814697265625, 0.0258331298828125, 0.05548095703125, 0.0851287841796875, 0.114776611328125, 0.1444244384765625, 0.174072265625, 0.2037200927734375, 0.233367919921875, 0.2630157470703125, 0.29266357421875, 0.3223114013671875, 0.351959228515625, 0.3816070556640625, 0.4112548828125, 0.4409027099609375, 0.470550537109375, 0.5001983642578125, 0.52984619140625, 0.5594940185546875, 0.589141845703125, 0.6187896728515625, 0.6484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 20.0, 52.0, 141.0, 264.0, 277.0, 145.0, 48.0, 15.0, 11.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.679428100585938, -28.75617790222168, -27.832927703857422, -26.909677505493164, -25.986427307128906, -25.06317710876465, -24.13992691040039, -23.2166748046875, -22.293426513671875, -21.370176315307617, -20.44692611694336, -19.5236759185791, -18.600425720214844, -17.677175521850586, -16.753925323486328, -15.830674171447754, -14.90742301940918, -13.984172821044922, -13.060922622680664, -12.137672424316406, -11.214422225952148, -10.29117202758789, -9.367920875549316, -8.444670677185059, -7.521420478820801, -6.598170280456543, -5.674920082092285, -4.751669406890869, -3.8284192085266113, -2.9051690101623535, -1.9819183349609375, -1.0586681365966797, -0.1354198455810547, 0.7878304719924927, 1.71108078956604, 2.634331226348877, 3.5575814247131348, 4.480831623077393, 5.404082298278809, 6.327332496643066, 7.250582695007324, 8.173832893371582, 9.09708309173584, 10.020334243774414, 10.943584442138672, 11.86683464050293, 12.790084838867188, 13.713335037231445, 14.636585235595703, 15.559835433959961, 16.48308563232422, 17.406335830688477, 18.329586029052734, 19.252836227416992, 20.17608642578125, 21.09933853149414, 22.022586822509766, 22.945837020874023, 23.86908721923828, 24.79233741760254, 25.715587615966797, 26.638837814331055, 27.562088012695312, 28.485340118408203, 29.40859031677246]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 20.0, 13.0, 16.0, 19.0, 23.0, 24.0, 23.0, 30.0, 31.0, 35.0, 38.0, 38.0, 34.0, 43.0, 55.0, 60.0, 50.0, 53.0, 47.0, 36.0, 28.0, 37.0, 28.0, 18.0, 28.0, 19.0, 19.0, 18.0, 17.0, 14.0, 13.0, 13.0, 8.0, 3.0, 8.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.617690086364746, -10.309447288513184, -10.001205444335938, -9.692962646484375, -9.384719848632812, -9.076478004455566, -8.768235206604004, -8.459993362426758, -8.151750564575195, -7.843508243560791, -7.535265922546387, -7.227023124694824, -6.91878080368042, -6.610538482666016, -6.302295684814453, -5.994053363800049, -5.6858110427856445, -5.37756872177124, -5.069326400756836, -4.761083602905273, -4.452841281890869, -4.144598960876465, -3.8363564014434814, -3.528113842010498, -3.2198715209960938, -2.9116291999816895, -2.603386640548706, -2.2951440811157227, -1.9869017601013184, -1.6786593198776245, -1.3704168796539307, -1.0621743202209473, -0.7539329528808594, -0.4456905126571655, -0.13744807243347168, 0.17079436779022217, 0.479036808013916, 0.7872792482376099, 1.0955216884613037, 1.403764247894287, 1.7120065689086914, 2.0202488899230957, 2.328491449356079, 2.6367340087890625, 2.944976329803467, 3.253218650817871, 3.5614612102508545, 3.869703769683838, 4.177946090698242, 4.4861884117126465, 4.794430732727051, 5.102673530578613, 5.410915851593018, 5.719158172607422, 6.027400970458984, 6.335643291473389, 6.643885612487793, 6.952127933502197, 7.260370254516602, 7.568613052368164, 7.876855373382568, 8.185097694396973, 8.493340492248535, 8.801582336425781, 9.109825134277344]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 49.0, 92.0, 300.0, 1683.0, 14581.0, 312918.0, 3662206.0, 190393.0, 10401.0, 1224.0, 252.0, 90.0, 40.0, 19.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.140716552734375, -2.06268310546875, -1.984649658203125, -1.9066162109375, -1.828582763671875, -1.75054931640625, -1.672515869140625, -1.594482421875, -1.516448974609375, -1.43841552734375, -1.360382080078125, -1.2823486328125, -1.204315185546875, -1.12628173828125, -1.048248291015625, -0.97021484375, -0.892181396484375, -0.81414794921875, -0.736114501953125, -0.6580810546875, -0.580047607421875, -0.50201416015625, -0.423980712890625, -0.345947265625, -0.267913818359375, -0.18988037109375, -0.111846923828125, -0.0338134765625, 0.044219970703125, 0.12225341796875, 0.200286865234375, 0.2783203125, 0.356353759765625, 0.43438720703125, 0.512420654296875, 0.5904541015625, 0.668487548828125, 0.74652099609375, 0.824554443359375, 0.902587890625, 0.980621337890625, 1.05865478515625, 1.136688232421875, 1.2147216796875, 1.292755126953125, 1.37078857421875, 1.448822021484375, 1.52685546875, 1.604888916015625, 1.68292236328125, 1.760955810546875, 1.8389892578125, 1.917022705078125, 1.99505615234375, 2.073089599609375, 2.151123046875, 2.229156494140625, 2.30718994140625, 2.385223388671875, 2.4632568359375, 2.541290283203125, 2.61932373046875, 2.697357177734375, 2.775390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 9.0, 7.0, 11.0, 16.0, 18.0, 25.0, 28.0, 37.0, 53.0, 51.0, 64.0, 76.0, 61.0, 60.0, 77.0, 75.0, 53.0, 55.0, 53.0, 44.0, 33.0, 36.0, 22.0, 15.0, 6.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.220703125, -1.1933059692382812, -1.1659088134765625, -1.1385116577148438, -1.111114501953125, -1.0837173461914062, -1.0563201904296875, -1.0289230346679688, -1.00152587890625, -0.9741287231445312, -0.9467315673828125, -0.9193344116210938, -0.891937255859375, -0.8645401000976562, -0.8371429443359375, -0.8097457885742188, -0.7823486328125, -0.7549514770507812, -0.7275543212890625, -0.7001571655273438, -0.672760009765625, -0.6453628540039062, -0.6179656982421875, -0.5905685424804688, -0.56317138671875, -0.5357742309570312, -0.5083770751953125, -0.48097991943359375, -0.453582763671875, -0.42618560791015625, -0.3987884521484375, -0.37139129638671875, -0.343994140625, -0.31659698486328125, -0.2891998291015625, -0.26180267333984375, -0.234405517578125, -0.20700836181640625, -0.1796112060546875, -0.15221405029296875, -0.12481689453125, -0.09741973876953125, -0.0700225830078125, -0.04262542724609375, -0.015228271484375, 0.01216888427734375, 0.0395660400390625, 0.06696319580078125, 0.0943603515625, 0.12175750732421875, 0.1491546630859375, 0.17655181884765625, 0.203948974609375, 0.23134613037109375, 0.2587432861328125, 0.28614044189453125, 0.31353759765625, 0.34093475341796875, 0.3683319091796875, 0.39572906494140625, 0.423126220703125, 0.45052337646484375, 0.4779205322265625, 0.5053176879882812, 0.53271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 11.0, 11.0, 12.0, 27.0, 34.0, 60.0, 84.0, 130.0, 260.0, 375.0, 709.0, 1446.0, 3359.0, 9659.0, 32762.0, 154350.0, 1412826.0, 2272710.0, 234331.0, 47935.0, 14013.0, 4864.0, 2052.0, 968.0, 494.0, 288.0, 193.0, 92.0, 59.0, 55.0, 32.0, 15.0, 13.0, 15.0, 9.0, 5.0, 5.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.23828125, -1.1926116943359375, -1.146942138671875, -1.1012725830078125, -1.05560302734375, -1.0099334716796875, -0.964263916015625, -0.9185943603515625, -0.8729248046875, -0.8272552490234375, -0.781585693359375, -0.7359161376953125, -0.69024658203125, -0.6445770263671875, -0.598907470703125, -0.5532379150390625, -0.507568359375, -0.4618988037109375, -0.416229248046875, -0.3705596923828125, -0.32489013671875, -0.2792205810546875, -0.233551025390625, -0.1878814697265625, -0.1422119140625, -0.0965423583984375, -0.050872802734375, -0.0052032470703125, 0.04046630859375, 0.0861358642578125, 0.131805419921875, 0.1774749755859375, 0.22314453125, 0.2688140869140625, 0.314483642578125, 0.3601531982421875, 0.40582275390625, 0.4514923095703125, 0.497161865234375, 0.5428314208984375, 0.5885009765625, 0.6341705322265625, 0.679840087890625, 0.7255096435546875, 0.77117919921875, 0.8168487548828125, 0.862518310546875, 0.9081878662109375, 0.953857421875, 0.9995269775390625, 1.045196533203125, 1.0908660888671875, 1.13653564453125, 1.1822052001953125, 1.227874755859375, 1.2735443115234375, 1.3192138671875, 1.3648834228515625, 1.410552978515625, 1.4562225341796875, 1.50189208984375, 1.5475616455078125, 1.593231201171875, 1.6389007568359375, 1.6845703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 12.0, 5.0, 14.0, 24.0, 24.0, 43.0, 76.0, 92.0, 175.0, 257.0, 442.0, 621.0, 736.0, 557.0, 343.0, 219.0, 127.0, 89.0, 63.0, 40.0, 27.0, 24.0, 11.0, 10.0, 7.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.951385498046875, -1.88909912109375, -1.826812744140625, -1.7645263671875, -1.702239990234375, -1.63995361328125, -1.577667236328125, -1.515380859375, -1.453094482421875, -1.39080810546875, -1.328521728515625, -1.2662353515625, -1.203948974609375, -1.14166259765625, -1.079376220703125, -1.01708984375, -0.954803466796875, -0.89251708984375, -0.830230712890625, -0.7679443359375, -0.705657958984375, -0.64337158203125, -0.581085205078125, -0.518798828125, -0.456512451171875, -0.39422607421875, -0.331939697265625, -0.2696533203125, -0.207366943359375, -0.14508056640625, -0.082794189453125, -0.0205078125, 0.041778564453125, 0.10406494140625, 0.166351318359375, 0.2286376953125, 0.290924072265625, 0.35321044921875, 0.415496826171875, 0.477783203125, 0.540069580078125, 0.60235595703125, 0.664642333984375, 0.7269287109375, 0.789215087890625, 0.85150146484375, 0.913787841796875, 0.97607421875, 1.038360595703125, 1.10064697265625, 1.162933349609375, 1.2252197265625, 1.287506103515625, 1.34979248046875, 1.412078857421875, 1.474365234375, 1.536651611328125, 1.59893798828125, 1.661224365234375, 1.7235107421875, 1.785797119140625, 1.84808349609375, 1.910369873046875, 1.97265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 29.0, 81.0, 188.0, 271.0, 203.0, 131.0, 34.0, 18.0, 10.0, 7.0, 3.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.060928344726562, -27.200525283813477, -26.34012222290039, -25.479721069335938, -24.61931800842285, -23.758914947509766, -22.89851188659668, -22.038108825683594, -21.177705764770508, -20.317302703857422, -19.456899642944336, -18.59649658203125, -17.736095428466797, -16.87569236755371, -16.015289306640625, -15.154886245727539, -14.29448413848877, -13.434081077575684, -12.573678970336914, -11.713275909423828, -10.852872848510742, -9.992469787597656, -9.132067680358887, -8.2716646194458, -7.411262035369873, -6.550859451293945, -5.690456390380859, -4.830053806304932, -3.969650983810425, -3.109248161315918, -2.2488455772399902, -1.3884425163269043, -0.5280399322509766, 0.3323628306388855, 1.1927655935287476, 2.053168296813965, 2.9135711193084717, 3.7739739418029785, 4.634376525878906, 5.494779586791992, 6.35518217086792, 7.215584754943848, 8.075987815856934, 8.936389923095703, 9.796792984008789, 10.657196044921875, 11.517599105834961, 12.378002166748047, 13.238404273986816, 14.098807334899902, 14.959209442138672, 15.819612503051758, 16.680015563964844, 17.54041862487793, 18.400821685791016, 19.26122283935547, 20.121625900268555, 20.98202896118164, 21.842432022094727, 22.702835083007812, 23.563236236572266, 24.42363929748535, 25.284042358398438, 26.144445419311523, 27.00484848022461]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 11.0, 20.0, 24.0, 30.0, 14.0, 27.0, 29.0, 36.0, 27.0, 34.0, 44.0, 30.0, 35.0, 31.0, 47.0, 51.0, 37.0, 36.0, 42.0, 48.0, 35.0, 35.0, 43.0, 28.0, 25.0, 24.0, 21.0, 17.0, 14.0, 18.0, 13.0, 12.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.075824737548828, -6.839612007141113, -6.603399276733398, -6.367186546325684, -6.130973815917969, -5.894761085510254, -5.658548355102539, -5.422335624694824, -5.186122894287109, -4.9499101638793945, -4.71369743347168, -4.477484703063965, -4.24127197265625, -4.005059242248535, -3.7688465118408203, -3.5326337814331055, -3.2964212894439697, -3.060208559036255, -2.82399582862854, -2.587783098220825, -2.3515703678131104, -2.1153578758239746, -1.8791450262069702, -1.6429322957992554, -1.4067195653915405, -1.1705068349838257, -0.9342941045761108, -0.6980814337730408, -0.4618687033653259, -0.22565603256225586, 0.010556697845458984, 0.24676942825317383, 0.48298215866088867, 0.7191948890686035, 0.9554076194763184, 1.1916203498840332, 1.427833080291748, 1.6640456914901733, 1.9002584218978882, 2.1364712715148926, 2.3726840019226074, 2.6088967323303223, 2.845109462738037, 3.081322193145752, 3.317534923553467, 3.5537476539611816, 3.7899603843688965, 4.026173114776611, 4.262385368347168, 4.498598098754883, 4.734810829162598, 4.9710235595703125, 5.207236289978027, 5.443449020385742, 5.679661750793457, 5.915874481201172, 6.152087211608887, 6.388299942016602, 6.624512672424316, 6.860725402832031, 7.096938133239746, 7.333150863647461, 7.569363594055176, 7.805576324462891, 8.041789054870605]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 14.0, 13.0, 18.0, 22.0, 49.0, 56.0, 106.0, 171.0, 263.0, 419.0, 877.0, 1633.0, 3065.0, 6388.0, 14770.0, 34247.0, 84749.0, 247269.0, 406364.0, 148334.0, 56420.0, 23456.0, 10056.0, 4643.0, 2343.0, 1221.0, 613.0, 357.0, 245.0, 120.0, 65.0, 60.0, 38.0, 23.0, 15.0, 11.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.513671875, -1.469512939453125, -1.42535400390625, -1.381195068359375, -1.3370361328125, -1.292877197265625, -1.24871826171875, -1.204559326171875, -1.160400390625, -1.116241455078125, -1.07208251953125, -1.027923583984375, -0.9837646484375, -0.939605712890625, -0.89544677734375, -0.851287841796875, -0.80712890625, -0.762969970703125, -0.71881103515625, -0.674652099609375, -0.6304931640625, -0.586334228515625, -0.54217529296875, -0.498016357421875, -0.453857421875, -0.409698486328125, -0.36553955078125, -0.321380615234375, -0.2772216796875, -0.233062744140625, -0.18890380859375, -0.144744873046875, -0.1005859375, -0.056427001953125, -0.01226806640625, 0.031890869140625, 0.0760498046875, 0.120208740234375, 0.16436767578125, 0.208526611328125, 0.252685546875, 0.296844482421875, 0.34100341796875, 0.385162353515625, 0.4293212890625, 0.473480224609375, 0.51763916015625, 0.561798095703125, 0.60595703125, 0.650115966796875, 0.69427490234375, 0.738433837890625, 0.7825927734375, 0.826751708984375, 0.87091064453125, 0.915069580078125, 0.959228515625, 1.003387451171875, 1.04754638671875, 1.091705322265625, 1.1358642578125, 1.180023193359375, 1.22418212890625, 1.268341064453125, 1.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 10.0, 9.0, 26.0, 27.0, 34.0, 50.0, 57.0, 51.0, 72.0, 79.0, 71.0, 68.0, 75.0, 58.0, 66.0, 73.0, 46.0, 35.0, 21.0, 21.0, 9.0, 14.0, 9.0, 4.0, 5.0, 6.0, 0.0, 3.0], "bins": [-1.447265625, -1.4164276123046875, -1.385589599609375, -1.3547515869140625, -1.32391357421875, -1.2930755615234375, -1.262237548828125, -1.2313995361328125, -1.2005615234375, -1.1697235107421875, -1.138885498046875, -1.1080474853515625, -1.07720947265625, -1.0463714599609375, -1.015533447265625, -0.9846954345703125, -0.953857421875, -0.9230194091796875, -0.892181396484375, -0.8613433837890625, -0.83050537109375, -0.7996673583984375, -0.768829345703125, -0.7379913330078125, -0.7071533203125, -0.6763153076171875, -0.645477294921875, -0.6146392822265625, -0.58380126953125, -0.5529632568359375, -0.522125244140625, -0.4912872314453125, -0.46044921875, -0.4296112060546875, -0.398773193359375, -0.3679351806640625, -0.33709716796875, -0.3062591552734375, -0.275421142578125, -0.2445831298828125, -0.2137451171875, -0.1829071044921875, -0.152069091796875, -0.1212310791015625, -0.09039306640625, -0.0595550537109375, -0.028717041015625, 0.0021209716796875, 0.032958984375, 0.0637969970703125, 0.094635009765625, 0.1254730224609375, 0.15631103515625, 0.1871490478515625, 0.217987060546875, 0.2488250732421875, 0.2796630859375, 0.3105010986328125, 0.341339111328125, 0.3721771240234375, 0.40301513671875, 0.4338531494140625, 0.464691162109375, 0.4955291748046875, 0.5263671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 35.0, 49.0, 86.0, 167.0, 292.0, 587.0, 1320.0, 3705.0, 17571.0, 365910.0, 630920.0, 20913.0, 4101.0, 1474.0, 671.0, 296.0, 172.0, 109.0, 49.0, 39.0, 22.0, 15.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.36767578125, -4.2119140625, -4.05615234375, -3.900390625, -3.74462890625, -3.5888671875, -3.43310546875, -3.27734375, -3.12158203125, -2.9658203125, -2.81005859375, -2.654296875, -2.49853515625, -2.3427734375, -2.18701171875, -2.03125, -1.87548828125, -1.7197265625, -1.56396484375, -1.408203125, -1.25244140625, -1.0966796875, -0.94091796875, -0.78515625, -0.62939453125, -0.4736328125, -0.31787109375, -0.162109375, -0.00634765625, 0.1494140625, 0.30517578125, 0.4609375, 0.61669921875, 0.7724609375, 0.92822265625, 1.083984375, 1.23974609375, 1.3955078125, 1.55126953125, 1.70703125, 1.86279296875, 2.0185546875, 2.17431640625, 2.330078125, 2.48583984375, 2.6416015625, 2.79736328125, 2.953125, 3.10888671875, 3.2646484375, 3.42041015625, 3.576171875, 3.73193359375, 3.8876953125, 4.04345703125, 4.19921875, 4.35498046875, 4.5107421875, 4.66650390625, 4.822265625, 4.97802734375, 5.1337890625, 5.28955078125, 5.4453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 13.0, 12.0, 16.0, 16.0, 15.0, 31.0, 30.0, 40.0, 41.0, 40.0, 49.0, 51.0, 58.0, 60.0, 63.0, 56.0, 48.0, 49.0, 49.0, 37.0, 41.0, 31.0, 31.0, 28.0, 20.0, 16.0, 7.0, 14.0, 3.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.924163818359375, -2.81707763671875, -2.709991455078125, -2.6029052734375, -2.495819091796875, -2.38873291015625, -2.281646728515625, -2.174560546875, -2.067474365234375, -1.96038818359375, -1.853302001953125, -1.7462158203125, -1.639129638671875, -1.53204345703125, -1.424957275390625, -1.31787109375, -1.210784912109375, -1.10369873046875, -0.996612548828125, -0.8895263671875, -0.782440185546875, -0.67535400390625, -0.568267822265625, -0.461181640625, -0.354095458984375, -0.24700927734375, -0.139923095703125, -0.0328369140625, 0.074249267578125, 0.18133544921875, 0.288421630859375, 0.3955078125, 0.502593994140625, 0.60968017578125, 0.716766357421875, 0.8238525390625, 0.930938720703125, 1.03802490234375, 1.145111083984375, 1.252197265625, 1.359283447265625, 1.46636962890625, 1.573455810546875, 1.6805419921875, 1.787628173828125, 1.89471435546875, 2.001800537109375, 2.10888671875, 2.215972900390625, 2.32305908203125, 2.430145263671875, 2.5372314453125, 2.644317626953125, 2.75140380859375, 2.858489990234375, 2.965576171875, 3.072662353515625, 3.17974853515625, 3.286834716796875, 3.3939208984375, 3.501007080078125, 3.60809326171875, 3.715179443359375, 3.822265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 12.0, 14.0, 23.0, 41.0, 54.0, 110.0, 153.0, 277.0, 592.0, 1355.0, 3710.0, 13393.0, 66769.0, 636350.0, 270929.0, 41046.0, 9035.0, 2515.0, 1007.0, 502.0, 248.0, 127.0, 57.0, 53.0, 41.0, 25.0, 26.0, 11.0, 11.0, 6.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.087890625, -1.053741455078125, -1.01959228515625, -0.985443115234375, -0.9512939453125, -0.917144775390625, -0.88299560546875, -0.848846435546875, -0.814697265625, -0.780548095703125, -0.74639892578125, -0.712249755859375, -0.6781005859375, -0.643951416015625, -0.60980224609375, -0.575653076171875, -0.54150390625, -0.507354736328125, -0.47320556640625, -0.439056396484375, -0.4049072265625, -0.370758056640625, -0.33660888671875, -0.302459716796875, -0.268310546875, -0.234161376953125, -0.20001220703125, -0.165863037109375, -0.1317138671875, -0.097564697265625, -0.06341552734375, -0.029266357421875, 0.0048828125, 0.039031982421875, 0.07318115234375, 0.107330322265625, 0.1414794921875, 0.175628662109375, 0.20977783203125, 0.243927001953125, 0.278076171875, 0.312225341796875, 0.34637451171875, 0.380523681640625, 0.4146728515625, 0.448822021484375, 0.48297119140625, 0.517120361328125, 0.55126953125, 0.585418701171875, 0.61956787109375, 0.653717041015625, 0.6878662109375, 0.722015380859375, 0.75616455078125, 0.790313720703125, 0.824462890625, 0.858612060546875, 0.89276123046875, 0.926910400390625, 0.9610595703125, 0.995208740234375, 1.02935791015625, 1.063507080078125, 1.09765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 11.0, 14.0, 13.0, 18.0, 24.0, 20.0, 24.0, 31.0, 52.0, 55.0, 93.0, 141.0, 139.0, 63.0, 62.0, 49.0, 33.0, 26.0, 19.0, 17.0, 24.0, 13.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002503395080566406, -0.00024197623133659363, -0.00023361295461654663, -0.00022524967789649963, -0.00021688640117645264, -0.00020852312445640564, -0.00020015984773635864, -0.00019179657101631165, -0.00018343329429626465, -0.00017507001757621765, -0.00016670674085617065, -0.00015834346413612366, -0.00014998018741607666, -0.00014161691069602966, -0.00013325363397598267, -0.00012489035725593567, -0.00011652708053588867, -0.00010816380381584167, -9.980052709579468e-05, -9.143725037574768e-05, -8.307397365570068e-05, -7.471069693565369e-05, -6.634742021560669e-05, -5.798414349555969e-05, -4.9620866775512695e-05, -4.12575900554657e-05, -3.28943133354187e-05, -2.4531036615371704e-05, -1.6167759895324707e-05, -7.80448317527771e-06, 5.587935447692871e-07, 8.922070264816284e-06, 1.728534698486328e-05, 2.564862370491028e-05, 3.4011900424957275e-05, 4.237517714500427e-05, 5.073845386505127e-05, 5.9101730585098267e-05, 6.746500730514526e-05, 7.582828402519226e-05, 8.419156074523926e-05, 9.255483746528625e-05, 0.00010091811418533325, 0.00010928139090538025, 0.00011764466762542725, 0.00012600794434547424, 0.00013437122106552124, 0.00014273449778556824, 0.00015109777450561523, 0.00015946105122566223, 0.00016782432794570923, 0.00017618760466575623, 0.00018455088138580322, 0.00019291415810585022, 0.00020127743482589722, 0.00020964071154594421, 0.0002180039882659912, 0.0002263672649860382, 0.0002347305417060852, 0.0002430938184261322, 0.0002514570951461792, 0.0002598203718662262, 0.0002681836485862732, 0.0002765469253063202, 0.0002849102020263672]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 6.0, 7.0, 10.0, 11.0, 33.0, 40.0, 51.0, 112.0, 272.0, 570.0, 1471.0, 4481.0, 23499.0, 351243.0, 628656.0, 29981.0, 5251.0, 1680.0, 602.0, 284.0, 133.0, 74.0, 39.0, 19.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.105377197265625, -1.05743408203125, -1.009490966796875, -0.9615478515625, -0.913604736328125, -0.86566162109375, -0.817718505859375, -0.769775390625, -0.721832275390625, -0.67388916015625, -0.625946044921875, -0.5780029296875, -0.530059814453125, -0.48211669921875, -0.434173583984375, -0.38623046875, -0.338287353515625, -0.29034423828125, -0.242401123046875, -0.1944580078125, -0.146514892578125, -0.09857177734375, -0.050628662109375, -0.002685546875, 0.045257568359375, 0.09320068359375, 0.141143798828125, 0.1890869140625, 0.237030029296875, 0.28497314453125, 0.332916259765625, 0.380859375, 0.428802490234375, 0.47674560546875, 0.524688720703125, 0.5726318359375, 0.620574951171875, 0.66851806640625, 0.716461181640625, 0.764404296875, 0.812347412109375, 0.86029052734375, 0.908233642578125, 0.9561767578125, 1.004119873046875, 1.05206298828125, 1.100006103515625, 1.14794921875, 1.195892333984375, 1.24383544921875, 1.291778564453125, 1.3397216796875, 1.387664794921875, 1.43560791015625, 1.483551025390625, 1.531494140625, 1.579437255859375, 1.62738037109375, 1.675323486328125, 1.7232666015625, 1.771209716796875, 1.81915283203125, 1.867095947265625, 1.9150390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 13.0, 17.0, 13.0, 25.0, 53.0, 33.0, 55.0, 55.0, 68.0, 75.0, 98.0, 83.0, 81.0, 56.0, 52.0, 48.0, 30.0, 26.0, 16.0, 19.0, 18.0, 6.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7885971069335938, -0.7593231201171875, -0.7300491333007812, -0.700775146484375, -0.6715011596679688, -0.6422271728515625, -0.6129531860351562, -0.58367919921875, -0.5544052124023438, -0.5251312255859375, -0.49585723876953125, -0.466583251953125, -0.43730926513671875, -0.4080352783203125, -0.37876129150390625, -0.3494873046875, -0.32021331787109375, -0.2909393310546875, -0.26166534423828125, -0.232391357421875, -0.20311737060546875, -0.1738433837890625, -0.14456939697265625, -0.11529541015625, -0.08602142333984375, -0.0567474365234375, -0.02747344970703125, 0.001800537109375, 0.03107452392578125, 0.0603485107421875, 0.08962249755859375, 0.118896484375, 0.14817047119140625, 0.1774444580078125, 0.20671844482421875, 0.235992431640625, 0.26526641845703125, 0.2945404052734375, 0.32381439208984375, 0.35308837890625, 0.38236236572265625, 0.4116363525390625, 0.44091033935546875, 0.470184326171875, 0.49945831298828125, 0.5287322998046875, 0.5580062866210938, 0.5872802734375, 0.6165542602539062, 0.6458282470703125, 0.6751022338867188, 0.704376220703125, 0.7336502075195312, 0.7629241943359375, 0.7921981811523438, 0.82147216796875, 0.8507461547851562, 0.8800201416015625, 0.9092941284179688, 0.938568115234375, 0.9678421020507812, 0.9971160888671875, 1.0263900756835938, 1.0556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 13.0, 28.0, 59.0, 136.0, 231.0, 245.0, 138.0, 63.0, 31.0, 15.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.754072189331055, -26.940380096435547, -26.12668800354004, -25.31299591064453, -24.499305725097656, -23.68561363220215, -22.87192153930664, -22.058229446411133, -21.244537353515625, -20.430845260620117, -19.61715316772461, -18.803462982177734, -17.989770889282227, -17.17607879638672, -16.36238670349121, -15.548694610595703, -14.735003471374512, -13.921311378479004, -13.107620239257812, -12.293928146362305, -11.480236053466797, -10.666543960571289, -9.852852821350098, -9.03916072845459, -8.225469589233398, -7.411777973175049, -6.598085880279541, -5.784394264221191, -4.970702171325684, -4.157010555267334, -3.3433189392089844, -2.5296268463134766, -1.7159347534179688, -0.9022429585456848, -0.08855116367340088, 0.7251405715942383, 1.538832426071167, 2.3525242805480957, 3.1662158966064453, 3.979907989501953, 4.793599605560303, 5.607291221618652, 6.42098331451416, 7.23467493057251, 8.04836654663086, 8.862058639526367, 9.675750732421875, 10.489442825317383, 11.303133964538574, 12.116826057434082, 12.930517196655273, 13.744209289550781, 14.557901382446289, 15.371593475341797, 16.185283660888672, 16.998977661132812, 17.812667846679688, 18.626359939575195, 19.440052032470703, 20.253742218017578, 21.067434310913086, 21.881126403808594, 22.6948184967041, 23.50851058959961, 24.322202682495117]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 7.0, 3.0, 8.0, 10.0, 10.0, 15.0, 10.0, 23.0, 17.0, 20.0, 20.0, 17.0, 21.0, 21.0, 31.0, 35.0, 30.0, 32.0, 41.0, 53.0, 45.0, 54.0, 52.0, 47.0, 32.0, 44.0, 37.0, 25.0, 30.0, 27.0, 21.0, 23.0, 21.0, 15.0, 10.0, 8.0, 11.0, 13.0, 13.0, 5.0, 4.0, 5.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-10.03938102722168, -9.736881256103516, -9.434381484985352, -9.131881713867188, -8.829381942749023, -8.52688217163086, -8.224382400512695, -7.921882629394531, -7.619382858276367, -7.316883087158203, -7.014383316040039, -6.711883544921875, -6.409383773803711, -6.106884002685547, -5.804384231567383, -5.501884460449219, -5.199384689331055, -4.896884918212891, -4.594385147094727, -4.2918853759765625, -3.9893856048583984, -3.6868858337402344, -3.3843860626220703, -3.0818862915039062, -2.779386520385742, -2.476886749267578, -2.174386978149414, -1.87188720703125, -1.569387435913086, -1.2668876647949219, -0.9643878936767578, -0.6618881225585938, -0.3593883514404297, -0.056888580322265625, 0.24561119079589844, 0.5481109619140625, 0.8506107330322266, 1.1531105041503906, 1.4556102752685547, 1.7581100463867188, 2.060609817504883, 2.363109588623047, 2.665609359741211, 2.968109130859375, 3.270608901977539, 3.573108673095703, 3.875608444213867, 4.178108215332031, 4.480607986450195, 4.783107757568359, 5.085607528686523, 5.3881072998046875, 5.690607070922852, 5.993106842041016, 6.29560661315918, 6.598106384277344, 6.900606155395508, 7.203105926513672, 7.505605697631836, 7.80810546875, 8.110605239868164, 8.413105010986328, 8.715604782104492, 9.018104553222656, 9.32060432434082]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 15.0, 29.0, 64.0, 102.0, 230.0, 673.0, 2035.0, 9413.0, 67907.0, 1320856.0, 2641013.0, 130439.0, 16614.0, 3398.0, 918.0, 311.0, 138.0, 65.0, 26.0, 15.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.455078125, -2.4006805419921875, -2.346282958984375, -2.2918853759765625, -2.23748779296875, -2.1830902099609375, -2.128692626953125, -2.0742950439453125, -2.0198974609375, -1.9654998779296875, -1.911102294921875, -1.8567047119140625, -1.80230712890625, -1.7479095458984375, -1.693511962890625, -1.6391143798828125, -1.584716796875, -1.5303192138671875, -1.475921630859375, -1.4215240478515625, -1.36712646484375, -1.3127288818359375, -1.258331298828125, -1.2039337158203125, -1.1495361328125, -1.0951385498046875, -1.040740966796875, -0.9863433837890625, -0.93194580078125, -0.8775482177734375, -0.823150634765625, -0.7687530517578125, -0.71435546875, -0.6599578857421875, -0.605560302734375, -0.5511627197265625, -0.49676513671875, -0.4423675537109375, -0.387969970703125, -0.3335723876953125, -0.2791748046875, -0.2247772216796875, -0.170379638671875, -0.1159820556640625, -0.06158447265625, -0.0071868896484375, 0.047210693359375, 0.1016082763671875, 0.156005859375, 0.2104034423828125, 0.264801025390625, 0.3191986083984375, 0.37359619140625, 0.4279937744140625, 0.482391357421875, 0.5367889404296875, 0.5911865234375, 0.6455841064453125, 0.699981689453125, 0.7543792724609375, 0.80877685546875, 0.8631744384765625, 0.917572021484375, 0.9719696044921875, 1.0263671875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 7.0, 14.0, 16.0, 23.0, 39.0, 45.0, 59.0, 81.0, 88.0, 88.0, 105.0, 100.0, 86.0, 78.0, 50.0, 44.0, 24.0, 25.0, 18.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.8583984375, -1.820556640625, -1.78271484375, -1.744873046875, -1.70703125, -1.669189453125, -1.63134765625, -1.593505859375, -1.5556640625, -1.517822265625, -1.47998046875, -1.442138671875, -1.404296875, -1.366455078125, -1.32861328125, -1.290771484375, -1.2529296875, -1.215087890625, -1.17724609375, -1.139404296875, -1.1015625, -1.063720703125, -1.02587890625, -0.988037109375, -0.9501953125, -0.912353515625, -0.87451171875, -0.836669921875, -0.798828125, -0.760986328125, -0.72314453125, -0.685302734375, -0.6474609375, -0.609619140625, -0.57177734375, -0.533935546875, -0.49609375, -0.458251953125, -0.42041015625, -0.382568359375, -0.3447265625, -0.306884765625, -0.26904296875, -0.231201171875, -0.193359375, -0.155517578125, -0.11767578125, -0.079833984375, -0.0419921875, -0.004150390625, 0.03369140625, 0.071533203125, 0.109375, 0.147216796875, 0.18505859375, 0.222900390625, 0.2607421875, 0.298583984375, 0.33642578125, 0.374267578125, 0.412109375, 0.449951171875, 0.48779296875, 0.525634765625, 0.5634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 13.0, 31.0, 36.0, 52.0, 105.0, 164.0, 309.0, 605.0, 1298.0, 3045.0, 9848.0, 42044.0, 313868.0, 3130023.0, 609647.0, 62795.0, 13426.0, 3966.0, 1494.0, 685.0, 345.0, 197.0, 96.0, 61.0, 41.0, 15.0, 17.0, 16.0, 12.0, 2.0, 3.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.8303375244140625, -1.775909423828125, -1.7214813232421875, -1.66705322265625, -1.6126251220703125, -1.558197021484375, -1.5037689208984375, -1.4493408203125, -1.3949127197265625, -1.340484619140625, -1.2860565185546875, -1.23162841796875, -1.1772003173828125, -1.122772216796875, -1.0683441162109375, -1.013916015625, -0.9594879150390625, -0.905059814453125, -0.8506317138671875, -0.79620361328125, -0.7417755126953125, -0.687347412109375, -0.6329193115234375, -0.5784912109375, -0.5240631103515625, -0.469635009765625, -0.4152069091796875, -0.36077880859375, -0.3063507080078125, -0.251922607421875, -0.1974945068359375, -0.14306640625, -0.0886383056640625, -0.034210205078125, 0.0202178955078125, 0.07464599609375, 0.1290740966796875, 0.183502197265625, 0.2379302978515625, 0.2923583984375, 0.3467864990234375, 0.401214599609375, 0.4556427001953125, 0.51007080078125, 0.5644989013671875, 0.618927001953125, 0.6733551025390625, 0.727783203125, 0.7822113037109375, 0.836639404296875, 0.8910675048828125, 0.94549560546875, 0.9999237060546875, 1.054351806640625, 1.1087799072265625, 1.1632080078125, 1.2176361083984375, 1.272064208984375, 1.3264923095703125, 1.38092041015625, 1.4353485107421875, 1.489776611328125, 1.5442047119140625, 1.5986328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 7.0, 11.0, 13.0, 21.0, 27.0, 47.0, 61.0, 96.0, 133.0, 253.0, 318.0, 531.0, 682.0, 637.0, 455.0, 269.0, 143.0, 108.0, 86.0, 38.0, 30.0, 21.0, 26.0, 16.0, 10.0, 6.0, 9.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3656463623046875, -1.308441162109375, -1.2512359619140625, -1.19403076171875, -1.1368255615234375, -1.079620361328125, -1.0224151611328125, -0.9652099609375, -0.9080047607421875, -0.850799560546875, -0.7935943603515625, -0.73638916015625, -0.6791839599609375, -0.621978759765625, -0.5647735595703125, -0.507568359375, -0.4503631591796875, -0.393157958984375, -0.3359527587890625, -0.27874755859375, -0.2215423583984375, -0.164337158203125, -0.1071319580078125, -0.0499267578125, 0.0072784423828125, 0.064483642578125, 0.1216888427734375, 0.17889404296875, 0.2360992431640625, 0.293304443359375, 0.3505096435546875, 0.40771484375, 0.4649200439453125, 0.522125244140625, 0.5793304443359375, 0.63653564453125, 0.6937408447265625, 0.750946044921875, 0.8081512451171875, 0.8653564453125, 0.9225616455078125, 0.979766845703125, 1.0369720458984375, 1.09417724609375, 1.1513824462890625, 1.208587646484375, 1.2657928466796875, 1.322998046875, 1.3802032470703125, 1.437408447265625, 1.4946136474609375, 1.55181884765625, 1.6090240478515625, 1.666229248046875, 1.7234344482421875, 1.7806396484375, 1.8378448486328125, 1.895050048828125, 1.9522552490234375, 2.00946044921875, 2.0666656494140625, 2.123870849609375, 2.1810760498046875, 2.23828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 13.0, 15.0, 50.0, 121.0, 198.0, 262.0, 156.0, 96.0, 37.0, 18.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.47132110595703, -34.741455078125, -34.01158905029297, -33.2817268371582, -32.55186080932617, -31.82199478149414, -31.09212875366211, -30.36226463317871, -29.632400512695312, -28.90253448486328, -28.172670364379883, -27.44280433654785, -26.712940216064453, -25.983074188232422, -25.25320816040039, -24.523344039916992, -23.79347801208496, -23.06361198425293, -22.33374786376953, -21.6038818359375, -20.8740177154541, -20.14415168762207, -19.414287567138672, -18.68442153930664, -17.95455551147461, -17.224689483642578, -16.49482536315918, -15.764959335327148, -15.03509521484375, -14.305229187011719, -13.575364112854004, -12.845499038696289, -12.11563491821289, -11.385769844055176, -10.655904769897461, -9.92603874206543, -9.196174621582031, -8.46630859375, -7.736443519592285, -7.00657844543457, -6.2767133712768555, -5.546848297119141, -4.816983222961426, -4.087117671966553, -3.357252597808838, -2.627387523651123, -1.89752197265625, -1.1676568984985352, -0.4377918243408203, 0.2920733690261841, 1.0219385623931885, 1.7518038749694824, 2.4816689491271973, 3.211534023284912, 3.941399574279785, 4.6712646484375, 5.401129722595215, 6.13099479675293, 6.8608598709106445, 7.590725421905518, 8.32059097290039, 9.050455093383789, 9.78032112121582, 10.510186195373535, 11.24005126953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 8.0, 16.0, 21.0, 19.0, 28.0, 28.0, 26.0, 32.0, 38.0, 36.0, 40.0, 52.0, 44.0, 48.0, 56.0, 42.0, 47.0, 63.0, 48.0, 57.0, 44.0, 35.0, 30.0, 26.0, 28.0, 22.0, 12.0, 14.0, 8.0, 9.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.01160717010498, -7.712160110473633, -7.412713050842285, -7.1132659912109375, -6.81381893157959, -6.514371871948242, -6.214925289154053, -5.915478229522705, -5.616031169891357, -5.31658411026001, -5.017137050628662, -4.7176899909973145, -4.418243408203125, -4.118796348571777, -3.8193492889404297, -3.519902229309082, -3.2204551696777344, -2.9210081100463867, -2.621561050415039, -2.3221142292022705, -2.022667169570923, -1.7232201099395752, -1.423773169517517, -1.124326229095459, -0.8248791694641113, -0.5254321694374084, -0.22598516941070557, 0.07346183061599731, 0.3729088306427002, 0.6723558902740479, 0.971802830696106, 1.271249771118164, 1.5706968307495117, 1.8701438903808594, 2.169590950012207, 2.4690377712249756, 2.7684848308563232, 3.067931890487671, 3.3673787117004395, 3.666825771331787, 3.9662728309631348, 4.265719890594482, 4.56516695022583, 4.864614009857178, 5.164060592651367, 5.463507652282715, 5.7629547119140625, 6.06240177154541, 6.361848831176758, 6.6612958908081055, 6.960742950439453, 7.260190010070801, 7.559637069702148, 7.859084129333496, 8.158531188964844, 8.457977294921875, 8.757425308227539, 9.056872367858887, 9.356319427490234, 9.655766487121582, 9.95521354675293, 10.254660606384277, 10.554107666015625, 10.853553771972656, 11.153000831604004]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 10.0, 6.0, 10.0, 6.0, 25.0, 32.0, 28.0, 59.0, 107.0, 136.0, 240.0, 430.0, 641.0, 1163.0, 2403.0, 4715.0, 10366.0, 24827.0, 77797.0, 359946.0, 422184.0, 92818.0, 28273.0, 11446.0, 5182.0, 2627.0, 1324.0, 697.0, 413.0, 241.0, 114.0, 107.0, 61.0, 35.0, 34.0, 15.0, 7.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.66015625, -1.611419677734375, -1.56268310546875, -1.513946533203125, -1.4652099609375, -1.416473388671875, -1.36773681640625, -1.319000244140625, -1.270263671875, -1.221527099609375, -1.17279052734375, -1.124053955078125, -1.0753173828125, -1.026580810546875, -0.97784423828125, -0.929107666015625, -0.88037109375, -0.831634521484375, -0.78289794921875, -0.734161376953125, -0.6854248046875, -0.636688232421875, -0.58795166015625, -0.539215087890625, -0.490478515625, -0.441741943359375, -0.39300537109375, -0.344268798828125, -0.2955322265625, -0.246795654296875, -0.19805908203125, -0.149322509765625, -0.1005859375, -0.051849365234375, -0.00311279296875, 0.045623779296875, 0.0943603515625, 0.143096923828125, 0.19183349609375, 0.240570068359375, 0.289306640625, 0.338043212890625, 0.38677978515625, 0.435516357421875, 0.4842529296875, 0.532989501953125, 0.58172607421875, 0.630462646484375, 0.67919921875, 0.727935791015625, 0.77667236328125, 0.825408935546875, 0.8741455078125, 0.922882080078125, 0.97161865234375, 1.020355224609375, 1.069091796875, 1.117828369140625, 1.16656494140625, 1.215301513671875, 1.2640380859375, 1.312774658203125, 1.36151123046875, 1.410247802734375, 1.458984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 14.0, 13.0, 22.0, 21.0, 19.0, 28.0, 27.0, 30.0, 41.0, 44.0, 55.0, 56.0, 41.0, 46.0, 53.0, 54.0, 63.0, 57.0, 42.0, 45.0, 27.0, 38.0, 31.0, 19.0, 20.0, 18.0, 15.0, 11.0, 9.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.8974609375, -0.875457763671875, -0.85345458984375, -0.831451416015625, -0.8094482421875, -0.787445068359375, -0.76544189453125, -0.743438720703125, -0.721435546875, -0.699432373046875, -0.67742919921875, -0.655426025390625, -0.6334228515625, -0.611419677734375, -0.58941650390625, -0.567413330078125, -0.54541015625, -0.523406982421875, -0.50140380859375, -0.479400634765625, -0.4573974609375, -0.435394287109375, -0.41339111328125, -0.391387939453125, -0.369384765625, -0.347381591796875, -0.32537841796875, -0.303375244140625, -0.2813720703125, -0.259368896484375, -0.23736572265625, -0.215362548828125, -0.193359375, -0.171356201171875, -0.14935302734375, -0.127349853515625, -0.1053466796875, -0.083343505859375, -0.06134033203125, -0.039337158203125, -0.017333984375, 0.004669189453125, 0.02667236328125, 0.048675537109375, 0.0706787109375, 0.092681884765625, 0.11468505859375, 0.136688232421875, 0.15869140625, 0.180694580078125, 0.20269775390625, 0.224700927734375, 0.2467041015625, 0.268707275390625, 0.29071044921875, 0.312713623046875, 0.334716796875, 0.356719970703125, 0.37872314453125, 0.400726318359375, 0.4227294921875, 0.444732666015625, 0.46673583984375, 0.488739013671875, 0.5107421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 20.0, 20.0, 44.0, 81.0, 126.0, 244.0, 493.0, 1095.0, 3356.0, 18355.0, 598389.0, 404311.0, 16683.0, 3159.0, 1053.0, 502.0, 253.0, 150.0, 76.0, 41.0, 24.0, 23.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.58746337890625, -4.4483642578125, -4.30926513671875, -4.170166015625, -4.03106689453125, -3.8919677734375, -3.75286865234375, -3.61376953125, -3.47467041015625, -3.3355712890625, -3.19647216796875, -3.057373046875, -2.91827392578125, -2.7791748046875, -2.64007568359375, -2.5009765625, -2.36187744140625, -2.2227783203125, -2.08367919921875, -1.944580078125, -1.80548095703125, -1.6663818359375, -1.52728271484375, -1.38818359375, -1.24908447265625, -1.1099853515625, -0.97088623046875, -0.831787109375, -0.69268798828125, -0.5535888671875, -0.41448974609375, -0.275390625, -0.13629150390625, 0.0028076171875, 0.14190673828125, 0.281005859375, 0.42010498046875, 0.5592041015625, 0.69830322265625, 0.83740234375, 0.97650146484375, 1.1156005859375, 1.25469970703125, 1.393798828125, 1.53289794921875, 1.6719970703125, 1.81109619140625, 1.9501953125, 2.08929443359375, 2.2283935546875, 2.36749267578125, 2.506591796875, 2.64569091796875, 2.7847900390625, 2.92388916015625, 3.06298828125, 3.20208740234375, 3.3411865234375, 3.48028564453125, 3.619384765625, 3.75848388671875, 3.8975830078125, 4.03668212890625, 4.17578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 7.0, 6.0, 5.0, 11.0, 12.0, 16.0, 14.0, 27.0, 27.0, 24.0, 29.0, 35.0, 30.0, 46.0, 53.0, 42.0, 48.0, 45.0, 49.0, 52.0, 57.0, 49.0, 35.0, 39.0, 31.0, 30.0, 36.0, 21.0, 19.0, 13.0, 18.0, 12.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.595703125, -2.51434326171875, -2.4329833984375, -2.35162353515625, -2.270263671875, -2.18890380859375, -2.1075439453125, -2.02618408203125, -1.94482421875, -1.86346435546875, -1.7821044921875, -1.70074462890625, -1.619384765625, -1.53802490234375, -1.4566650390625, -1.37530517578125, -1.2939453125, -1.21258544921875, -1.1312255859375, -1.04986572265625, -0.968505859375, -0.88714599609375, -0.8057861328125, -0.72442626953125, -0.64306640625, -0.56170654296875, -0.4803466796875, -0.39898681640625, -0.317626953125, -0.23626708984375, -0.1549072265625, -0.07354736328125, 0.0078125, 0.08917236328125, 0.1705322265625, 0.25189208984375, 0.333251953125, 0.41461181640625, 0.4959716796875, 0.57733154296875, 0.65869140625, 0.74005126953125, 0.8214111328125, 0.90277099609375, 0.984130859375, 1.06549072265625, 1.1468505859375, 1.22821044921875, 1.3095703125, 1.39093017578125, 1.4722900390625, 1.55364990234375, 1.635009765625, 1.71636962890625, 1.7977294921875, 1.87908935546875, 1.96044921875, 2.04180908203125, 2.1231689453125, 2.20452880859375, 2.285888671875, 2.36724853515625, 2.4486083984375, 2.52996826171875, 2.611328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 8.0, 8.0, 20.0, 20.0, 57.0, 91.0, 169.0, 396.0, 973.0, 4099.0, 23121.0, 233116.0, 728832.0, 47914.0, 7029.0, 1656.0, 541.0, 234.0, 109.0, 65.0, 25.0, 15.0, 18.0, 7.0, 12.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4810791015625, -1.437744140625, -1.3944091796875, -1.35107421875, -1.3077392578125, -1.264404296875, -1.2210693359375, -1.177734375, -1.1343994140625, -1.091064453125, -1.0477294921875, -1.00439453125, -0.9610595703125, -0.917724609375, -0.8743896484375, -0.8310546875, -0.7877197265625, -0.744384765625, -0.7010498046875, -0.65771484375, -0.6143798828125, -0.571044921875, -0.5277099609375, -0.484375, -0.4410400390625, -0.397705078125, -0.3543701171875, -0.31103515625, -0.2677001953125, -0.224365234375, -0.1810302734375, -0.1376953125, -0.0943603515625, -0.051025390625, -0.0076904296875, 0.03564453125, 0.0789794921875, 0.122314453125, 0.1656494140625, 0.208984375, 0.2523193359375, 0.295654296875, 0.3389892578125, 0.38232421875, 0.4256591796875, 0.468994140625, 0.5123291015625, 0.5556640625, 0.5989990234375, 0.642333984375, 0.6856689453125, 0.72900390625, 0.7723388671875, 0.815673828125, 0.8590087890625, 0.90234375, 0.9456787109375, 0.989013671875, 1.0323486328125, 1.07568359375, 1.1190185546875, 1.162353515625, 1.2056884765625, 1.2490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 3.0, 5.0, 7.0, 7.0, 9.0, 13.0, 20.0, 23.0, 28.0, 20.0, 46.0, 75.0, 112.0, 144.0, 135.0, 85.0, 67.0, 38.0, 36.0, 17.0, 25.0, 12.0, 6.0, 12.0, 7.0, 8.0, 5.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026607513427734375, -0.0002579689025878906, -0.0002498626708984375, -0.00024175643920898438, -0.00023365020751953125, -0.00022554397583007812, -0.000217437744140625, -0.00020933151245117188, -0.00020122528076171875, -0.00019311904907226562, -0.0001850128173828125, -0.00017690658569335938, -0.00016880035400390625, -0.00016069412231445312, -0.000152587890625, -0.00014448165893554688, -0.00013637542724609375, -0.00012826919555664062, -0.0001201629638671875, -0.00011205673217773438, -0.00010395050048828125, -9.584426879882812e-05, -8.7738037109375e-05, -7.963180541992188e-05, -7.152557373046875e-05, -6.341934204101562e-05, -5.53131103515625e-05, -4.7206878662109375e-05, -3.910064697265625e-05, -3.0994415283203125e-05, -2.288818359375e-05, -1.4781951904296875e-05, -6.67572021484375e-06, 1.430511474609375e-06, 9.5367431640625e-06, 1.7642974853515625e-05, 2.574920654296875e-05, 3.3855438232421875e-05, 4.1961669921875e-05, 5.0067901611328125e-05, 5.817413330078125e-05, 6.628036499023438e-05, 7.43865966796875e-05, 8.249282836914062e-05, 9.059906005859375e-05, 9.870529174804688e-05, 0.0001068115234375, 0.00011491775512695312, 0.00012302398681640625, 0.00013113021850585938, 0.0001392364501953125, 0.00014734268188476562, 0.00015544891357421875, 0.00016355514526367188, 0.000171661376953125, 0.00017976760864257812, 0.00018787384033203125, 0.00019598007202148438, 0.0002040863037109375, 0.00021219253540039062, 0.00022029876708984375, 0.00022840499877929688, 0.00023651123046875, 0.0002446174621582031, 0.00025272369384765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 10.0, 16.0, 24.0, 32.0, 46.0, 87.0, 124.0, 193.0, 344.0, 686.0, 1158.0, 2549.0, 6665.0, 23055.0, 108089.0, 688765.0, 169311.0, 32165.0, 8869.0, 3075.0, 1402.0, 752.0, 427.0, 226.0, 148.0, 115.0, 65.0, 41.0, 31.0, 23.0, 8.0, 11.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7242584228515625, -0.697052001953125, -0.6698455810546875, -0.64263916015625, -0.6154327392578125, -0.588226318359375, -0.5610198974609375, -0.5338134765625, -0.5066070556640625, -0.479400634765625, -0.4521942138671875, -0.42498779296875, -0.3977813720703125, -0.370574951171875, -0.3433685302734375, -0.316162109375, -0.2889556884765625, -0.261749267578125, -0.2345428466796875, -0.20733642578125, -0.1801300048828125, -0.152923583984375, -0.1257171630859375, -0.0985107421875, -0.0713043212890625, -0.044097900390625, -0.0168914794921875, 0.01031494140625, 0.0375213623046875, 0.064727783203125, 0.0919342041015625, 0.119140625, 0.1463470458984375, 0.173553466796875, 0.2007598876953125, 0.22796630859375, 0.2551727294921875, 0.282379150390625, 0.3095855712890625, 0.3367919921875, 0.3639984130859375, 0.391204833984375, 0.4184112548828125, 0.44561767578125, 0.4728240966796875, 0.500030517578125, 0.5272369384765625, 0.554443359375, 0.5816497802734375, 0.608856201171875, 0.6360626220703125, 0.66326904296875, 0.6904754638671875, 0.717681884765625, 0.7448883056640625, 0.7720947265625, 0.7993011474609375, 0.826507568359375, 0.8537139892578125, 0.88092041015625, 0.9081268310546875, 0.935333251953125, 0.9625396728515625, 0.98974609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 8.0, 12.0, 8.0, 7.0, 17.0, 25.0, 31.0, 38.0, 50.0, 62.0, 78.0, 94.0, 86.0, 85.0, 86.0, 63.0, 48.0, 32.0, 26.0, 27.0, 24.0, 18.0, 18.0, 12.0, 6.0, 4.0, 11.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73193359375, -0.7071914672851562, -0.6824493408203125, -0.6577072143554688, -0.632965087890625, -0.6082229614257812, -0.5834808349609375, -0.5587387084960938, -0.53399658203125, -0.5092544555664062, -0.4845123291015625, -0.45977020263671875, -0.435028076171875, -0.41028594970703125, -0.3855438232421875, -0.36080169677734375, -0.3360595703125, -0.31131744384765625, -0.2865753173828125, -0.26183319091796875, -0.237091064453125, -0.21234893798828125, -0.1876068115234375, -0.16286468505859375, -0.13812255859375, -0.11338043212890625, -0.0886383056640625, -0.06389617919921875, -0.039154052734375, -0.01441192626953125, 0.0103302001953125, 0.03507232666015625, 0.059814453125, 0.08455657958984375, 0.1092987060546875, 0.13404083251953125, 0.158782958984375, 0.18352508544921875, 0.2082672119140625, 0.23300933837890625, 0.25775146484375, 0.28249359130859375, 0.3072357177734375, 0.33197784423828125, 0.356719970703125, 0.38146209716796875, 0.4062042236328125, 0.43094635009765625, 0.4556884765625, 0.48043060302734375, 0.5051727294921875, 0.5299148559570312, 0.554656982421875, 0.5793991088867188, 0.6041412353515625, 0.6288833618164062, 0.65362548828125, 0.6783676147460938, 0.7031097412109375, 0.7278518676757812, 0.752593994140625, 0.7773361206054688, 0.8020782470703125, 0.8268203735351562, 0.8515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 10.0, 17.0, 64.0, 166.0, 432.0, 196.0, 67.0, 26.0, 8.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.84894561767578, -36.7847785949707, -35.720611572265625, -34.65644073486328, -33.5922737121582, -32.528106689453125, -31.463937759399414, -30.399768829345703, -29.335601806640625, -28.271434783935547, -27.207265853881836, -26.143096923828125, -25.078929901123047, -24.01476287841797, -22.950593948364258, -21.886425018310547, -20.82225799560547, -19.75809097290039, -18.69392204284668, -17.62975311279297, -16.56558609008789, -15.501418113708496, -14.437250137329102, -13.373082160949707, -12.308914184570312, -11.244746208190918, -10.180578231811523, -9.116410255432129, -8.052242279052734, -6.98807430267334, -5.923906326293945, -4.859738349914551, -3.795574188232422, -2.7314062118530273, -1.6672382354736328, -0.6030702590942383, 0.46109771728515625, 1.5252656936645508, 2.5894336700439453, 3.65360164642334, 4.717769622802734, 5.781937599182129, 6.846105575561523, 7.910273551940918, 8.974441528320312, 10.038609504699707, 11.102777481079102, 12.166945457458496, 13.23111343383789, 14.295281410217285, 15.35944938659668, 16.42361831665039, 17.48778533935547, 18.551952362060547, 19.616121292114258, 20.68029022216797, 21.744457244873047, 22.808624267578125, 23.872793197631836, 24.936962127685547, 26.001129150390625, 27.065296173095703, 28.129465103149414, 29.193634033203125, 30.257801055908203]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 12.0, 16.0, 9.0, 9.0, 14.0, 21.0, 30.0, 33.0, 30.0, 49.0, 47.0, 34.0, 71.0, 60.0, 71.0, 77.0, 69.0, 40.0, 38.0, 35.0, 42.0, 18.0, 34.0, 23.0, 22.0, 14.0, 11.0, 12.0, 11.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.929452896118164, -9.5798978805542, -9.230341911315918, -8.880786895751953, -8.531230926513672, -8.181675910949707, -7.832120418548584, -7.482564926147461, -7.133009910583496, -6.783454418182373, -6.43389892578125, -6.084343910217285, -5.734788417816162, -5.385232925415039, -5.035677433013916, -4.686121940612793, -4.33656644821167, -3.987010955810547, -3.637455701828003, -3.28790020942688, -2.938344955444336, -2.588789463043213, -2.23923397064209, -1.889678716659546, -1.5401232242584229, -1.1905678510665894, -0.8410124182701111, -0.4914569854736328, -0.14190161228179932, 0.20765376091003418, 0.5572092533111572, 0.9067645072937012, 1.2563199996948242, 1.6058753728866577, 1.9554307460784912, 2.3049862384796143, 2.654541492462158, 3.0040969848632812, 3.3536524772644043, 3.7032077312469482, 4.052762985229492, 4.402318477630615, 4.751873970031738, 5.101428985595703, 5.450984477996826, 5.800539970397949, 6.150095462799072, 6.499650955200195, 6.849206447601318, 7.198761940002441, 7.5483174324035645, 7.8978729248046875, 8.247427940368652, 8.596982955932617, 8.946538925170898, 9.296093940734863, 9.645649909973145, 9.99520492553711, 10.34476089477539, 10.694315910339355, 11.043871879577637, 11.393426895141602, 11.742982864379883, 12.092537879943848, 12.442092895507812]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 19.0, 13.0, 26.0, 44.0, 95.0, 186.0, 405.0, 1184.0, 4361.0, 24405.0, 338349.0, 3553119.0, 245353.0, 20902.0, 3990.0, 1078.0, 396.0, 161.0, 86.0, 41.0, 20.0, 15.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.9644622802734375, -1.907440185546875, -1.8504180908203125, -1.79339599609375, -1.7363739013671875, -1.679351806640625, -1.6223297119140625, -1.5653076171875, -1.5082855224609375, -1.451263427734375, -1.3942413330078125, -1.33721923828125, -1.2801971435546875, -1.223175048828125, -1.1661529541015625, -1.109130859375, -1.0521087646484375, -0.995086669921875, -0.9380645751953125, -0.88104248046875, -0.8240203857421875, -0.766998291015625, -0.7099761962890625, -0.6529541015625, -0.5959320068359375, -0.538909912109375, -0.4818878173828125, -0.42486572265625, -0.3678436279296875, -0.310821533203125, -0.2537994384765625, -0.19677734375, -0.1397552490234375, -0.082733154296875, -0.0257110595703125, 0.03131103515625, 0.0883331298828125, 0.145355224609375, 0.2023773193359375, 0.2593994140625, 0.3164215087890625, 0.373443603515625, 0.4304656982421875, 0.48748779296875, 0.5445098876953125, 0.601531982421875, 0.6585540771484375, 0.715576171875, 0.7725982666015625, 0.829620361328125, 0.8866424560546875, 0.94366455078125, 1.0006866455078125, 1.057708740234375, 1.1147308349609375, 1.1717529296875, 1.2287750244140625, 1.285797119140625, 1.3428192138671875, 1.39984130859375, 1.4568634033203125, 1.513885498046875, 1.5709075927734375, 1.6279296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 18.0, 18.0, 24.0, 27.0, 44.0, 41.0, 41.0, 70.0, 64.0, 81.0, 69.0, 73.0, 71.0, 75.0, 64.0, 59.0, 39.0, 26.0, 31.0, 15.0, 13.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.359375, -1.3295745849609375, -1.299774169921875, -1.2699737548828125, -1.24017333984375, -1.2103729248046875, -1.180572509765625, -1.1507720947265625, -1.1209716796875, -1.0911712646484375, -1.061370849609375, -1.0315704345703125, -1.00177001953125, -0.9719696044921875, -0.942169189453125, -0.9123687744140625, -0.882568359375, -0.8527679443359375, -0.822967529296875, -0.7931671142578125, -0.76336669921875, -0.7335662841796875, -0.703765869140625, -0.6739654541015625, -0.6441650390625, -0.6143646240234375, -0.584564208984375, -0.5547637939453125, -0.52496337890625, -0.4951629638671875, -0.465362548828125, -0.4355621337890625, -0.40576171875, -0.3759613037109375, -0.346160888671875, -0.3163604736328125, -0.28656005859375, -0.2567596435546875, -0.226959228515625, -0.1971588134765625, -0.1673583984375, -0.1375579833984375, -0.107757568359375, -0.0779571533203125, -0.04815673828125, -0.0183563232421875, 0.011444091796875, 0.0412445068359375, 0.071044921875, 0.1008453369140625, 0.130645751953125, 0.1604461669921875, 0.19024658203125, 0.2200469970703125, 0.249847412109375, 0.2796478271484375, 0.3094482421875, 0.3392486572265625, 0.369049072265625, 0.3988494873046875, 0.42864990234375, 0.4584503173828125, 0.488250732421875, 0.5180511474609375, 0.5478515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 15.0, 35.0, 61.0, 88.0, 168.0, 379.0, 789.0, 2099.0, 6085.0, 29776.0, 549361.0, 3481500.0, 105856.0, 12708.0, 3265.0, 1173.0, 416.0, 230.0, 100.0, 59.0, 28.0, 14.0, 17.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.8797607421875, -2.802490234375, -2.7252197265625, -2.64794921875, -2.5706787109375, -2.493408203125, -2.4161376953125, -2.3388671875, -2.2615966796875, -2.184326171875, -2.1070556640625, -2.02978515625, -1.9525146484375, -1.875244140625, -1.7979736328125, -1.720703125, -1.6434326171875, -1.566162109375, -1.4888916015625, -1.41162109375, -1.3343505859375, -1.257080078125, -1.1798095703125, -1.1025390625, -1.0252685546875, -0.947998046875, -0.8707275390625, -0.79345703125, -0.7161865234375, -0.638916015625, -0.5616455078125, -0.484375, -0.4071044921875, -0.329833984375, -0.2525634765625, -0.17529296875, -0.0980224609375, -0.020751953125, 0.0565185546875, 0.1337890625, 0.2110595703125, 0.288330078125, 0.3656005859375, 0.44287109375, 0.5201416015625, 0.597412109375, 0.6746826171875, 0.751953125, 0.8292236328125, 0.906494140625, 0.9837646484375, 1.06103515625, 1.1383056640625, 1.215576171875, 1.2928466796875, 1.3701171875, 1.4473876953125, 1.524658203125, 1.6019287109375, 1.67919921875, 1.7564697265625, 1.833740234375, 1.9110107421875, 1.98828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 4.0, 18.0, 16.0, 32.0, 64.0, 93.0, 165.0, 306.0, 700.0, 974.0, 795.0, 402.0, 201.0, 96.0, 69.0, 38.0, 24.0, 20.0, 4.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.703399658203125, -2.63531494140625, -2.567230224609375, -2.4991455078125, -2.431060791015625, -2.36297607421875, -2.294891357421875, -2.226806640625, -2.158721923828125, -2.09063720703125, -2.022552490234375, -1.9544677734375, -1.886383056640625, -1.81829833984375, -1.750213623046875, -1.68212890625, -1.614044189453125, -1.54595947265625, -1.477874755859375, -1.4097900390625, -1.341705322265625, -1.27362060546875, -1.205535888671875, -1.137451171875, -1.069366455078125, -1.00128173828125, -0.933197021484375, -0.8651123046875, -0.797027587890625, -0.72894287109375, -0.660858154296875, -0.5927734375, -0.524688720703125, -0.45660400390625, -0.388519287109375, -0.3204345703125, -0.252349853515625, -0.18426513671875, -0.116180419921875, -0.048095703125, 0.019989013671875, 0.08807373046875, 0.156158447265625, 0.2242431640625, 0.292327880859375, 0.36041259765625, 0.428497314453125, 0.49658203125, 0.564666748046875, 0.63275146484375, 0.700836181640625, 0.7689208984375, 0.837005615234375, 0.90509033203125, 0.973175048828125, 1.041259765625, 1.109344482421875, 1.17742919921875, 1.245513916015625, 1.3135986328125, 1.381683349609375, 1.44976806640625, 1.517852783203125, 1.5859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 4.0, 7.0, 20.0, 63.0, 215.0, 390.0, 214.0, 48.0, 18.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.615047454833984, -43.541160583496094, -42.46727752685547, -41.39339065551758, -40.31950759887695, -39.24562072753906, -38.17173767089844, -37.09785079956055, -36.02396774291992, -34.95008087158203, -33.876197814941406, -32.802310943603516, -31.72842788696289, -30.654542922973633, -29.580657958984375, -28.506771087646484, -27.432886123657227, -26.35900115966797, -25.28511619567871, -24.211231231689453, -23.137346267700195, -22.063461303710938, -20.989574432373047, -19.915691375732422, -18.84180450439453, -17.767919540405273, -16.694034576416016, -15.620149612426758, -14.5462646484375, -13.472379684448242, -12.398493766784668, -11.32460880279541, -10.250724792480469, -9.176839828491211, -8.102954864501953, -7.029069423675537, -5.955184459686279, -4.8812994956970215, -3.8074140548706055, -2.7335290908813477, -1.6596441268920898, -0.5857590436935425, 0.4881260395050049, 1.5620112419128418, 2.6358962059020996, 3.7097811698913574, 4.783666610717773, 5.857551574707031, 6.931436538696289, 8.005321502685547, 9.079206466674805, 10.153091430664062, 11.22697639465332, 12.300861358642578, 13.374747276306152, 14.44863224029541, 15.522517204284668, 16.596403121948242, 17.6702880859375, 18.744173049926758, 19.818058013916016, 20.891942977905273, 21.96582794189453, 23.03971290588379, 24.113597869873047]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 11.0, 6.0, 14.0, 16.0, 20.0, 31.0, 32.0, 41.0, 42.0, 57.0, 55.0, 60.0, 67.0, 65.0, 69.0, 67.0, 60.0, 67.0, 41.0, 38.0, 27.0, 25.0, 27.0, 14.0, 14.0, 8.0, 9.0, 3.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.014646530151367, -8.716702461242676, -8.418757438659668, -8.120813369750977, -7.822869300842285, -7.5249247550964355, -7.226980209350586, -6.9290361404418945, -6.631091594696045, -6.333147048950195, -6.035202980041504, -5.737258434295654, -5.439313888549805, -5.141369819641113, -4.843425273895264, -4.545480728149414, -4.247536659240723, -3.949592351913452, -3.6516480445861816, -3.353703498840332, -3.0557591915130615, -2.757814884185791, -2.4598703384399414, -2.161926031112671, -1.8639817237854004, -1.5660374164581299, -1.2680929899215698, -0.9701486229896545, -0.6722042560577393, -0.37425994873046875, -0.07631552219390869, 0.22162890434265137, 0.5195732116699219, 0.8175175786018372, 1.1154619455337524, 1.4134063720703125, 1.711350679397583, 2.0092949867248535, 2.307239532470703, 2.6051838397979736, 2.903128147125244, 3.2010724544525146, 3.499016761779785, 3.7969613075256348, 4.094905853271484, 4.392849922180176, 4.690794467926025, 4.988739013671875, 5.286683082580566, 5.584627628326416, 5.882571697235107, 6.180516242980957, 6.478460311889648, 6.776404857635498, 7.074349403381348, 7.372293472290039, 7.670238018035889, 7.968182563781738, 8.26612663269043, 8.564070701599121, 8.862015724182129, 9.15995979309082, 9.457903861999512, 9.75584888458252, 10.053792953491211]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 8.0, 13.0, 20.0, 39.0, 37.0, 93.0, 190.0, 338.0, 877.0, 2121.0, 6428.0, 27219.0, 213558.0, 646271.0, 125099.0, 18198.0, 4970.0, 1684.0, 694.0, 306.0, 143.0, 75.0, 34.0, 35.0, 25.0, 14.0, 11.0, 10.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5157928466796875, -1.464202880859375, -1.4126129150390625, -1.36102294921875, -1.3094329833984375, -1.257843017578125, -1.2062530517578125, -1.1546630859375, -1.1030731201171875, -1.051483154296875, -0.9998931884765625, -0.94830322265625, -0.8967132568359375, -0.845123291015625, -0.7935333251953125, -0.741943359375, -0.6903533935546875, -0.638763427734375, -0.5871734619140625, -0.53558349609375, -0.4839935302734375, -0.432403564453125, -0.3808135986328125, -0.3292236328125, -0.2776336669921875, -0.226043701171875, -0.1744537353515625, -0.12286376953125, -0.0712738037109375, -0.019683837890625, 0.0319061279296875, 0.08349609375, 0.1350860595703125, 0.186676025390625, 0.2382659912109375, 0.28985595703125, 0.3414459228515625, 0.393035888671875, 0.4446258544921875, 0.4962158203125, 0.5478057861328125, 0.599395751953125, 0.6509857177734375, 0.70257568359375, 0.7541656494140625, 0.805755615234375, 0.8573455810546875, 0.908935546875, 0.9605255126953125, 1.012115478515625, 1.0637054443359375, 1.11529541015625, 1.1668853759765625, 1.218475341796875, 1.2700653076171875, 1.3216552734375, 1.3732452392578125, 1.424835205078125, 1.4764251708984375, 1.52801513671875, 1.5796051025390625, 1.631195068359375, 1.6827850341796875, 1.734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 10.0, 15.0, 28.0, 20.0, 36.0, 32.0, 53.0, 62.0, 59.0, 67.0, 77.0, 68.0, 70.0, 78.0, 60.0, 51.0, 59.0, 53.0, 29.0, 26.0, 11.0, 12.0, 11.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3310546875, -1.2988510131835938, -1.2666473388671875, -1.2344436645507812, -1.202239990234375, -1.1700363159179688, -1.1378326416015625, -1.1056289672851562, -1.07342529296875, -1.0412216186523438, -1.0090179443359375, -0.9768142700195312, -0.944610595703125, -0.9124069213867188, -0.8802032470703125, -0.8479995727539062, -0.8157958984375, -0.7835922241210938, -0.7513885498046875, -0.7191848754882812, -0.686981201171875, -0.6547775268554688, -0.6225738525390625, -0.5903701782226562, -0.55816650390625, -0.5259628295898438, -0.4937591552734375, -0.46155548095703125, -0.429351806640625, -0.39714813232421875, -0.3649444580078125, -0.33274078369140625, -0.300537109375, -0.26833343505859375, -0.2361297607421875, -0.20392608642578125, -0.171722412109375, -0.13951873779296875, -0.1073150634765625, -0.07511138916015625, -0.04290771484375, -0.01070404052734375, 0.0214996337890625, 0.05370330810546875, 0.085906982421875, 0.11811065673828125, 0.1503143310546875, 0.18251800537109375, 0.2147216796875, 0.24692535400390625, 0.2791290283203125, 0.31133270263671875, 0.343536376953125, 0.37574005126953125, 0.4079437255859375, 0.44014739990234375, 0.47235107421875, 0.5045547485351562, 0.5367584228515625, 0.5689620971679688, 0.601165771484375, 0.6333694458007812, 0.6655731201171875, 0.6977767944335938, 0.72998046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 13.0, 24.0, 24.0, 39.0, 48.0, 71.0, 121.0, 221.0, 343.0, 689.0, 1566.0, 3795.0, 13313.0, 85441.0, 669559.0, 232385.0, 29858.0, 6559.0, 2302.0, 981.0, 467.0, 254.0, 147.0, 75.0, 66.0, 45.0, 27.0, 28.0, 15.0, 8.0, 11.0, 11.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.59375, -1.5465087890625, -1.499267578125, -1.4520263671875, -1.40478515625, -1.3575439453125, -1.310302734375, -1.2630615234375, -1.2158203125, -1.1685791015625, -1.121337890625, -1.0740966796875, -1.02685546875, -0.9796142578125, -0.932373046875, -0.8851318359375, -0.837890625, -0.7906494140625, -0.743408203125, -0.6961669921875, -0.64892578125, -0.6016845703125, -0.554443359375, -0.5072021484375, -0.4599609375, -0.4127197265625, -0.365478515625, -0.3182373046875, -0.27099609375, -0.2237548828125, -0.176513671875, -0.1292724609375, -0.08203125, -0.0347900390625, 0.012451171875, 0.0596923828125, 0.10693359375, 0.1541748046875, 0.201416015625, 0.2486572265625, 0.2958984375, 0.3431396484375, 0.390380859375, 0.4376220703125, 0.48486328125, 0.5321044921875, 0.579345703125, 0.6265869140625, 0.673828125, 0.7210693359375, 0.768310546875, 0.8155517578125, 0.86279296875, 0.9100341796875, 0.957275390625, 1.0045166015625, 1.0517578125, 1.0989990234375, 1.146240234375, 1.1934814453125, 1.24072265625, 1.2879638671875, 1.335205078125, 1.3824462890625, 1.4296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 9.0, 8.0, 18.0, 20.0, 25.0, 16.0, 39.0, 42.0, 56.0, 47.0, 43.0, 50.0, 63.0, 55.0, 75.0, 54.0, 55.0, 56.0, 38.0, 46.0, 35.0, 30.0, 28.0, 27.0, 18.0, 5.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.241455078125, -2.15087890625, -2.060302734375, -1.9697265625, -1.879150390625, -1.78857421875, -1.697998046875, -1.607421875, -1.516845703125, -1.42626953125, -1.335693359375, -1.2451171875, -1.154541015625, -1.06396484375, -0.973388671875, -0.8828125, -0.792236328125, -0.70166015625, -0.611083984375, -0.5205078125, -0.429931640625, -0.33935546875, -0.248779296875, -0.158203125, -0.067626953125, 0.02294921875, 0.113525390625, 0.2041015625, 0.294677734375, 0.38525390625, 0.475830078125, 0.56640625, 0.656982421875, 0.74755859375, 0.838134765625, 0.9287109375, 1.019287109375, 1.10986328125, 1.200439453125, 1.291015625, 1.381591796875, 1.47216796875, 1.562744140625, 1.6533203125, 1.743896484375, 1.83447265625, 1.925048828125, 2.015625, 2.106201171875, 2.19677734375, 2.287353515625, 2.3779296875, 2.468505859375, 2.55908203125, 2.649658203125, 2.740234375, 2.830810546875, 2.92138671875, 3.011962890625, 3.1025390625, 3.193115234375, 3.28369140625, 3.374267578125, 3.46484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 9.0, 15.0, 19.0, 25.0, 19.0, 36.0, 82.0, 135.0, 250.0, 610.0, 1288.0, 3138.0, 8527.0, 28152.0, 124765.0, 639004.0, 185569.0, 38701.0, 11171.0, 3912.0, 1633.0, 710.0, 362.0, 171.0, 86.0, 55.0, 38.0, 20.0, 15.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5498046875, -0.5334510803222656, -0.5170974731445312, -0.5007438659667969, -0.4843902587890625, -0.4680366516113281, -0.45168304443359375, -0.4353294372558594, -0.418975830078125, -0.4026222229003906, -0.38626861572265625, -0.3699150085449219, -0.3535614013671875, -0.3372077941894531, -0.32085418701171875, -0.3045005798339844, -0.28814697265625, -0.2717933654785156, -0.25543975830078125, -0.23908615112304688, -0.2227325439453125, -0.20637893676757812, -0.19002532958984375, -0.17367172241210938, -0.157318115234375, -0.14096450805664062, -0.12461090087890625, -0.10825729370117188, -0.0919036865234375, -0.07555007934570312, -0.05919647216796875, -0.042842864990234375, -0.0264892578125, -0.010135650634765625, 0.00621795654296875, 0.022571563720703125, 0.0389251708984375, 0.055278778076171875, 0.07163238525390625, 0.08798599243164062, 0.104339599609375, 0.12069320678710938, 0.13704681396484375, 0.15340042114257812, 0.1697540283203125, 0.18610763549804688, 0.20246124267578125, 0.21881484985351562, 0.23516845703125, 0.2515220642089844, 0.26787567138671875, 0.2842292785644531, 0.3005828857421875, 0.3169364929199219, 0.33329010009765625, 0.3496437072753906, 0.365997314453125, 0.3823509216308594, 0.39870452880859375, 0.4150581359863281, 0.4314117431640625, 0.4477653503417969, 0.46411895751953125, 0.4804725646972656, 0.496826171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 12.0, 18.0, 16.0, 35.0, 57.0, 93.0, 144.0, 175.0, 176.0, 102.0, 73.0, 32.0, 22.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000270843505859375, -0.0002632215619087219, -0.00025559961795806885, -0.00024797767400741577, -0.0002403557300567627, -0.00023273378610610962, -0.00022511184215545654, -0.00021748989820480347, -0.0002098679542541504, -0.00020224601030349731, -0.00019462406635284424, -0.00018700212240219116, -0.00017938017845153809, -0.000171758234500885, -0.00016413629055023193, -0.00015651434659957886, -0.00014889240264892578, -0.0001412704586982727, -0.00013364851474761963, -0.00012602657079696655, -0.00011840462684631348, -0.0001107826828956604, -0.00010316073894500732, -9.553879499435425e-05, -8.791685104370117e-05, -8.02949070930481e-05, -7.267296314239502e-05, -6.505101919174194e-05, -5.742907524108887e-05, -4.980713129043579e-05, -4.2185187339782715e-05, -3.456324338912964e-05, -2.6941299438476562e-05, -1.9319355487823486e-05, -1.169741153717041e-05, -4.075467586517334e-06, 3.546476364135742e-06, 1.1168420314788818e-05, 1.8790364265441895e-05, 2.641230821609497e-05, 3.403425216674805e-05, 4.165619611740112e-05, 4.92781400680542e-05, 5.6900084018707275e-05, 6.452202796936035e-05, 7.214397192001343e-05, 7.97659158706665e-05, 8.738785982131958e-05, 9.500980377197266e-05, 0.00010263174772262573, 0.00011025369167327881, 0.00011787563562393188, 0.00012549757957458496, 0.00013311952352523804, 0.0001407414674758911, 0.0001483634114265442, 0.00015598535537719727, 0.00016360729932785034, 0.00017122924327850342, 0.0001788511872291565, 0.00018647313117980957, 0.00019409507513046265, 0.00020171701908111572, 0.0002093389630317688, 0.00021696090698242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 17.0, 17.0, 26.0, 24.0, 36.0, 68.0, 99.0, 200.0, 328.0, 637.0, 1554.0, 3890.0, 11349.0, 41087.0, 189892.0, 622983.0, 131790.0, 30084.0, 8838.0, 3077.0, 1245.0, 526.0, 307.0, 153.0, 103.0, 61.0, 42.0, 31.0, 17.0, 20.0, 14.0, 7.0, 5.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.607421875, -0.5902557373046875, -0.573089599609375, -0.5559234619140625, -0.53875732421875, -0.5215911865234375, -0.504425048828125, -0.4872589111328125, -0.4700927734375, -0.4529266357421875, -0.435760498046875, -0.4185943603515625, -0.40142822265625, -0.3842620849609375, -0.367095947265625, -0.3499298095703125, -0.332763671875, -0.3155975341796875, -0.298431396484375, -0.2812652587890625, -0.26409912109375, -0.2469329833984375, -0.229766845703125, -0.2126007080078125, -0.1954345703125, -0.1782684326171875, -0.161102294921875, -0.1439361572265625, -0.12677001953125, -0.1096038818359375, -0.092437744140625, -0.0752716064453125, -0.05810546875, -0.0409393310546875, -0.023773193359375, -0.0066070556640625, 0.01055908203125, 0.0277252197265625, 0.044891357421875, 0.0620574951171875, 0.0792236328125, 0.0963897705078125, 0.113555908203125, 0.1307220458984375, 0.14788818359375, 0.1650543212890625, 0.182220458984375, 0.1993865966796875, 0.216552734375, 0.2337188720703125, 0.250885009765625, 0.2680511474609375, 0.28521728515625, 0.3023834228515625, 0.319549560546875, 0.3367156982421875, 0.3538818359375, 0.3710479736328125, 0.388214111328125, 0.4053802490234375, 0.42254638671875, 0.4397125244140625, 0.456878662109375, 0.4740447998046875, 0.4912109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 7.0, 14.0, 24.0, 22.0, 39.0, 44.0, 65.0, 97.0, 110.0, 103.0, 111.0, 95.0, 62.0, 58.0, 33.0, 37.0, 17.0, 18.0, 9.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.942718505859375, -0.92059326171875, -0.898468017578125, -0.8763427734375, -0.854217529296875, -0.83209228515625, -0.809967041015625, -0.787841796875, -0.765716552734375, -0.74359130859375, -0.721466064453125, -0.6993408203125, -0.677215576171875, -0.65509033203125, -0.632965087890625, -0.61083984375, -0.588714599609375, -0.56658935546875, -0.544464111328125, -0.5223388671875, -0.500213623046875, -0.47808837890625, -0.455963134765625, -0.433837890625, -0.411712646484375, -0.38958740234375, -0.367462158203125, -0.3453369140625, -0.323211669921875, -0.30108642578125, -0.278961181640625, -0.2568359375, -0.234710693359375, -0.21258544921875, -0.190460205078125, -0.1683349609375, -0.146209716796875, -0.12408447265625, -0.101959228515625, -0.079833984375, -0.057708740234375, -0.03558349609375, -0.013458251953125, 0.0086669921875, 0.030792236328125, 0.05291748046875, 0.075042724609375, 0.09716796875, 0.119293212890625, 0.14141845703125, 0.163543701171875, 0.1856689453125, 0.207794189453125, 0.22991943359375, 0.252044677734375, 0.274169921875, 0.296295166015625, 0.31842041015625, 0.340545654296875, 0.3626708984375, 0.384796142578125, 0.40692138671875, 0.429046630859375, 0.451171875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 18.0, 29.0, 70.0, 174.0, 319.0, 210.0, 97.0, 28.0, 16.0, 13.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.155841827392578, -24.617198944091797, -24.078556060791016, -23.539913177490234, -23.001270294189453, -22.462627410888672, -21.92398452758789, -21.385339736938477, -20.846696853637695, -20.308053970336914, -19.769411087036133, -19.23076820373535, -18.69212532043457, -18.153480529785156, -17.614837646484375, -17.076194763183594, -16.537551879882812, -15.998908996582031, -15.46026611328125, -14.921623229980469, -14.382979393005371, -13.84433650970459, -13.305693626403809, -12.767050743103027, -12.228408813476562, -11.689765930175781, -11.151123046875, -10.612480163574219, -10.073836326599121, -9.53519344329834, -8.996550559997559, -8.457907676696777, -7.91926383972168, -7.380620956420898, -6.841977596282959, -6.303334712982178, -5.764691352844238, -5.226048469543457, -4.687405586242676, -4.1487627029418945, -3.610119342803955, -3.0714762210845947, -2.5328330993652344, -1.9941902160644531, -1.4555470943450928, -0.9169039726257324, -0.37826108932495117, 0.16038203239440918, 0.6990251541137695, 1.2376682758331299, 1.7763112783432007, 2.3149542808532715, 2.853597402572632, 3.392240524291992, 3.9308834075927734, 4.469526290893555, 5.008169651031494, 5.546812534332275, 6.085455894470215, 6.624098777770996, 7.162741661071777, 7.701385021209717, 8.240028381347656, 8.778671264648438, 9.317314147949219]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 16.0, 17.0, 18.0, 15.0, 31.0, 25.0, 36.0, 35.0, 47.0, 53.0, 61.0, 92.0, 81.0, 75.0, 55.0, 41.0, 48.0, 33.0, 35.0, 29.0, 34.0, 25.0, 15.0, 15.0, 10.0, 10.0, 11.0, 11.0, 4.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9634370803833, -9.612728118896484, -9.262018203735352, -8.911308288574219, -8.560599327087402, -8.209890365600586, -7.859180450439453, -7.5084710121154785, -7.157761573791504, -6.807052135467529, -6.456342697143555, -6.10563325881958, -5.7549238204956055, -5.404214382171631, -5.053504943847656, -4.702795505523682, -4.352086067199707, -4.001376628875732, -3.650667190551758, -3.299957752227783, -2.9492483139038086, -2.598538875579834, -2.2478294372558594, -1.8971199989318848, -1.5464105606079102, -1.1957011222839355, -0.8449916839599609, -0.49428224563598633, -0.14357280731201172, 0.2071366310119629, 0.5578460693359375, 0.9085555076599121, 1.2592658996582031, 1.6099753379821777, 1.9606847763061523, 2.311394214630127, 2.6621036529541016, 3.012813091278076, 3.363522529602051, 3.7142319679260254, 4.06494140625, 4.415650844573975, 4.766360282897949, 5.117069721221924, 5.467779159545898, 5.818488597869873, 6.169198036193848, 6.519907474517822, 6.870616912841797, 7.2213263511657715, 7.572035789489746, 7.922745227813721, 8.273454666137695, 8.624164581298828, 8.974873542785645, 9.325582504272461, 9.676292419433594, 10.027002334594727, 10.377711296081543, 10.72842025756836, 11.079130172729492, 11.429840087890625, 11.780549049377441, 12.131258010864258, 12.48196792602539]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 15.0, 15.0, 26.0, 33.0, 48.0, 70.0, 84.0, 174.0, 245.0, 428.0, 687.0, 1344.0, 2680.0, 5547.0, 13351.0, 38956.0, 160786.0, 1070569.0, 2348903.0, 431282.0, 79517.0, 23009.0, 8520.0, 3869.0, 1832.0, 921.0, 459.0, 318.0, 191.0, 112.0, 77.0, 59.0, 38.0, 21.0, 9.0, 15.0, 11.0, 9.0, 9.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.81005859375, -0.784149169921875, -0.75823974609375, -0.732330322265625, -0.7064208984375, -0.680511474609375, -0.65460205078125, -0.628692626953125, -0.602783203125, -0.576873779296875, -0.55096435546875, -0.525054931640625, -0.4991455078125, -0.473236083984375, -0.44732666015625, -0.421417236328125, -0.3955078125, -0.369598388671875, -0.34368896484375, -0.317779541015625, -0.2918701171875, -0.265960693359375, -0.24005126953125, -0.214141845703125, -0.188232421875, -0.162322998046875, -0.13641357421875, -0.110504150390625, -0.0845947265625, -0.058685302734375, -0.03277587890625, -0.006866455078125, 0.01904296875, 0.044952392578125, 0.07086181640625, 0.096771240234375, 0.1226806640625, 0.148590087890625, 0.17449951171875, 0.200408935546875, 0.226318359375, 0.252227783203125, 0.27813720703125, 0.304046630859375, 0.3299560546875, 0.355865478515625, 0.38177490234375, 0.407684326171875, 0.43359375, 0.459503173828125, 0.48541259765625, 0.511322021484375, 0.5372314453125, 0.563140869140625, 0.58905029296875, 0.614959716796875, 0.640869140625, 0.666778564453125, 0.69268798828125, 0.718597412109375, 0.7445068359375, 0.770416259765625, 0.79632568359375, 0.822235107421875, 0.84814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 10.0, 13.0, 13.0, 15.0, 18.0, 18.0, 19.0, 19.0, 25.0, 22.0, 28.0, 34.0, 30.0, 35.0, 39.0, 40.0, 32.0, 32.0, 40.0, 46.0, 47.0, 38.0, 37.0, 39.0, 31.0, 28.0, 31.0, 30.0, 31.0, 27.0, 17.0, 12.0, 16.0, 19.0, 8.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.5185546875, -0.5024642944335938, -0.4863739013671875, -0.47028350830078125, -0.454193115234375, -0.43810272216796875, -0.4220123291015625, -0.40592193603515625, -0.38983154296875, -0.37374114990234375, -0.3576507568359375, -0.34156036376953125, -0.325469970703125, -0.30937957763671875, -0.2932891845703125, -0.27719879150390625, -0.2611083984375, -0.24501800537109375, -0.2289276123046875, -0.21283721923828125, -0.196746826171875, -0.18065643310546875, -0.1645660400390625, -0.14847564697265625, -0.13238525390625, -0.11629486083984375, -0.1002044677734375, -0.08411407470703125, -0.068023681640625, -0.05193328857421875, -0.0358428955078125, -0.01975250244140625, -0.003662109375, 0.01242828369140625, 0.0285186767578125, 0.04460906982421875, 0.060699462890625, 0.07678985595703125, 0.0928802490234375, 0.10897064208984375, 0.12506103515625, 0.14115142822265625, 0.1572418212890625, 0.17333221435546875, 0.189422607421875, 0.20551300048828125, 0.2216033935546875, 0.23769378662109375, 0.2537841796875, 0.26987457275390625, 0.2859649658203125, 0.30205535888671875, 0.318145751953125, 0.33423614501953125, 0.3503265380859375, 0.36641693115234375, 0.38250732421875, 0.39859771728515625, 0.4146881103515625, 0.43077850341796875, 0.446868896484375, 0.46295928955078125, 0.4790496826171875, 0.49514007568359375, 0.51123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 16.0, 24.0, 65.0, 165.0, 647.0, 5410.0, 1341400.0, 2838023.0, 7389.0, 767.0, 225.0, 79.0, 34.0, 22.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.98883056640625, -4.8331298828125, -4.67742919921875, -4.521728515625, -4.36602783203125, -4.2103271484375, -4.05462646484375, -3.89892578125, -3.74322509765625, -3.5875244140625, -3.43182373046875, -3.276123046875, -3.12042236328125, -2.9647216796875, -2.80902099609375, -2.6533203125, -2.49761962890625, -2.3419189453125, -2.18621826171875, -2.030517578125, -1.87481689453125, -1.7191162109375, -1.56341552734375, -1.40771484375, -1.25201416015625, -1.0963134765625, -0.94061279296875, -0.784912109375, -0.62921142578125, -0.4735107421875, -0.31781005859375, -0.162109375, -0.00640869140625, 0.1492919921875, 0.30499267578125, 0.460693359375, 0.61639404296875, 0.7720947265625, 0.92779541015625, 1.08349609375, 1.23919677734375, 1.3948974609375, 1.55059814453125, 1.706298828125, 1.86199951171875, 2.0177001953125, 2.17340087890625, 2.3291015625, 2.48480224609375, 2.6405029296875, 2.79620361328125, 2.951904296875, 3.10760498046875, 3.2633056640625, 3.41900634765625, 3.57470703125, 3.73040771484375, 3.8861083984375, 4.04180908203125, 4.197509765625, 4.35321044921875, 4.5089111328125, 4.66461181640625, 4.8203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 13.0, 20.0, 22.0, 35.0, 55.0, 95.0, 123.0, 262.0, 412.0, 668.0, 790.0, 582.0, 364.0, 228.0, 105.0, 91.0, 59.0, 40.0, 21.0, 18.0, 13.0, 6.0, 7.0, 7.0, 2.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.271484375, -1.2232666015625, -1.175048828125, -1.1268310546875, -1.07861328125, -1.0303955078125, -0.982177734375, -0.9339599609375, -0.8857421875, -0.8375244140625, -0.789306640625, -0.7410888671875, -0.69287109375, -0.6446533203125, -0.596435546875, -0.5482177734375, -0.5, -0.4517822265625, -0.403564453125, -0.3553466796875, -0.30712890625, -0.2589111328125, -0.210693359375, -0.1624755859375, -0.1142578125, -0.0660400390625, -0.017822265625, 0.0303955078125, 0.07861328125, 0.1268310546875, 0.175048828125, 0.2232666015625, 0.271484375, 0.3197021484375, 0.367919921875, 0.4161376953125, 0.46435546875, 0.5125732421875, 0.560791015625, 0.6090087890625, 0.6572265625, 0.7054443359375, 0.753662109375, 0.8018798828125, 0.85009765625, 0.8983154296875, 0.946533203125, 0.9947509765625, 1.04296875, 1.0911865234375, 1.139404296875, 1.1876220703125, 1.23583984375, 1.2840576171875, 1.332275390625, 1.3804931640625, 1.4287109375, 1.4769287109375, 1.525146484375, 1.5733642578125, 1.62158203125, 1.6697998046875, 1.718017578125, 1.7662353515625, 1.814453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 14.0, 52.0, 142.0, 354.0, 296.0, 112.0, 20.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.669219970703125, -29.66935920715332, -28.669498443603516, -27.669639587402344, -26.66977882385254, -25.669918060302734, -24.67005729675293, -23.670196533203125, -22.670337677001953, -21.67047691345215, -20.670616149902344, -19.670757293701172, -18.670896530151367, -17.671035766601562, -16.671175003051758, -15.671314239501953, -14.671453475952148, -13.671592712402344, -12.671732902526855, -11.67187213897705, -10.672012329101562, -9.672151565551758, -8.672290802001953, -7.672430515289307, -6.67257022857666, -5.672709941864014, -4.672849655151367, -3.6729888916015625, -2.673128604888916, -1.6732683181762695, -0.6734075546264648, 0.32645273208618164, 1.3263130187988281, 2.3261733055114746, 3.3260338306427, 4.325894355773926, 5.325754642486572, 6.325614929199219, 7.325475692749023, 8.325336456298828, 9.325196266174316, 10.325057029724121, 11.32491683959961, 12.324777603149414, 13.324638366699219, 14.324498176574707, 15.324358940124512, 16.32421875, 17.324079513549805, 18.32394027709961, 19.323801040649414, 20.32366180419922, 21.32352066040039, 22.323381423950195, 23.3232421875, 24.323102951049805, 25.32296371459961, 26.322824478149414, 27.32268524169922, 28.32254409790039, 29.322404861450195, 30.322265625, 31.322126388549805, 32.32198715209961, 33.32184600830078]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 15.0, 13.0, 29.0, 26.0, 31.0, 33.0, 54.0, 53.0, 54.0, 57.0, 60.0, 72.0, 65.0, 50.0, 52.0, 66.0, 39.0, 44.0, 48.0, 30.0, 27.0, 21.0, 7.0, 10.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.64519214630127, -8.379648208618164, -8.114103317260742, -7.848559379577637, -7.583015441894531, -7.317471027374268, -7.051926612854004, -6.786382675170898, -6.520838260650635, -6.255293846130371, -5.989749908447266, -5.724205493927002, -5.458661079406738, -5.193117141723633, -4.927572727203369, -4.6620283126831055, -4.396484375, -4.130939960479736, -3.865396022796631, -3.599851608276367, -3.3343074321746826, -3.068763256072998, -2.8032188415527344, -2.53767466545105, -2.2721304893493652, -2.0065863132476807, -1.7410420179367065, -1.4754977226257324, -1.2099535465240479, -0.9444093704223633, -0.6788650751113892, -0.41332077980041504, -0.14777755737304688, 0.11776667833328247, 0.3833109140396118, 0.6488551497459412, 0.9143993854522705, 1.179943561553955, 1.4454878568649292, 1.7110321521759033, 1.976576328277588, 2.2421205043792725, 2.507664680480957, 2.7732090950012207, 3.0387532711029053, 3.30429744720459, 3.5698418617248535, 3.835386037826538, 4.100930213928223, 4.366474628448486, 4.632018566131592, 4.8975629806518555, 5.163106918334961, 5.428651332855225, 5.694195747375488, 5.959739685058594, 6.225284099578857, 6.490828514099121, 6.756372451782227, 7.02191686630249, 7.287461280822754, 7.553005218505859, 7.818549633026123, 8.084094047546387, 8.349637985229492]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 10.0, 29.0, 48.0, 94.0, 194.0, 447.0, 1141.0, 3238.0, 11911.0, 72207.0, 570419.0, 338744.0, 38603.0, 7639.0, 2287.0, 818.0, 386.0, 161.0, 86.0, 28.0, 20.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.36126708984375, -1.3123779296875, -1.26348876953125, -1.214599609375, -1.16571044921875, -1.1168212890625, -1.06793212890625, -1.01904296875, -0.97015380859375, -0.9212646484375, -0.87237548828125, -0.823486328125, -0.77459716796875, -0.7257080078125, -0.67681884765625, -0.6279296875, -0.57904052734375, -0.5301513671875, -0.48126220703125, -0.432373046875, -0.38348388671875, -0.3345947265625, -0.28570556640625, -0.23681640625, -0.18792724609375, -0.1390380859375, -0.09014892578125, -0.041259765625, 0.00762939453125, 0.0565185546875, 0.10540771484375, 0.154296875, 0.20318603515625, 0.2520751953125, 0.30096435546875, 0.349853515625, 0.39874267578125, 0.4476318359375, 0.49652099609375, 0.54541015625, 0.59429931640625, 0.6431884765625, 0.69207763671875, 0.740966796875, 0.78985595703125, 0.8387451171875, 0.88763427734375, 0.9365234375, 0.98541259765625, 1.0343017578125, 1.08319091796875, 1.132080078125, 1.18096923828125, 1.2298583984375, 1.27874755859375, 1.32763671875, 1.37652587890625, 1.4254150390625, 1.47430419921875, 1.523193359375, 1.57208251953125, 1.6209716796875, 1.66986083984375, 1.71875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 9.0, 12.0, 19.0, 21.0, 25.0, 20.0, 26.0, 23.0, 28.0, 40.0, 37.0, 36.0, 43.0, 43.0, 48.0, 45.0, 41.0, 43.0, 44.0, 45.0, 52.0, 57.0, 33.0, 32.0, 29.0, 24.0, 24.0, 9.0, 17.0, 8.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.74072265625, -0.720123291015625, -0.69952392578125, -0.678924560546875, -0.6583251953125, -0.637725830078125, -0.61712646484375, -0.596527099609375, -0.575927734375, -0.555328369140625, -0.53472900390625, -0.514129638671875, -0.4935302734375, -0.472930908203125, -0.45233154296875, -0.431732177734375, -0.4111328125, -0.390533447265625, -0.36993408203125, -0.349334716796875, -0.3287353515625, -0.308135986328125, -0.28753662109375, -0.266937255859375, -0.246337890625, -0.225738525390625, -0.20513916015625, -0.184539794921875, -0.1639404296875, -0.143341064453125, -0.12274169921875, -0.102142333984375, -0.08154296875, -0.060943603515625, -0.04034423828125, -0.019744873046875, 0.0008544921875, 0.021453857421875, 0.04205322265625, 0.062652587890625, 0.083251953125, 0.103851318359375, 0.12445068359375, 0.145050048828125, 0.1656494140625, 0.186248779296875, 0.20684814453125, 0.227447509765625, 0.248046875, 0.268646240234375, 0.28924560546875, 0.309844970703125, 0.3304443359375, 0.351043701171875, 0.37164306640625, 0.392242431640625, 0.412841796875, 0.433441162109375, 0.45404052734375, 0.474639892578125, 0.4952392578125, 0.515838623046875, 0.53643798828125, 0.557037353515625, 0.57763671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 10.0, 17.0, 15.0, 22.0, 27.0, 39.0, 53.0, 82.0, 97.0, 152.0, 237.0, 390.0, 700.0, 1588.0, 4394.0, 17131.0, 101611.0, 720895.0, 166258.0, 24860.0, 5920.0, 1975.0, 827.0, 448.0, 269.0, 139.0, 100.0, 69.0, 69.0, 47.0, 25.0, 23.0, 10.0, 12.0, 6.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.338592529296875, -1.29339599609375, -1.248199462890625, -1.2030029296875, -1.157806396484375, -1.11260986328125, -1.067413330078125, -1.022216796875, -0.977020263671875, -0.93182373046875, -0.886627197265625, -0.8414306640625, -0.796234130859375, -0.75103759765625, -0.705841064453125, -0.66064453125, -0.615447998046875, -0.57025146484375, -0.525054931640625, -0.4798583984375, -0.434661865234375, -0.38946533203125, -0.344268798828125, -0.299072265625, -0.253875732421875, -0.20867919921875, -0.163482666015625, -0.1182861328125, -0.073089599609375, -0.02789306640625, 0.017303466796875, 0.0625, 0.107696533203125, 0.15289306640625, 0.198089599609375, 0.2432861328125, 0.288482666015625, 0.33367919921875, 0.378875732421875, 0.424072265625, 0.469268798828125, 0.51446533203125, 0.559661865234375, 0.6048583984375, 0.650054931640625, 0.69525146484375, 0.740447998046875, 0.78564453125, 0.830841064453125, 0.87603759765625, 0.921234130859375, 0.9664306640625, 1.011627197265625, 1.05682373046875, 1.102020263671875, 1.147216796875, 1.192413330078125, 1.23760986328125, 1.282806396484375, 1.3280029296875, 1.373199462890625, 1.41839599609375, 1.463592529296875, 1.5087890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 6.0, 5.0, 10.0, 12.0, 16.0, 11.0, 22.0, 22.0, 19.0, 26.0, 30.0, 28.0, 40.0, 51.0, 52.0, 45.0, 65.0, 66.0, 45.0, 54.0, 51.0, 48.0, 38.0, 46.0, 26.0, 24.0, 21.0, 17.0, 13.0, 15.0, 13.0, 10.0, 6.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.296875, -2.212890625, -2.12890625, -2.044921875, -1.9609375, -1.876953125, -1.79296875, -1.708984375, -1.625, -1.541015625, -1.45703125, -1.373046875, -1.2890625, -1.205078125, -1.12109375, -1.037109375, -0.953125, -0.869140625, -0.78515625, -0.701171875, -0.6171875, -0.533203125, -0.44921875, -0.365234375, -0.28125, -0.197265625, -0.11328125, -0.029296875, 0.0546875, 0.138671875, 0.22265625, 0.306640625, 0.390625, 0.474609375, 0.55859375, 0.642578125, 0.7265625, 0.810546875, 0.89453125, 0.978515625, 1.0625, 1.146484375, 1.23046875, 1.314453125, 1.3984375, 1.482421875, 1.56640625, 1.650390625, 1.734375, 1.818359375, 1.90234375, 1.986328125, 2.0703125, 2.154296875, 2.23828125, 2.322265625, 2.40625, 2.490234375, 2.57421875, 2.658203125, 2.7421875, 2.826171875, 2.91015625, 2.994140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 15.0, 9.0, 11.0, 25.0, 42.0, 56.0, 55.0, 122.0, 178.0, 303.0, 496.0, 1035.0, 2064.0, 4782.0, 12347.0, 37188.0, 149478.0, 668852.0, 120543.0, 31736.0, 10793.0, 4244.0, 1914.0, 896.0, 553.0, 287.0, 181.0, 121.0, 61.0, 59.0, 30.0, 24.0, 14.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.415771484375, -0.4016456604003906, -0.38751983642578125, -0.3733940124511719, -0.3592681884765625, -0.3451423645019531, -0.33101654052734375, -0.3168907165527344, -0.302764892578125, -0.2886390686035156, -0.27451324462890625, -0.2603874206542969, -0.2462615966796875, -0.23213577270507812, -0.21800994873046875, -0.20388412475585938, -0.18975830078125, -0.17563247680664062, -0.16150665283203125, -0.14738082885742188, -0.1332550048828125, -0.11912918090820312, -0.10500335693359375, -0.09087753295898438, -0.076751708984375, -0.06262588500976562, -0.04850006103515625, -0.034374237060546875, -0.0202484130859375, -0.006122589111328125, 0.00800323486328125, 0.022129058837890625, 0.0362548828125, 0.050380706787109375, 0.06450653076171875, 0.07863235473632812, 0.0927581787109375, 0.10688400268554688, 0.12100982666015625, 0.13513565063476562, 0.149261474609375, 0.16338729858398438, 0.17751312255859375, 0.19163894653320312, 0.2057647705078125, 0.21989059448242188, 0.23401641845703125, 0.24814224243164062, 0.26226806640625, 0.2763938903808594, 0.29051971435546875, 0.3046455383300781, 0.3187713623046875, 0.3328971862792969, 0.34702301025390625, 0.3611488342285156, 0.375274658203125, 0.3894004821777344, 0.40352630615234375, 0.4176521301269531, 0.4317779541015625, 0.4459037780761719, 0.46002960205078125, 0.4741554260253906, 0.48828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 3.0, 13.0, 14.0, 15.0, 32.0, 29.0, 44.0, 67.0, 102.0, 111.0, 139.0, 137.0, 83.0, 52.0, 29.0, 26.0, 24.0, 14.0, 11.0, 12.0, 5.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014495849609375, -0.000140337273478508, -0.000135716050863266, -0.000131094828248024, -0.00012647360563278198, -0.00012185238301753998, -0.00011723116040229797, -0.00011260993778705597, -0.00010798871517181396, -0.00010336749255657196, -9.874626994132996e-05, -9.412504732608795e-05, -8.950382471084595e-05, -8.488260209560394e-05, -8.026137948036194e-05, -7.564015686511993e-05, -7.101893424987793e-05, -6.639771163463593e-05, -6.177648901939392e-05, -5.7155266404151917e-05, -5.253404378890991e-05, -4.791282117366791e-05, -4.32915985584259e-05, -3.86703759431839e-05, -3.4049153327941895e-05, -2.942793071269989e-05, -2.4806708097457886e-05, -2.018548548221588e-05, -1.5564262866973877e-05, -1.0943040251731873e-05, -6.321817636489868e-06, -1.7005950212478638e-06, 2.9206275939941406e-06, 7.541850209236145e-06, 1.216307282447815e-05, 1.6784295439720154e-05, 2.1405518054962158e-05, 2.6026740670204163e-05, 3.064796328544617e-05, 3.526918590068817e-05, 3.9890408515930176e-05, 4.451163113117218e-05, 4.9132853746414185e-05, 5.375407636165619e-05, 5.837529897689819e-05, 6.29965215921402e-05, 6.76177442073822e-05, 7.22389668226242e-05, 7.686018943786621e-05, 8.148141205310822e-05, 8.610263466835022e-05, 9.072385728359222e-05, 9.534507989883423e-05, 9.996630251407623e-05, 0.00010458752512931824, 0.00010920874774456024, 0.00011382997035980225, 0.00011845119297504425, 0.00012307241559028625, 0.00012769363820552826, 0.00013231486082077026, 0.00013693608343601227, 0.00014155730605125427, 0.00014617852866649628, 0.00015079975128173828]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 12.0, 12.0, 8.0, 14.0, 19.0, 32.0, 33.0, 62.0, 103.0, 204.0, 387.0, 812.0, 1799.0, 4480.0, 14641.0, 68001.0, 710150.0, 202353.0, 31755.0, 8391.0, 2887.0, 1155.0, 527.0, 295.0, 155.0, 92.0, 58.0, 32.0, 36.0, 8.0, 13.0, 8.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6530914306640625, -0.631866455078125, -0.6106414794921875, -0.58941650390625, -0.5681915283203125, -0.546966552734375, -0.5257415771484375, -0.5045166015625, -0.4832916259765625, -0.462066650390625, -0.4408416748046875, -0.41961669921875, -0.3983917236328125, -0.377166748046875, -0.3559417724609375, -0.334716796875, -0.3134918212890625, -0.292266845703125, -0.2710418701171875, -0.24981689453125, -0.2285919189453125, -0.207366943359375, -0.1861419677734375, -0.1649169921875, -0.1436920166015625, -0.122467041015625, -0.1012420654296875, -0.08001708984375, -0.0587921142578125, -0.037567138671875, -0.0163421630859375, 0.0048828125, 0.0261077880859375, 0.047332763671875, 0.0685577392578125, 0.08978271484375, 0.1110076904296875, 0.132232666015625, 0.1534576416015625, 0.1746826171875, 0.1959075927734375, 0.217132568359375, 0.2383575439453125, 0.25958251953125, 0.2808074951171875, 0.302032470703125, 0.3232574462890625, 0.344482421875, 0.3657073974609375, 0.386932373046875, 0.4081573486328125, 0.42938232421875, 0.4506072998046875, 0.471832275390625, 0.4930572509765625, 0.5142822265625, 0.5355072021484375, 0.556732177734375, 0.5779571533203125, 0.59918212890625, 0.6204071044921875, 0.641632080078125, 0.6628570556640625, 0.68408203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 5.0, 12.0, 14.0, 15.0, 11.0, 13.0, 20.0, 24.0, 36.0, 31.0, 48.0, 69.0, 86.0, 135.0, 104.0, 88.0, 58.0, 57.0, 37.0, 26.0, 19.0, 20.0, 8.0, 8.0, 8.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5988998413085938, -0.5801239013671875, -0.5613479614257812, -0.542572021484375, -0.5237960815429688, -0.5050201416015625, -0.48624420166015625, -0.46746826171875, -0.44869232177734375, -0.4299163818359375, -0.41114044189453125, -0.392364501953125, -0.37358856201171875, -0.3548126220703125, -0.33603668212890625, -0.3172607421875, -0.29848480224609375, -0.2797088623046875, -0.26093292236328125, -0.242156982421875, -0.22338104248046875, -0.2046051025390625, -0.18582916259765625, -0.16705322265625, -0.14827728271484375, -0.1295013427734375, -0.11072540283203125, -0.091949462890625, -0.07317352294921875, -0.0543975830078125, -0.03562164306640625, -0.016845703125, 0.00193023681640625, 0.0207061767578125, 0.03948211669921875, 0.058258056640625, 0.07703399658203125, 0.0958099365234375, 0.11458587646484375, 0.13336181640625, 0.15213775634765625, 0.1709136962890625, 0.18968963623046875, 0.208465576171875, 0.22724151611328125, 0.2460174560546875, 0.26479339599609375, 0.2835693359375, 0.30234527587890625, 0.3211212158203125, 0.33989715576171875, 0.358673095703125, 0.37744903564453125, 0.3962249755859375, 0.41500091552734375, 0.43377685546875, 0.45255279541015625, 0.4713287353515625, 0.49010467529296875, 0.508880615234375, 0.5276565551757812, 0.5464324951171875, 0.5652084350585938, 0.583984375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 19.0, 38.0, 104.0, 240.0, 315.0, 142.0, 61.0, 31.0, 15.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.366168022155762, -14.780821800231934, -14.195475578308105, -13.610129356384277, -13.024782180786133, -12.439435958862305, -11.854089736938477, -11.268743515014648, -10.68339729309082, -10.098051071166992, -9.512704849243164, -8.927358627319336, -8.342012405395508, -7.7566657066345215, -7.171319007873535, -6.585972785949707, -6.000626564025879, -5.415280342102051, -4.829934120178223, -4.244587421417236, -3.659241199493408, -3.07389497756958, -2.488548517227173, -1.9032020568847656, -1.3178558349609375, -0.7325094938278198, -0.14716315269470215, 0.4381831884384155, 1.0235295295715332, 1.6088757514953613, 2.1942222118377686, 2.779568672180176, 3.3649158477783203, 3.9502620697021484, 4.535608291625977, 5.120954990386963, 5.706301212310791, 6.291647434234619, 6.8769941329956055, 7.462340354919434, 8.047686576843262, 8.63303279876709, 9.218379020690918, 9.803725242614746, 10.38907241821289, 10.974418640136719, 11.559764862060547, 12.145111083984375, 12.730457305908203, 13.315803527832031, 13.90114974975586, 14.486495971679688, 15.071842193603516, 15.657188415527344, 16.242534637451172, 16.827880859375, 17.413227081298828, 17.998573303222656, 18.583919525146484, 19.169265747070312, 19.75461196899414, 20.33995819091797, 20.925304412841797, 21.510650634765625, 22.095998764038086]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 5.0, 3.0, 14.0, 6.0, 11.0, 9.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 17.0, 29.0, 39.0, 32.0, 38.0, 58.0, 77.0, 71.0, 69.0, 55.0, 50.0, 40.0, 33.0, 33.0, 40.0, 22.0, 24.0, 14.0, 14.0, 18.0, 13.0, 11.0, 11.0, 6.0, 11.0, 4.0, 9.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.99497127532959, -9.699907302856445, -9.404842376708984, -9.109777450561523, -8.814713478088379, -8.519649505615234, -8.224584579467773, -7.929520130157471, -7.634455680847168, -7.339391231536865, -7.0443267822265625, -6.74926233291626, -6.454197883605957, -6.159133434295654, -5.864068984985352, -5.569004535675049, -5.273940086364746, -4.978875637054443, -4.683811187744141, -4.388746738433838, -4.093682289123535, -3.7986178398132324, -3.5035533905029297, -3.208488941192627, -2.913424491882324, -2.6183600425720215, -2.3232955932617188, -2.028231143951416, -1.7331666946411133, -1.4381022453308105, -1.1430377960205078, -0.8479733467102051, -0.5529098510742188, -0.257845401763916, 0.03721904754638672, 0.33228349685668945, 0.6273479461669922, 0.9224123954772949, 1.2174768447875977, 1.5125412940979004, 1.8076057434082031, 2.102670192718506, 2.3977346420288086, 2.6927990913391113, 2.987863540649414, 3.282927989959717, 3.5779924392700195, 3.8730568885803223, 4.168121337890625, 4.463185787200928, 4.7582502365112305, 5.053314685821533, 5.348379135131836, 5.643443584442139, 5.938508033752441, 6.233572483062744, 6.528636932373047, 6.82370138168335, 7.118765830993652, 7.413830280303955, 7.708894729614258, 8.003959655761719, 8.299023628234863, 8.594087600708008, 8.889152526855469]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 13.0, 9.0, 8.0, 12.0, 13.0, 10.0, 24.0, 19.0, 32.0, 26.0, 51.0, 69.0, 100.0, 158.0, 321.0, 753.0, 2174.0, 8404.0, 57914.0, 1185987.0, 2792140.0, 126995.0, 13925.0, 3091.0, 969.0, 439.0, 220.0, 109.0, 78.0, 40.0, 38.0, 22.0, 20.0, 17.0, 21.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.465362548828125, -1.41510009765625, -1.364837646484375, -1.3145751953125, -1.264312744140625, -1.21405029296875, -1.163787841796875, -1.113525390625, -1.063262939453125, -1.01300048828125, -0.962738037109375, -0.9124755859375, -0.862213134765625, -0.81195068359375, -0.761688232421875, -0.71142578125, -0.661163330078125, -0.61090087890625, -0.560638427734375, -0.5103759765625, -0.460113525390625, -0.40985107421875, -0.359588623046875, -0.309326171875, -0.259063720703125, -0.20880126953125, -0.158538818359375, -0.1082763671875, -0.058013916015625, -0.00775146484375, 0.042510986328125, 0.0927734375, 0.143035888671875, 0.19329833984375, 0.243560791015625, 0.2938232421875, 0.344085693359375, 0.39434814453125, 0.444610595703125, 0.494873046875, 0.545135498046875, 0.59539794921875, 0.645660400390625, 0.6959228515625, 0.746185302734375, 0.79644775390625, 0.846710205078125, 0.89697265625, 0.947235107421875, 0.99749755859375, 1.047760009765625, 1.0980224609375, 1.148284912109375, 1.19854736328125, 1.248809814453125, 1.299072265625, 1.349334716796875, 1.39959716796875, 1.449859619140625, 1.5001220703125, 1.550384521484375, 1.60064697265625, 1.650909423828125, 1.701171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 9.0, 11.0, 18.0, 16.0, 17.0, 30.0, 25.0, 32.0, 31.0, 36.0, 32.0, 59.0, 53.0, 50.0, 46.0, 51.0, 45.0, 35.0, 53.0, 43.0, 32.0, 48.0, 32.0, 25.0, 24.0, 22.0, 12.0, 24.0, 5.0, 19.0, 8.0, 10.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.611328125, -0.5904693603515625, -0.569610595703125, -0.5487518310546875, -0.52789306640625, -0.5070343017578125, -0.486175537109375, -0.4653167724609375, -0.4444580078125, -0.4235992431640625, -0.402740478515625, -0.3818817138671875, -0.36102294921875, -0.3401641845703125, -0.319305419921875, -0.2984466552734375, -0.277587890625, -0.2567291259765625, -0.235870361328125, -0.2150115966796875, -0.19415283203125, -0.1732940673828125, -0.152435302734375, -0.1315765380859375, -0.1107177734375, -0.0898590087890625, -0.069000244140625, -0.0481414794921875, -0.02728271484375, -0.0064239501953125, 0.014434814453125, 0.0352935791015625, 0.05615234375, 0.0770111083984375, 0.097869873046875, 0.1187286376953125, 0.13958740234375, 0.1604461669921875, 0.181304931640625, 0.2021636962890625, 0.2230224609375, 0.2438812255859375, 0.264739990234375, 0.2855987548828125, 0.30645751953125, 0.3273162841796875, 0.348175048828125, 0.3690338134765625, 0.389892578125, 0.4107513427734375, 0.431610107421875, 0.4524688720703125, 0.47332763671875, 0.4941864013671875, 0.515045166015625, 0.5359039306640625, 0.5567626953125, 0.5776214599609375, 0.598480224609375, 0.6193389892578125, 0.64019775390625, 0.6610565185546875, 0.681915283203125, 0.7027740478515625, 0.7236328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 14.0, 18.0, 37.0, 144.0, 398.0, 1819.0, 89450.0, 4088537.0, 12378.0, 1035.0, 281.0, 100.0, 40.0, 10.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.19293212890625, -2.0147705078125, -1.83660888671875, -1.658447265625, -1.48028564453125, -1.3021240234375, -1.12396240234375, -0.94580078125, -0.76763916015625, -0.5894775390625, -0.41131591796875, -0.233154296875, -0.05499267578125, 0.1231689453125, 0.30133056640625, 0.4794921875, 0.65765380859375, 0.8358154296875, 1.01397705078125, 1.192138671875, 1.37030029296875, 1.5484619140625, 1.72662353515625, 1.90478515625, 2.08294677734375, 2.2611083984375, 2.43927001953125, 2.617431640625, 2.79559326171875, 2.9737548828125, 3.15191650390625, 3.330078125, 3.50823974609375, 3.6864013671875, 3.86456298828125, 4.042724609375, 4.22088623046875, 4.3990478515625, 4.57720947265625, 4.75537109375, 4.93353271484375, 5.1116943359375, 5.28985595703125, 5.468017578125, 5.64617919921875, 5.8243408203125, 6.00250244140625, 6.1806640625, 6.35882568359375, 6.5369873046875, 6.71514892578125, 6.893310546875, 7.07147216796875, 7.2496337890625, 7.42779541015625, 7.60595703125, 7.78411865234375, 7.9622802734375, 8.14044189453125, 8.318603515625, 8.49676513671875, 8.6749267578125, 8.85308837890625, 9.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 12.0, 25.0, 42.0, 61.0, 110.0, 235.0, 465.0, 888.0, 1053.0, 560.0, 293.0, 134.0, 73.0, 41.0, 34.0, 13.0, 6.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.54296875, -2.474456787109375, -2.40594482421875, -2.337432861328125, -2.2689208984375, -2.200408935546875, -2.13189697265625, -2.063385009765625, -1.994873046875, -1.926361083984375, -1.85784912109375, -1.789337158203125, -1.7208251953125, -1.652313232421875, -1.58380126953125, -1.515289306640625, -1.44677734375, -1.378265380859375, -1.30975341796875, -1.241241455078125, -1.1727294921875, -1.104217529296875, -1.03570556640625, -0.967193603515625, -0.898681640625, -0.830169677734375, -0.76165771484375, -0.693145751953125, -0.6246337890625, -0.556121826171875, -0.48760986328125, -0.419097900390625, -0.3505859375, -0.282073974609375, -0.21356201171875, -0.145050048828125, -0.0765380859375, -0.008026123046875, 0.06048583984375, 0.128997802734375, 0.197509765625, 0.266021728515625, 0.33453369140625, 0.403045654296875, 0.4715576171875, 0.540069580078125, 0.60858154296875, 0.677093505859375, 0.74560546875, 0.814117431640625, 0.88262939453125, 0.951141357421875, 1.0196533203125, 1.088165283203125, 1.15667724609375, 1.225189208984375, 1.293701171875, 1.362213134765625, 1.43072509765625, 1.499237060546875, 1.5677490234375, 1.636260986328125, 1.70477294921875, 1.773284912109375, 1.841796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 19.0, 55.0, 148.0, 262.0, 275.0, 116.0, 62.0, 22.0, 13.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.362067222595215, -12.566646575927734, -11.771224975585938, -10.975804328918457, -10.18038272857666, -9.38496208190918, -8.589540481567383, -7.794119834899902, -6.998698711395264, -6.203277587890625, -5.407856464385986, -4.612435340881348, -3.817014455795288, -3.0215933322906494, -2.22617244720459, -1.4307513236999512, -0.6353302001953125, 0.1600908637046814, 0.9555119276046753, 1.7509329319000244, 2.546354055404663, 3.3417751789093018, 4.137196063995361, 4.9326171875, 5.728038311004639, 6.523459434509277, 7.318880558013916, 8.114301681518555, 8.909722328186035, 9.705143928527832, 10.500564575195312, 11.29598617553711, 12.091405868530273, 12.886826515197754, 13.68224811553955, 14.477668762207031, 15.273090362548828, 16.068511962890625, 16.86393165588379, 17.659353256225586, 18.454774856567383, 19.25019645690918, 20.045616149902344, 20.84103775024414, 21.636459350585938, 22.431880950927734, 23.2273006439209, 24.022722244262695, 24.81814193725586, 25.613563537597656, 26.40898323059082, 27.204404830932617, 27.999826431274414, 28.79524803161621, 29.590667724609375, 30.386089324951172, 31.18151092529297, 31.976932525634766, 32.77235412597656, 33.56777572631836, 34.36319351196289, 35.15861511230469, 35.954036712646484, 36.74945831298828, 37.54487991333008]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 12.0, 10.0, 11.0, 7.0, 7.0, 21.0, 12.0, 17.0, 13.0, 25.0, 24.0, 37.0, 30.0, 39.0, 36.0, 39.0, 47.0, 34.0, 44.0, 47.0, 37.0, 36.0, 34.0, 34.0, 39.0, 34.0, 29.0, 27.0, 23.0, 30.0, 27.0, 11.0, 17.0, 16.0, 17.0, 14.0, 17.0, 4.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.2947845458984375, -6.113229274749756, -5.931674003601074, -5.750118732452393, -5.568563461303711, -5.387008190155029, -5.205452919006348, -5.023897171020508, -4.842342376708984, -4.660787105560303, -4.479231834411621, -4.2976765632629395, -4.116121292114258, -3.934566020965576, -3.7530105113983154, -3.571455240249634, -3.389899730682373, -3.2083444595336914, -3.0267891883850098, -2.845233917236328, -2.6636786460876465, -2.482123374938965, -2.300567865371704, -2.1190125942230225, -1.9374573230743408, -1.7559020519256592, -1.5743467807769775, -1.3927913904190063, -1.2112361192703247, -1.029680848121643, -0.8481254577636719, -0.6665701866149902, -0.4850144386291504, -0.30345913767814636, -0.12190383672714233, 0.05965149402618408, 0.24120676517486572, 0.42276203632354736, 0.6043174266815186, 0.7858726978302002, 0.9674279689788818, 1.1489832401275635, 1.3305385112762451, 1.5120939016342163, 1.693649172782898, 1.8752044439315796, 2.056759834289551, 2.2383151054382324, 2.419870376586914, 2.6014256477355957, 2.7829809188842773, 2.964536190032959, 3.1460914611816406, 3.3276467323303223, 3.509202241897583, 3.6907575130462646, 3.8723127841949463, 4.053868293762207, 4.235423564910889, 4.41697883605957, 4.598534107208252, 4.780089378356934, 4.961644649505615, 5.143199920654297, 5.3247551918029785]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 12.0, 13.0, 30.0, 65.0, 140.0, 328.0, 799.0, 2345.0, 7815.0, 35588.0, 261034.0, 617834.0, 98973.0, 16987.0, 4287.0, 1339.0, 536.0, 206.0, 112.0, 50.0, 26.0, 9.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3029327392578125, -1.251373291015625, -1.1998138427734375, -1.14825439453125, -1.0966949462890625, -1.045135498046875, -0.9935760498046875, -0.9420166015625, -0.8904571533203125, -0.838897705078125, -0.7873382568359375, -0.73577880859375, -0.6842193603515625, -0.632659912109375, -0.5811004638671875, -0.529541015625, -0.4779815673828125, -0.426422119140625, -0.3748626708984375, -0.32330322265625, -0.2717437744140625, -0.220184326171875, -0.1686248779296875, -0.1170654296875, -0.0655059814453125, -0.013946533203125, 0.0376129150390625, 0.08917236328125, 0.1407318115234375, 0.192291259765625, 0.2438507080078125, 0.29541015625, 0.3469696044921875, 0.398529052734375, 0.4500885009765625, 0.50164794921875, 0.5532073974609375, 0.604766845703125, 0.6563262939453125, 0.7078857421875, 0.7594451904296875, 0.811004638671875, 0.8625640869140625, 0.91412353515625, 0.9656829833984375, 1.017242431640625, 1.0688018798828125, 1.120361328125, 1.1719207763671875, 1.223480224609375, 1.2750396728515625, 1.32659912109375, 1.3781585693359375, 1.429718017578125, 1.4812774658203125, 1.5328369140625, 1.5843963623046875, 1.635955810546875, 1.6875152587890625, 1.73907470703125, 1.7906341552734375, 1.842193603515625, 1.8937530517578125, 1.9453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 7.0, 6.0, 6.0, 8.0, 7.0, 12.0, 16.0, 26.0, 13.0, 20.0, 20.0, 25.0, 44.0, 35.0, 30.0, 39.0, 52.0, 39.0, 51.0, 51.0, 44.0, 47.0, 44.0, 46.0, 44.0, 34.0, 34.0, 37.0, 32.0, 24.0, 25.0, 20.0, 14.0, 15.0, 11.0, 2.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6591796875, -0.6370849609375, -0.614990234375, -0.5928955078125, -0.57080078125, -0.5487060546875, -0.526611328125, -0.5045166015625, -0.482421875, -0.4603271484375, -0.438232421875, -0.4161376953125, -0.39404296875, -0.3719482421875, -0.349853515625, -0.3277587890625, -0.3056640625, -0.2835693359375, -0.261474609375, -0.2393798828125, -0.21728515625, -0.1951904296875, -0.173095703125, -0.1510009765625, -0.12890625, -0.1068115234375, -0.084716796875, -0.0626220703125, -0.04052734375, -0.0184326171875, 0.003662109375, 0.0257568359375, 0.0478515625, 0.0699462890625, 0.092041015625, 0.1141357421875, 0.13623046875, 0.1583251953125, 0.180419921875, 0.2025146484375, 0.224609375, 0.2467041015625, 0.268798828125, 0.2908935546875, 0.31298828125, 0.3350830078125, 0.357177734375, 0.3792724609375, 0.4013671875, 0.4234619140625, 0.445556640625, 0.4676513671875, 0.48974609375, 0.5118408203125, 0.533935546875, 0.5560302734375, 0.578125, 0.6002197265625, 0.622314453125, 0.6444091796875, 0.66650390625, 0.6885986328125, 0.710693359375, 0.7327880859375, 0.7548828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 12.0, 17.0, 32.0, 39.0, 56.0, 100.0, 117.0, 182.0, 319.0, 626.0, 1208.0, 3216.0, 13152.0, 99542.0, 821703.0, 89906.0, 12315.0, 3258.0, 1225.0, 591.0, 331.0, 215.0, 106.0, 88.0, 58.0, 39.0, 31.0, 15.0, 17.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.0899200439453125, -2.027496337890625, -1.9650726318359375, -1.90264892578125, -1.8402252197265625, -1.777801513671875, -1.7153778076171875, -1.6529541015625, -1.5905303955078125, -1.528106689453125, -1.4656829833984375, -1.40325927734375, -1.3408355712890625, -1.278411865234375, -1.2159881591796875, -1.153564453125, -1.0911407470703125, -1.028717041015625, -0.9662933349609375, -0.90386962890625, -0.8414459228515625, -0.779022216796875, -0.7165985107421875, -0.6541748046875, -0.5917510986328125, -0.529327392578125, -0.4669036865234375, -0.40447998046875, -0.3420562744140625, -0.279632568359375, -0.2172088623046875, -0.15478515625, -0.0923614501953125, -0.029937744140625, 0.0324859619140625, 0.09490966796875, 0.1573333740234375, 0.219757080078125, 0.2821807861328125, 0.3446044921875, 0.4070281982421875, 0.469451904296875, 0.5318756103515625, 0.59429931640625, 0.6567230224609375, 0.719146728515625, 0.7815704345703125, 0.843994140625, 0.9064178466796875, 0.968841552734375, 1.0312652587890625, 1.09368896484375, 1.1561126708984375, 1.218536376953125, 1.2809600830078125, 1.3433837890625, 1.4058074951171875, 1.468231201171875, 1.5306549072265625, 1.59307861328125, 1.6555023193359375, 1.717926025390625, 1.7803497314453125, 1.8427734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 2.0, 7.0, 7.0, 8.0, 12.0, 15.0, 20.0, 22.0, 30.0, 22.0, 24.0, 34.0, 48.0, 49.0, 47.0, 55.0, 43.0, 78.0, 58.0, 51.0, 47.0, 44.0, 42.0, 31.0, 22.0, 31.0, 27.0, 18.0, 21.0, 9.0, 16.0, 5.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.67578125, -2.590850830078125, -2.50592041015625, -2.420989990234375, -2.3360595703125, -2.251129150390625, -2.16619873046875, -2.081268310546875, -1.996337890625, -1.911407470703125, -1.82647705078125, -1.741546630859375, -1.6566162109375, -1.571685791015625, -1.48675537109375, -1.401824951171875, -1.31689453125, -1.231964111328125, -1.14703369140625, -1.062103271484375, -0.9771728515625, -0.892242431640625, -0.80731201171875, -0.722381591796875, -0.637451171875, -0.552520751953125, -0.46759033203125, -0.382659912109375, -0.2977294921875, -0.212799072265625, -0.12786865234375, -0.042938232421875, 0.0419921875, 0.126922607421875, 0.21185302734375, 0.296783447265625, 0.3817138671875, 0.466644287109375, 0.55157470703125, 0.636505126953125, 0.721435546875, 0.806365966796875, 0.89129638671875, 0.976226806640625, 1.0611572265625, 1.146087646484375, 1.23101806640625, 1.315948486328125, 1.40087890625, 1.485809326171875, 1.57073974609375, 1.655670166015625, 1.7406005859375, 1.825531005859375, 1.91046142578125, 1.995391845703125, 2.080322265625, 2.165252685546875, 2.25018310546875, 2.335113525390625, 2.4200439453125, 2.504974365234375, 2.58990478515625, 2.674835205078125, 2.759765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 5.0, 21.0, 24.0, 36.0, 62.0, 106.0, 161.0, 358.0, 727.0, 2091.0, 7767.0, 43009.0, 728428.0, 231814.0, 25640.0, 5351.0, 1621.0, 625.0, 286.0, 145.0, 92.0, 57.0, 32.0, 28.0, 16.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5597305297851562, -0.5388946533203125, -0.5180587768554688, -0.497222900390625, -0.47638702392578125, -0.4555511474609375, -0.43471527099609375, -0.41387939453125, -0.39304351806640625, -0.3722076416015625, -0.35137176513671875, -0.330535888671875, -0.30970001220703125, -0.2888641357421875, -0.26802825927734375, -0.2471923828125, -0.22635650634765625, -0.2055206298828125, -0.18468475341796875, -0.163848876953125, -0.14301300048828125, -0.1221771240234375, -0.10134124755859375, -0.08050537109375, -0.05966949462890625, -0.0388336181640625, -0.01799774169921875, 0.002838134765625, 0.02367401123046875, 0.0445098876953125, 0.06534576416015625, 0.086181640625, 0.10701751708984375, 0.1278533935546875, 0.14868927001953125, 0.169525146484375, 0.19036102294921875, 0.2111968994140625, 0.23203277587890625, 0.25286865234375, 0.27370452880859375, 0.2945404052734375, 0.31537628173828125, 0.336212158203125, 0.35704803466796875, 0.3778839111328125, 0.39871978759765625, 0.4195556640625, 0.44039154052734375, 0.4612274169921875, 0.48206329345703125, 0.502899169921875, 0.5237350463867188, 0.5445709228515625, 0.5654067993164062, 0.58624267578125, 0.6070785522460938, 0.6279144287109375, 0.6487503051757812, 0.669586181640625, 0.6904220581054688, 0.7112579345703125, 0.7320938110351562, 0.7529296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 5.0, 4.0, 3.0, 11.0, 5.0, 13.0, 25.0, 42.0, 63.0, 137.0, 208.0, 196.0, 104.0, 70.0, 42.0, 19.0, 17.0, 15.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025391578674316406, -0.00024643726646900177, -0.00023895874619483948, -0.00023148022592067719, -0.0002240017056465149, -0.0002165231853723526, -0.0002090446650981903, -0.00020156614482402802, -0.00019408762454986572, -0.00018660910427570343, -0.00017913058400154114, -0.00017165206372737885, -0.00016417354345321655, -0.00015669502317905426, -0.00014921650290489197, -0.00014173798263072968, -0.00013425946235656738, -0.0001267809420824051, -0.0001193024218082428, -0.0001118239015340805, -0.00010434538125991821, -9.686686098575592e-05, -8.938834071159363e-05, -8.190982043743134e-05, -7.443130016326904e-05, -6.695277988910675e-05, -5.947425961494446e-05, -5.1995739340782166e-05, -4.451721906661987e-05, -3.703869879245758e-05, -2.9560178518295288e-05, -2.2081658244132996e-05, -1.4603137969970703e-05, -7.124617695808411e-06, 3.5390257835388184e-07, 7.832422852516174e-06, 1.5310943126678467e-05, 2.278946340084076e-05, 3.0267983675003052e-05, 3.7746503949165344e-05, 4.522502422332764e-05, 5.270354449748993e-05, 6.018206477165222e-05, 6.766058504581451e-05, 7.51391053199768e-05, 8.26176255941391e-05, 9.009614586830139e-05, 9.757466614246368e-05, 0.00010505318641662598, 0.00011253170669078827, 0.00012001022696495056, 0.00012748874723911285, 0.00013496726751327515, 0.00014244578778743744, 0.00014992430806159973, 0.00015740282833576202, 0.00016488134860992432, 0.0001723598688840866, 0.0001798383891582489, 0.0001873169094324112, 0.00019479542970657349, 0.00020227394998073578, 0.00020975247025489807, 0.00021723099052906036, 0.00022470951080322266]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 12.0, 18.0, 25.0, 33.0, 46.0, 74.0, 136.0, 287.0, 410.0, 868.0, 1908.0, 4938.0, 15973.0, 67315.0, 641290.0, 250613.0, 45740.0, 11687.0, 3825.0, 1611.0, 751.0, 396.0, 218.0, 134.0, 71.0, 55.0, 34.0, 25.0, 9.0, 11.0, 9.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.53369140625, -0.5179367065429688, -0.5021820068359375, -0.48642730712890625, -0.470672607421875, -0.45491790771484375, -0.4391632080078125, -0.42340850830078125, -0.40765380859375, -0.39189910888671875, -0.3761444091796875, -0.36038970947265625, -0.344635009765625, -0.32888031005859375, -0.3131256103515625, -0.29737091064453125, -0.2816162109375, -0.26586151123046875, -0.2501068115234375, -0.23435211181640625, -0.218597412109375, -0.20284271240234375, -0.1870880126953125, -0.17133331298828125, -0.15557861328125, -0.13982391357421875, -0.1240692138671875, -0.10831451416015625, -0.092559814453125, -0.07680511474609375, -0.0610504150390625, -0.04529571533203125, -0.029541015625, -0.01378631591796875, 0.0019683837890625, 0.01772308349609375, 0.033477783203125, 0.04923248291015625, 0.0649871826171875, 0.08074188232421875, 0.09649658203125, 0.11225128173828125, 0.1280059814453125, 0.14376068115234375, 0.159515380859375, 0.17527008056640625, 0.1910247802734375, 0.20677947998046875, 0.2225341796875, 0.23828887939453125, 0.2540435791015625, 0.26979827880859375, 0.285552978515625, 0.30130767822265625, 0.3170623779296875, 0.33281707763671875, 0.34857177734375, 0.36432647705078125, 0.3800811767578125, 0.39583587646484375, 0.411590576171875, 0.42734527587890625, 0.4430999755859375, 0.45885467529296875, 0.474609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 6.0, 8.0, 13.0, 11.0, 20.0, 22.0, 41.0, 53.0, 62.0, 98.0, 135.0, 116.0, 101.0, 69.0, 66.0, 44.0, 32.0, 22.0, 18.0, 17.0, 14.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5780181884765625, -0.558868408203125, -0.5397186279296875, -0.52056884765625, -0.5014190673828125, -0.482269287109375, -0.4631195068359375, -0.4439697265625, -0.4248199462890625, -0.405670166015625, -0.3865203857421875, -0.36737060546875, -0.3482208251953125, -0.329071044921875, -0.3099212646484375, -0.290771484375, -0.2716217041015625, -0.252471923828125, -0.2333221435546875, -0.21417236328125, -0.1950225830078125, -0.175872802734375, -0.1567230224609375, -0.1375732421875, -0.1184234619140625, -0.099273681640625, -0.0801239013671875, -0.06097412109375, -0.0418243408203125, -0.022674560546875, -0.0035247802734375, 0.015625, 0.0347747802734375, 0.053924560546875, 0.0730743408203125, 0.09222412109375, 0.1113739013671875, 0.130523681640625, 0.1496734619140625, 0.1688232421875, 0.1879730224609375, 0.207122802734375, 0.2262725830078125, 0.24542236328125, 0.2645721435546875, 0.283721923828125, 0.3028717041015625, 0.322021484375, 0.3411712646484375, 0.360321044921875, 0.3794708251953125, 0.39862060546875, 0.4177703857421875, 0.436920166015625, 0.4560699462890625, 0.4752197265625, 0.4943695068359375, 0.513519287109375, 0.5326690673828125, 0.55181884765625, 0.5709686279296875, 0.590118408203125, 0.6092681884765625, 0.62841796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 19.0, 45.0, 83.0, 153.0, 312.0, 162.0, 80.0, 47.0, 34.0, 16.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.572731018066406, -18.11406135559082, -17.6553897857666, -17.196720123291016, -16.738048553466797, -16.27937889099121, -15.820708274841309, -15.362037658691406, -14.90336799621582, -14.444697380065918, -13.986026763916016, -13.52735710144043, -13.068686485290527, -12.610015869140625, -12.151345252990723, -11.69267463684082, -11.234004020690918, -10.775333404541016, -10.316662788391113, -9.857992172241211, -9.399322509765625, -8.940651893615723, -8.48198127746582, -8.023310661315918, -7.564640522003174, -7.1059699058532715, -6.647299766540527, -6.188629150390625, -5.729958534240723, -5.2712883949279785, -4.812617778778076, -4.353947639465332, -3.895277976989746, -3.436607599258423, -2.9779372215270996, -2.5192666053771973, -2.060596227645874, -1.6019258499145508, -1.1432552337646484, -0.6845848560333252, -0.22591447830200195, 0.23275595903396606, 0.6914263963699341, 1.1500968933105469, 1.6087672710418701, 2.0674376487731934, 2.5261082649230957, 2.984778642654419, 3.443449020385742, 3.9021193981170654, 4.360789775848389, 4.819460391998291, 5.278130531311035, 5.7368011474609375, 6.19547176361084, 6.654142379760742, 7.112812519073486, 7.571483135223389, 8.030153274536133, 8.488823890686035, 8.947494506835938, 9.406164169311523, 9.864835739135742, 10.323505401611328, 10.78217601776123]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 6.0, 6.0, 16.0, 10.0, 12.0, 15.0, 19.0, 18.0, 25.0, 33.0, 21.0, 24.0, 27.0, 28.0, 53.0, 66.0, 119.0, 96.0, 74.0, 55.0, 40.0, 40.0, 34.0, 23.0, 21.0, 28.0, 14.0, 14.0, 8.0, 10.0, 10.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.744438171386719, -9.383305549621582, -9.022173881530762, -8.661041259765625, -8.299908638000488, -7.93877649307251, -7.577644348144531, -7.2165117263793945, -6.855379581451416, -6.4942474365234375, -6.133114814758301, -5.771982669830322, -5.410850524902344, -5.049717903137207, -4.6885857582092285, -4.32745361328125, -3.9663209915161133, -3.6051886081695557, -3.244056224822998, -2.8829240798950195, -2.521791696548462, -2.1606593132019043, -1.7995271682739258, -1.4383947849273682, -1.0772624015808105, -0.7161300778388977, -0.35499775409698486, 0.006134510040283203, 0.3672668933868408, 0.7283992767333984, 1.089531421661377, 1.4506638050079346, 1.8117952346801758, 2.1729276180267334, 2.534060001373291, 2.8951921463012695, 3.256324529647827, 3.6174569129943848, 3.9785890579223633, 4.3397216796875, 4.7008538246154785, 5.061985969543457, 5.423118591308594, 5.784250736236572, 6.145382881164551, 6.5065155029296875, 6.867647647857666, 7.2287797927856445, 7.589912414550781, 7.95104455947876, 8.312176704406738, 8.673309326171875, 9.034441947937012, 9.395574569702148, 9.756706237792969, 10.117838859558105, 10.478971481323242, 10.840104103088379, 11.2012357711792, 11.562368392944336, 11.923501014709473, 12.28463363647461, 12.64576530456543, 13.006897926330566, 13.368029594421387]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 13.0, 15.0, 20.0, 27.0, 57.0, 124.0, 327.0, 898.0, 3505.0, 19997.0, 255886.0, 3369917.0, 507776.0, 29153.0, 4679.0, 1125.0, 382.0, 179.0, 90.0, 38.0, 25.0, 17.0, 10.0, 10.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.60345458984375, -2.5155029296875, -2.42755126953125, -2.339599609375, -2.25164794921875, -2.1636962890625, -2.07574462890625, -1.98779296875, -1.89984130859375, -1.8118896484375, -1.72393798828125, -1.635986328125, -1.54803466796875, -1.4600830078125, -1.37213134765625, -1.2841796875, -1.19622802734375, -1.1082763671875, -1.02032470703125, -0.932373046875, -0.84442138671875, -0.7564697265625, -0.66851806640625, -0.58056640625, -0.49261474609375, -0.4046630859375, -0.31671142578125, -0.228759765625, -0.14080810546875, -0.0528564453125, 0.03509521484375, 0.123046875, 0.21099853515625, 0.2989501953125, 0.38690185546875, 0.474853515625, 0.56280517578125, 0.6507568359375, 0.73870849609375, 0.82666015625, 0.91461181640625, 1.0025634765625, 1.09051513671875, 1.178466796875, 1.26641845703125, 1.3543701171875, 1.44232177734375, 1.5302734375, 1.61822509765625, 1.7061767578125, 1.79412841796875, 1.882080078125, 1.97003173828125, 2.0579833984375, 2.14593505859375, 2.23388671875, 2.32183837890625, 2.4097900390625, 2.49774169921875, 2.585693359375, 2.67364501953125, 2.7615966796875, 2.84954833984375, 2.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 9.0, 3.0, 8.0, 8.0, 11.0, 18.0, 18.0, 23.0, 31.0, 34.0, 50.0, 50.0, 57.0, 53.0, 61.0, 48.0, 61.0, 49.0, 57.0, 47.0, 37.0, 48.0, 50.0, 35.0, 29.0, 31.0, 14.0, 21.0, 7.0, 5.0, 11.0, 3.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8052520751953125, -0.780426025390625, -0.7555999755859375, -0.73077392578125, -0.7059478759765625, -0.681121826171875, -0.6562957763671875, -0.6314697265625, -0.6066436767578125, -0.581817626953125, -0.5569915771484375, -0.53216552734375, -0.5073394775390625, -0.482513427734375, -0.4576873779296875, -0.432861328125, -0.4080352783203125, -0.383209228515625, -0.3583831787109375, -0.33355712890625, -0.3087310791015625, -0.283905029296875, -0.2590789794921875, -0.2342529296875, -0.2094268798828125, -0.184600830078125, -0.1597747802734375, -0.13494873046875, -0.1101226806640625, -0.085296630859375, -0.0604705810546875, -0.03564453125, -0.0108184814453125, 0.014007568359375, 0.0388336181640625, 0.06365966796875, 0.0884857177734375, 0.113311767578125, 0.1381378173828125, 0.1629638671875, 0.1877899169921875, 0.212615966796875, 0.2374420166015625, 0.26226806640625, 0.2870941162109375, 0.311920166015625, 0.3367462158203125, 0.361572265625, 0.3863983154296875, 0.411224365234375, 0.4360504150390625, 0.46087646484375, 0.4857025146484375, 0.510528564453125, 0.5353546142578125, 0.5601806640625, 0.5850067138671875, 0.609832763671875, 0.6346588134765625, 0.65948486328125, 0.6843109130859375, 0.709136962890625, 0.7339630126953125, 0.7587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 6.0, 16.0, 33.0, 58.0, 83.0, 196.0, 520.0, 2114.0, 39798.0, 4138017.0, 11215.0, 1400.0, 452.0, 171.0, 92.0, 38.0, 19.0, 11.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.59375, -11.22412109375, -10.8544921875, -10.48486328125, -10.115234375, -9.74560546875, -9.3759765625, -9.00634765625, -8.63671875, -8.26708984375, -7.8974609375, -7.52783203125, -7.158203125, -6.78857421875, -6.4189453125, -6.04931640625, -5.6796875, -5.31005859375, -4.9404296875, -4.57080078125, -4.201171875, -3.83154296875, -3.4619140625, -3.09228515625, -2.72265625, -2.35302734375, -1.9833984375, -1.61376953125, -1.244140625, -0.87451171875, -0.5048828125, -0.13525390625, 0.234375, 0.60400390625, 0.9736328125, 1.34326171875, 1.712890625, 2.08251953125, 2.4521484375, 2.82177734375, 3.19140625, 3.56103515625, 3.9306640625, 4.30029296875, 4.669921875, 5.03955078125, 5.4091796875, 5.77880859375, 6.1484375, 6.51806640625, 6.8876953125, 7.25732421875, 7.626953125, 7.99658203125, 8.3662109375, 8.73583984375, 9.10546875, 9.47509765625, 9.8447265625, 10.21435546875, 10.583984375, 10.95361328125, 11.3232421875, 11.69287109375, 12.0625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 16.0, 22.0, 38.0, 51.0, 98.0, 125.0, 232.0, 389.0, 664.0, 993.0, 648.0, 343.0, 157.0, 112.0, 64.0, 48.0, 29.0, 17.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.74114990234375, -2.6190185546875, -2.49688720703125, -2.374755859375, -2.25262451171875, -2.1304931640625, -2.00836181640625, -1.88623046875, -1.76409912109375, -1.6419677734375, -1.51983642578125, -1.397705078125, -1.27557373046875, -1.1534423828125, -1.03131103515625, -0.9091796875, -0.78704833984375, -0.6649169921875, -0.54278564453125, -0.420654296875, -0.29852294921875, -0.1763916015625, -0.05426025390625, 0.06787109375, 0.19000244140625, 0.3121337890625, 0.43426513671875, 0.556396484375, 0.67852783203125, 0.8006591796875, 0.92279052734375, 1.044921875, 1.16705322265625, 1.2891845703125, 1.41131591796875, 1.533447265625, 1.65557861328125, 1.7777099609375, 1.89984130859375, 2.02197265625, 2.14410400390625, 2.2662353515625, 2.38836669921875, 2.510498046875, 2.63262939453125, 2.7547607421875, 2.87689208984375, 2.9990234375, 3.12115478515625, 3.2432861328125, 3.36541748046875, 3.487548828125, 3.60968017578125, 3.7318115234375, 3.85394287109375, 3.97607421875, 4.09820556640625, 4.2203369140625, 4.34246826171875, 4.464599609375, 4.58673095703125, 4.7088623046875, 4.83099365234375, 4.953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 13.0, 47.0, 267.0, 518.0, 111.0, 33.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-182.2290802001953, -178.86874389648438, -175.5084228515625, -172.14808654785156, -168.78775024414062, -165.4274139404297, -162.06707763671875, -158.70675659179688, -155.34642028808594, -151.986083984375, -148.62576293945312, -145.2654266357422, -141.90509033203125, -138.5447540283203, -135.18441772460938, -131.8240966796875, -128.46376037597656, -125.10342407226562, -121.74309539794922, -118.38276672363281, -115.02243041992188, -111.66209411621094, -108.30176544189453, -104.94143676757812, -101.58110046386719, -98.22076416015625, -94.86043548583984, -91.50010681152344, -88.1397705078125, -84.77943420410156, -81.41910552978516, -78.05877685546875, -74.69844055175781, -71.33810424804688, -67.97777557373047, -64.61744689941406, -61.257110595703125, -57.89677810668945, -54.53644561767578, -51.17611312866211, -47.81578063964844, -44.455448150634766, -41.095115661621094, -37.73478317260742, -34.37445068359375, -31.014118194580078, -27.653785705566406, -24.293453216552734, -20.933120727539062, -17.57278823852539, -14.212455749511719, -10.852123260498047, -7.491790771484375, -4.131458282470703, -0.7711257934570312, 2.5892066955566406, 5.9495391845703125, 9.309871673583984, 12.670204162597656, 16.030536651611328, 19.390869140625, 22.751201629638672, 26.111534118652344, 29.471866607666016, 32.83219909667969]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 9.0, 11.0, 20.0, 21.0, 21.0, 27.0, 47.0, 49.0, 67.0, 79.0, 60.0, 87.0, 82.0, 65.0, 50.0, 61.0, 38.0, 42.0, 28.0, 28.0, 16.0, 13.0, 13.0, 13.0, 9.0, 8.0, 2.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.76395034790039, -25.14447021484375, -24.524991989135742, -23.9055118560791, -23.286033630371094, -22.666553497314453, -22.047075271606445, -21.427595138549805, -20.808116912841797, -20.188636779785156, -19.56915855407715, -18.949678421020508, -18.3302001953125, -17.71072006225586, -17.09124183654785, -16.47176170349121, -15.85228157043457, -15.232802391052246, -14.613323211669922, -13.993844032287598, -13.374364852905273, -12.754884719848633, -12.135405540466309, -11.515926361083984, -10.89644718170166, -10.276968002319336, -9.657488822937012, -9.038009643554688, -8.418529510498047, -7.799050807952881, -7.179571151733398, -6.560091972351074, -5.940613746643066, -5.321134567260742, -4.701655387878418, -4.0821757316589355, -3.4626965522766113, -2.843217372894287, -2.223737955093384, -1.6042585372924805, -0.9847793579101562, -0.3653000593185425, 0.2541792392730713, 0.8736585378646851, 1.4931378364562988, 2.112617015838623, 2.7320964336395264, 3.3515758514404297, 3.971055030822754, 4.590534210205078, 5.210013389587402, 5.829493045806885, 6.448972225189209, 7.068451404571533, 7.687931060791016, 8.30741024017334, 8.926889419555664, 9.546368598937988, 10.165847778320312, 10.785326957702637, 11.404806137084961, 12.024286270141602, 12.643765449523926, 13.26324462890625, 13.882723808288574]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 13.0, 19.0, 35.0, 38.0, 56.0, 92.0, 166.0, 256.0, 542.0, 1090.0, 2832.0, 8337.0, 32587.0, 198274.0, 681878.0, 94253.0, 18877.0, 5417.0, 2005.0, 828.0, 411.0, 200.0, 122.0, 67.0, 33.0, 31.0, 19.0, 21.0, 10.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.678985595703125, -1.61968994140625, -1.560394287109375, -1.5010986328125, -1.441802978515625, -1.38250732421875, -1.323211669921875, -1.263916015625, -1.204620361328125, -1.14532470703125, -1.086029052734375, -1.0267333984375, -0.967437744140625, -0.90814208984375, -0.848846435546875, -0.78955078125, -0.730255126953125, -0.67095947265625, -0.611663818359375, -0.5523681640625, -0.493072509765625, -0.43377685546875, -0.374481201171875, -0.315185546875, -0.255889892578125, -0.19659423828125, -0.137298583984375, -0.0780029296875, -0.018707275390625, 0.04058837890625, 0.099884033203125, 0.1591796875, 0.218475341796875, 0.27777099609375, 0.337066650390625, 0.3963623046875, 0.455657958984375, 0.51495361328125, 0.574249267578125, 0.633544921875, 0.692840576171875, 0.75213623046875, 0.811431884765625, 0.8707275390625, 0.930023193359375, 0.98931884765625, 1.048614501953125, 1.10791015625, 1.167205810546875, 1.22650146484375, 1.285797119140625, 1.3450927734375, 1.404388427734375, 1.46368408203125, 1.522979736328125, 1.582275390625, 1.641571044921875, 1.70086669921875, 1.760162353515625, 1.8194580078125, 1.878753662109375, 1.93804931640625, 1.997344970703125, 2.056640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 15.0, 14.0, 14.0, 34.0, 20.0, 40.0, 56.0, 57.0, 66.0, 77.0, 55.0, 63.0, 75.0, 75.0, 59.0, 64.0, 46.0, 38.0, 28.0, 32.0, 18.0, 17.0, 10.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.650970458984375, -1.60174560546875, -1.552520751953125, -1.5032958984375, -1.454071044921875, -1.40484619140625, -1.355621337890625, -1.306396484375, -1.257171630859375, -1.20794677734375, -1.158721923828125, -1.1094970703125, -1.060272216796875, -1.01104736328125, -0.961822509765625, -0.91259765625, -0.863372802734375, -0.81414794921875, -0.764923095703125, -0.7156982421875, -0.666473388671875, -0.61724853515625, -0.568023681640625, -0.518798828125, -0.469573974609375, -0.42034912109375, -0.371124267578125, -0.3218994140625, -0.272674560546875, -0.22344970703125, -0.174224853515625, -0.125, -0.075775146484375, -0.02655029296875, 0.022674560546875, 0.0718994140625, 0.121124267578125, 0.17034912109375, 0.219573974609375, 0.268798828125, 0.318023681640625, 0.36724853515625, 0.416473388671875, 0.4656982421875, 0.514923095703125, 0.56414794921875, 0.613372802734375, 0.66259765625, 0.711822509765625, 0.76104736328125, 0.810272216796875, 0.8594970703125, 0.908721923828125, 0.95794677734375, 1.007171630859375, 1.056396484375, 1.105621337890625, 1.15484619140625, 1.204071044921875, 1.2532958984375, 1.302520751953125, 1.35174560546875, 1.400970458984375, 1.4501953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 10.0, 7.0, 12.0, 17.0, 21.0, 28.0, 20.0, 29.0, 64.0, 58.0, 94.0, 167.0, 252.0, 458.0, 904.0, 2290.0, 8367.0, 47046.0, 875350.0, 95206.0, 12592.0, 3076.0, 1083.0, 546.0, 281.0, 194.0, 119.0, 85.0, 45.0, 36.0, 15.0, 14.0, 12.0, 17.0, 8.0, 8.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.05029296875, -1.9833984375, -1.91650390625, -1.849609375, -1.78271484375, -1.7158203125, -1.64892578125, -1.58203125, -1.51513671875, -1.4482421875, -1.38134765625, -1.314453125, -1.24755859375, -1.1806640625, -1.11376953125, -1.046875, -0.97998046875, -0.9130859375, -0.84619140625, -0.779296875, -0.71240234375, -0.6455078125, -0.57861328125, -0.51171875, -0.44482421875, -0.3779296875, -0.31103515625, -0.244140625, -0.17724609375, -0.1103515625, -0.04345703125, 0.0234375, 0.09033203125, 0.1572265625, 0.22412109375, 0.291015625, 0.35791015625, 0.4248046875, 0.49169921875, 0.55859375, 0.62548828125, 0.6923828125, 0.75927734375, 0.826171875, 0.89306640625, 0.9599609375, 1.02685546875, 1.09375, 1.16064453125, 1.2275390625, 1.29443359375, 1.361328125, 1.42822265625, 1.4951171875, 1.56201171875, 1.62890625, 1.69580078125, 1.7626953125, 1.82958984375, 1.896484375, 1.96337890625, 2.0302734375, 2.09716796875, 2.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 12.0, 10.0, 4.0, 15.0, 17.0, 16.0, 20.0, 14.0, 37.0, 32.0, 38.0, 39.0, 54.0, 60.0, 62.0, 86.0, 83.0, 71.0, 40.0, 41.0, 52.0, 22.0, 33.0, 18.0, 20.0, 16.0, 19.0, 14.0, 10.0, 6.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.08319091796875, -3.9437255859375, -3.80426025390625, -3.664794921875, -3.52532958984375, -3.3858642578125, -3.24639892578125, -3.10693359375, -2.96746826171875, -2.8280029296875, -2.68853759765625, -2.549072265625, -2.40960693359375, -2.2701416015625, -2.13067626953125, -1.9912109375, -1.85174560546875, -1.7122802734375, -1.57281494140625, -1.433349609375, -1.29388427734375, -1.1544189453125, -1.01495361328125, -0.87548828125, -0.73602294921875, -0.5965576171875, -0.45709228515625, -0.317626953125, -0.17816162109375, -0.0386962890625, 0.10076904296875, 0.240234375, 0.37969970703125, 0.5191650390625, 0.65863037109375, 0.798095703125, 0.93756103515625, 1.0770263671875, 1.21649169921875, 1.35595703125, 1.49542236328125, 1.6348876953125, 1.77435302734375, 1.913818359375, 2.05328369140625, 2.1927490234375, 2.33221435546875, 2.4716796875, 2.61114501953125, 2.7506103515625, 2.89007568359375, 3.029541015625, 3.16900634765625, 3.3084716796875, 3.44793701171875, 3.58740234375, 3.72686767578125, 3.8663330078125, 4.00579833984375, 4.145263671875, 4.28472900390625, 4.4241943359375, 4.56365966796875, 4.703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 20.0, 28.0, 36.0, 58.0, 117.0, 201.0, 484.0, 1081.0, 2852.0, 11957.0, 123865.0, 873987.0, 25880.0, 4924.0, 1552.0, 681.0, 342.0, 186.0, 93.0, 62.0, 33.0, 29.0, 10.0, 6.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5861968994140625, -0.567413330078125, -0.5486297607421875, -0.52984619140625, -0.5110626220703125, -0.492279052734375, -0.4734954833984375, -0.4547119140625, -0.4359283447265625, -0.417144775390625, -0.3983612060546875, -0.37957763671875, -0.3607940673828125, -0.342010498046875, -0.3232269287109375, -0.304443359375, -0.2856597900390625, -0.266876220703125, -0.2480926513671875, -0.22930908203125, -0.2105255126953125, -0.191741943359375, -0.1729583740234375, -0.1541748046875, -0.1353912353515625, -0.116607666015625, -0.0978240966796875, -0.07904052734375, -0.0602569580078125, -0.041473388671875, -0.0226898193359375, -0.00390625, 0.0148773193359375, 0.033660888671875, 0.0524444580078125, 0.07122802734375, 0.0900115966796875, 0.108795166015625, 0.1275787353515625, 0.1463623046875, 0.1651458740234375, 0.183929443359375, 0.2027130126953125, 0.22149658203125, 0.2402801513671875, 0.259063720703125, 0.2778472900390625, 0.296630859375, 0.3154144287109375, 0.334197998046875, 0.3529815673828125, 0.37176513671875, 0.3905487060546875, 0.409332275390625, 0.4281158447265625, 0.4468994140625, 0.4656829833984375, 0.484466552734375, 0.5032501220703125, 0.52203369140625, 0.5408172607421875, 0.559600830078125, 0.5783843994140625, 0.59716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 14.0, 16.0, 18.0, 30.0, 65.0, 87.0, 163.0, 212.0, 130.0, 72.0, 42.0, 23.0, 16.0, 17.0, 4.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015616416931152344, -0.00015132129192352295, -0.00014647841453552246, -0.00014163553714752197, -0.00013679265975952148, -0.000131949782371521, -0.0001271069049835205, -0.00012226402759552002, -0.00011742115020751953, -0.00011257827281951904, -0.00010773539543151855, -0.00010289251804351807, -9.804964065551758e-05, -9.320676326751709e-05, -8.83638858795166e-05, -8.352100849151611e-05, -7.867813110351562e-05, -7.383525371551514e-05, -6.899237632751465e-05, -6.414949893951416e-05, -5.930662155151367e-05, -5.4463744163513184e-05, -4.9620866775512695e-05, -4.477798938751221e-05, -3.993511199951172e-05, -3.509223461151123e-05, -3.0249357223510742e-05, -2.5406479835510254e-05, -2.0563602447509766e-05, -1.5720725059509277e-05, -1.0877847671508789e-05, -6.034970283508301e-06, -1.1920928955078125e-06, 3.6507844924926758e-06, 8.493661880493164e-06, 1.3336539268493652e-05, 1.817941665649414e-05, 2.302229404449463e-05, 2.7865171432495117e-05, 3.2708048820495605e-05, 3.7550926208496094e-05, 4.239380359649658e-05, 4.723668098449707e-05, 5.207955837249756e-05, 5.692243576049805e-05, 6.176531314849854e-05, 6.660819053649902e-05, 7.145106792449951e-05, 7.62939453125e-05, 8.113682270050049e-05, 8.597970008850098e-05, 9.082257747650146e-05, 9.566545486450195e-05, 0.00010050833225250244, 0.00010535120964050293, 0.00011019408702850342, 0.0001150369644165039, 0.0001198798418045044, 0.00012472271919250488, 0.00012956559658050537, 0.00013440847396850586, 0.00013925135135650635, 0.00014409422874450684, 0.00014893710613250732, 0.0001537799835205078]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 6.0, 11.0, 10.0, 12.0, 24.0, 27.0, 42.0, 61.0, 73.0, 118.0, 231.0, 398.0, 857.0, 1994.0, 5891.0, 22246.0, 204285.0, 770120.0, 30130.0, 7267.0, 2477.0, 1041.0, 511.0, 226.0, 142.0, 98.0, 66.0, 41.0, 37.0, 19.0, 12.0, 8.0, 8.0, 9.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.59326171875, -0.5758590698242188, -0.5584564208984375, -0.5410537719726562, -0.523651123046875, -0.5062484741210938, -0.4888458251953125, -0.47144317626953125, -0.45404052734375, -0.43663787841796875, -0.4192352294921875, -0.40183258056640625, -0.384429931640625, -0.36702728271484375, -0.3496246337890625, -0.33222198486328125, -0.3148193359375, -0.29741668701171875, -0.2800140380859375, -0.26261138916015625, -0.245208740234375, -0.22780609130859375, -0.2104034423828125, -0.19300079345703125, -0.17559814453125, -0.15819549560546875, -0.1407928466796875, -0.12339019775390625, -0.105987548828125, -0.08858489990234375, -0.0711822509765625, -0.05377960205078125, -0.036376953125, -0.01897430419921875, -0.0015716552734375, 0.01583099365234375, 0.033233642578125, 0.05063629150390625, 0.0680389404296875, 0.08544158935546875, 0.10284423828125, 0.12024688720703125, 0.1376495361328125, 0.15505218505859375, 0.172454833984375, 0.18985748291015625, 0.2072601318359375, 0.22466278076171875, 0.2420654296875, 0.25946807861328125, 0.2768707275390625, 0.29427337646484375, 0.311676025390625, 0.32907867431640625, 0.3464813232421875, 0.36388397216796875, 0.38128662109375, 0.39868927001953125, 0.4160919189453125, 0.43349456787109375, 0.450897216796875, 0.46829986572265625, 0.4857025146484375, 0.5031051635742188, 0.5205078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 11.0, 11.0, 14.0, 29.0, 22.0, 34.0, 65.0, 91.0, 136.0, 148.0, 138.0, 91.0, 52.0, 41.0, 23.0, 18.0, 15.0, 13.0, 6.0, 7.0, 8.0, 6.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.787109375, -0.7660140991210938, -0.7449188232421875, -0.7238235473632812, -0.702728271484375, -0.6816329956054688, -0.6605377197265625, -0.6394424438476562, -0.61834716796875, -0.5972518920898438, -0.5761566162109375, -0.5550613403320312, -0.533966064453125, -0.5128707885742188, -0.4917755126953125, -0.47068023681640625, -0.4495849609375, -0.42848968505859375, -0.4073944091796875, -0.38629913330078125, -0.365203857421875, -0.34410858154296875, -0.3230133056640625, -0.30191802978515625, -0.28082275390625, -0.25972747802734375, -0.2386322021484375, -0.21753692626953125, -0.196441650390625, -0.17534637451171875, -0.1542510986328125, -0.13315582275390625, -0.112060546875, -0.09096527099609375, -0.0698699951171875, -0.04877471923828125, -0.027679443359375, -0.00658416748046875, 0.0145111083984375, 0.03560638427734375, 0.05670166015625, 0.07779693603515625, 0.0988922119140625, 0.11998748779296875, 0.141082763671875, 0.16217803955078125, 0.1832733154296875, 0.20436859130859375, 0.2254638671875, 0.24655914306640625, 0.2676544189453125, 0.28874969482421875, 0.309844970703125, 0.33094024658203125, 0.3520355224609375, 0.37313079833984375, 0.39422607421875, 0.41532135009765625, 0.4364166259765625, 0.45751190185546875, 0.478607177734375, 0.49970245361328125, 0.5207977294921875, 0.5418930053710938, 0.56298828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 10.0, 37.0, 102.0, 646.0, 159.0, 31.0, 13.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.45219421386719, -54.08751678466797, -52.72283935546875, -51.35816192626953, -49.99348449707031, -48.62881088256836, -47.26413345336914, -45.89945602416992, -44.5347785949707, -43.170101165771484, -41.805423736572266, -40.44074630737305, -39.076072692871094, -37.711395263671875, -36.346717834472656, -34.98204040527344, -33.61736297607422, -32.252685546875, -30.88800811767578, -29.523332595825195, -28.158655166625977, -26.793977737426758, -25.429302215576172, -24.064624786376953, -22.699947357177734, -21.335269927978516, -19.970592498779297, -18.60591697692871, -17.241239547729492, -15.876562118530273, -14.511885643005371, -13.147209167480469, -11.78253173828125, -10.417854309082031, -9.053177833557129, -7.688500881195068, -6.323823928833008, -4.959146976470947, -3.5944700241088867, -2.2297935485839844, -0.8651161193847656, 0.4995608329772949, 1.8642377853393555, 3.228914737701416, 4.593591690063477, 5.958268642425537, 7.322945594787598, 8.6876220703125, 10.052299499511719, 11.416976928710938, 12.78165340423584, 14.146329879760742, 15.511007308959961, 16.87568473815918, 18.240360260009766, 19.605037689208984, 20.969715118408203, 22.334392547607422, 23.69906997680664, 25.063745498657227, 26.428422927856445, 27.793100357055664, 29.15777587890625, 30.52245330810547, 31.887130737304688]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 5.0, 11.0, 8.0, 15.0, 14.0, 17.0, 21.0, 30.0, 28.0, 42.0, 44.0, 91.0, 160.0, 142.0, 110.0, 57.0, 28.0, 21.0, 21.0, 18.0, 21.0, 14.0, 17.0, 7.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.148698806762695, -11.71694564819336, -11.285191535949707, -10.853438377380371, -10.421685218811035, -9.989931106567383, -9.558177947998047, -9.126424789428711, -8.694670677185059, -8.262917518615723, -7.8311638832092285, -7.399410247802734, -6.96765661239624, -6.535902976989746, -6.10414981842041, -5.672396183013916, -5.24064302444458, -4.808889389038086, -4.37713623046875, -3.945382595062256, -3.5136289596557617, -3.0818755626678467, -2.6501221656799316, -2.2183685302734375, -1.7866151332855225, -1.3548616170883179, -0.9231081604957581, -0.49135470390319824, -0.05960118770599365, 0.37215232849121094, 0.803905725479126, 1.2356593608856201, 1.6674127578735352, 2.09916615486145, 2.5309197902679443, 2.9626731872558594, 3.3944268226623535, 3.8261802196502686, 4.257933616638184, 4.689687252044678, 5.121440887451172, 5.553194522857666, 5.984947681427002, 6.416701316833496, 6.84845495223999, 7.280208587646484, 7.71196174621582, 8.143714904785156, 8.575468063354492, 9.007221221923828, 9.43897533416748, 9.870728492736816, 10.302481651306152, 10.734235763549805, 11.16598892211914, 11.597742080688477, 12.029496192932129, 12.461249351501465, 12.893003463745117, 13.324756622314453, 13.756509780883789, 14.188263893127441, 14.620017051696777, 15.05177116394043, 15.483524322509766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 10.0, 10.0, 12.0, 18.0, 10.0, 20.0, 32.0, 37.0, 32.0, 41.0, 37.0, 76.0, 112.0, 168.0, 90.0, 41.0, 37.0, 35.0, 29.0, 31.0, 15.0, 16.0, 19.0, 11.0, 12.0, 6.0, 4.0, 3.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3515625, -1.315277099609375, -1.27899169921875, -1.242706298828125, -1.2064208984375, -1.170135498046875, -1.13385009765625, -1.097564697265625, -1.061279296875, -1.024993896484375, -0.98870849609375, -0.952423095703125, -0.9161376953125, -0.879852294921875, -0.84356689453125, -0.807281494140625, -0.77099609375, -0.734710693359375, -0.69842529296875, -0.662139892578125, -0.6258544921875, -0.589569091796875, -0.55328369140625, -0.516998291015625, -0.480712890625, -0.444427490234375, -0.40814208984375, -0.371856689453125, -0.3355712890625, -0.299285888671875, -0.26300048828125, -0.226715087890625, -0.1904296875, -0.154144287109375, -0.11785888671875, -0.081573486328125, -0.0452880859375, -0.009002685546875, 0.02728271484375, 0.063568115234375, 0.099853515625, 0.136138916015625, 0.17242431640625, 0.208709716796875, 0.2449951171875, 0.281280517578125, 0.31756591796875, 0.353851318359375, 0.39013671875, 0.426422119140625, 0.46270751953125, 0.498992919921875, 0.5352783203125, 0.571563720703125, 0.60784912109375, 0.644134521484375, 0.680419921875, 0.716705322265625, 0.75299072265625, 0.789276123046875, 0.8255615234375, 0.861846923828125, 0.89813232421875, 0.934417724609375, 0.970703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 10.0, 24.0, 15.0, 30.0, 52.0, 83.0, 182.0, 581.0, 2712.0, 86225.0, 8292955.0, 4342.0, 812.0, 250.0, 99.0, 54.0, 42.0, 21.0, 9.0, 13.0, 13.0, 7.0, 7.0, 9.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.000646591186523, -11.573607444763184, -11.14656925201416, -10.71953010559082, -10.29249095916748, -9.86545181274414, -9.438413619995117, -9.011374473571777, -8.584335327148438, -8.157296180725098, -7.730257511138916, -7.303218841552734, -6.8761796951293945, -6.449141025543213, -6.022102355957031, -5.595063209533691, -5.168025016784668, -4.740986347198486, -4.3139472007751465, -3.886908531188965, -3.459869623184204, -3.0328307151794434, -2.6057920455932617, -2.178753137588501, -1.7517142295837402, -1.3246753215789795, -0.8976365327835083, -0.4705977439880371, -0.04355883598327637, 0.3834800720214844, 0.810518741607666, 1.2375576496124268, 1.664597511291504, 2.0916364192962646, 2.5186753273010254, 2.945713996887207, 3.3727529048919678, 3.7997918128967285, 4.22683048248291, 4.65386962890625, 5.080908298492432, 5.507946968078613, 5.934986114501953, 6.362024784088135, 6.789063453674316, 7.216102600097656, 7.643141269683838, 8.07017993927002, 8.49721908569336, 8.9242582321167, 9.351296424865723, 9.778335571289062, 10.205374717712402, 10.632413864135742, 11.059452056884766, 11.486491203308105, 11.913530349731445, 12.340569496154785, 12.767607688903809, 13.194646835327148, 13.621685981750488, 14.048725128173828, 14.475763320922852, 14.902802467346191, 15.329840660095215]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 3.0, 8.0, 3.0, 0.0, 6.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.251260757446289, -10.830163955688477, -10.409067153930664, -9.987969398498535, -9.566872596740723, -9.14577579498291, -8.724678039550781, -8.303581237792969, -7.882484436035156, -7.461387634277344, -7.040290355682373, -6.619193077087402, -6.19809627532959, -5.776999473571777, -5.355902194976807, -4.934804916381836, -4.513708114624023, -4.092611312866211, -3.6715140342712402, -3.2504169940948486, -2.829319953918457, -2.4082229137420654, -1.9871258735656738, -1.5660288333892822, -1.1449317932128906, -0.723834753036499, -0.3027377128601074, 0.11835932731628418, 0.5394563674926758, 0.9605534076690674, 1.381650447845459, 1.8027474880218506, 2.223844528198242, 2.644941568374634, 3.0660386085510254, 3.487135648727417, 3.9082326889038086, 4.329329490661621, 4.750426769256592, 5.1715240478515625, 5.592620849609375, 6.0137176513671875, 6.434814929962158, 6.855912208557129, 7.277009010314941, 7.698105812072754, 8.119203567504883, 8.540300369262695, 8.961397171020508, 9.38249397277832, 9.803590774536133, 10.224688529968262, 10.645785331726074, 11.066882133483887, 11.487979888916016, 11.909076690673828, 12.33017349243164, 12.751270294189453, 13.172367095947266, 13.593464851379395, 14.014561653137207, 14.43565845489502, 14.856756210327148, 15.277853012084961, 15.698949813842773]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 20.0, 21.0, 22.0, 31.0, 53.0, 43.0, 55.0, 64.0, 81.0, 69.0, 78.0, 74.0, 67.0, 62.0, 41.0, 36.0, 32.0, 22.0, 25.0, 15.0, 15.0, 13.0, 11.0, 11.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.840667724609375, -0.81024169921875, -0.779815673828125, -0.7493896484375, -0.718963623046875, -0.68853759765625, -0.658111572265625, -0.627685546875, -0.597259521484375, -0.56683349609375, -0.536407470703125, -0.5059814453125, -0.475555419921875, -0.44512939453125, -0.414703369140625, -0.38427734375, -0.353851318359375, -0.32342529296875, -0.292999267578125, -0.2625732421875, -0.232147216796875, -0.20172119140625, -0.171295166015625, -0.140869140625, -0.110443115234375, -0.08001708984375, -0.049591064453125, -0.0191650390625, 0.011260986328125, 0.04168701171875, 0.072113037109375, 0.1025390625, 0.132965087890625, 0.16339111328125, 0.193817138671875, 0.2242431640625, 0.254669189453125, 0.28509521484375, 0.315521240234375, 0.345947265625, 0.376373291015625, 0.40679931640625, 0.437225341796875, 0.4676513671875, 0.498077392578125, 0.52850341796875, 0.558929443359375, 0.58935546875, 0.619781494140625, 0.65020751953125, 0.680633544921875, 0.7110595703125, 0.741485595703125, 0.77191162109375, 0.802337646484375, 0.832763671875, 0.863189697265625, 0.89361572265625, 0.924041748046875, 0.9544677734375, 0.984893798828125, 1.01531982421875, 1.045745849609375, 1.076171875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 14.0, 9.0, 20.0, 27.0, 52.0, 55.0, 89.0, 167.0, 302.0, 574.0, 1114.0, 2620.0, 6403.0, 17783.0, 53107.0, 150798.0, 179664.0, 70505.0, 24606.0, 9225.0, 3748.0, 1676.0, 761.0, 392.0, 245.0, 120.0, 68.0, 46.0, 24.0, 14.0, 9.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.89666748046875, -7.6839599609375, -7.47125244140625, -7.258544921875, -7.04583740234375, -6.8331298828125, -6.62042236328125, -6.40771484375, -6.19500732421875, -5.9822998046875, -5.76959228515625, -5.556884765625, -5.34417724609375, -5.1314697265625, -4.91876220703125, -4.7060546875, -4.49334716796875, -4.2806396484375, -4.06793212890625, -3.855224609375, -3.64251708984375, -3.4298095703125, -3.21710205078125, -3.00439453125, -2.79168701171875, -2.5789794921875, -2.36627197265625, -2.153564453125, -1.94085693359375, -1.7281494140625, -1.51544189453125, -1.302734375, -1.09002685546875, -0.8773193359375, -0.66461181640625, -0.451904296875, -0.23919677734375, -0.0264892578125, 0.18621826171875, 0.39892578125, 0.61163330078125, 0.8243408203125, 1.03704833984375, 1.249755859375, 1.46246337890625, 1.6751708984375, 1.88787841796875, 2.1005859375, 2.31329345703125, 2.5260009765625, 2.73870849609375, 2.951416015625, 3.16412353515625, 3.3768310546875, 3.58953857421875, 3.80224609375, 4.01495361328125, 4.2276611328125, 4.44036865234375, 4.653076171875, 4.86578369140625, 5.0784912109375, 5.29119873046875, 5.50390625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 6.0, 5.0, 9.0, 9.0, 10.0, 19.0, 21.0, 37.0, 37.0, 26.0, 41.0, 44.0, 62.0, 57.0, 81.0, 63.0, 69.0, 61.0, 53.0, 42.0, 39.0, 42.0, 28.0, 28.0, 20.0, 17.0, 17.0, 5.0, 10.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1376953125, -1.10296630859375, -1.0682373046875, -1.03350830078125, -0.998779296875, -0.96405029296875, -0.9293212890625, -0.89459228515625, -0.85986328125, -0.82513427734375, -0.7904052734375, -0.75567626953125, -0.720947265625, -0.68621826171875, -0.6514892578125, -0.61676025390625, -0.58203125, -0.54730224609375, -0.5125732421875, -0.47784423828125, -0.443115234375, -0.40838623046875, -0.3736572265625, -0.33892822265625, -0.30419921875, -0.26947021484375, -0.2347412109375, -0.20001220703125, -0.165283203125, -0.13055419921875, -0.0958251953125, -0.06109619140625, -0.0263671875, 0.00836181640625, 0.0430908203125, 0.07781982421875, 0.112548828125, 0.14727783203125, 0.1820068359375, 0.21673583984375, 0.25146484375, 0.28619384765625, 0.3209228515625, 0.35565185546875, 0.390380859375, 0.42510986328125, 0.4598388671875, 0.49456787109375, 0.529296875, 0.56402587890625, 0.5987548828125, 0.63348388671875, 0.668212890625, 0.70294189453125, 0.7376708984375, 0.77239990234375, 0.80712890625, 0.84185791015625, 0.8765869140625, 0.91131591796875, 0.946044921875, 0.98077392578125, 1.0155029296875, 1.05023193359375, 1.0849609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 6.0, 4.0, 4.0, 9.0, 15.0, 15.0, 37.0, 21.0, 40.0, 52.0, 56.0, 66.0, 40.0, 28.0, 20.0, 18.0, 12.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.822357177734375, -7.621732711791992, -7.421108245849609, -7.220483303070068, -7.0198588371276855, -6.819234371185303, -6.61860990524292, -6.417984962463379, -6.217360496520996, -6.016736030578613, -5.8161115646362305, -5.6154866218566895, -5.414862155914307, -5.214237689971924, -5.013613224029541, -4.81298828125, -4.612363815307617, -4.411739349365234, -4.211114883422852, -4.0104899406433105, -3.8098654747009277, -3.609241008758545, -3.408616542816162, -3.2079918384552, -3.0073676109313965, -2.8067431449890137, -2.6061184406280518, -2.405493974685669, -2.204869270324707, -2.004244804382324, -1.8036202192306519, -1.6029956340789795, -1.4023709297180176, -1.2017463445663452, -1.0011217594146729, -0.8004972338676453, -0.5998726487159729, -0.3992481231689453, -0.19862353801727295, 0.002001047134399414, 0.20262563228607178, 0.40325021743774414, 0.6038748025894165, 0.8044993281364441, 1.0051238536834717, 1.205748438835144, 1.4063730239868164, 1.6069976091384888, 1.8076221942901611, 2.008246660232544, 2.208871364593506, 2.4094958305358887, 2.6101205348968506, 2.8107450008392334, 3.0113697052001953, 3.211994171142578, 3.412618637084961, 3.6132431030273438, 3.8138678073883057, 4.014492511749268, 4.21511697769165, 4.415741443634033, 4.616365909576416, 4.816990852355957, 5.01761531829834]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 15.0, 5.0, 8.0, 17.0, 21.0, 32.0, 45.0, 74.0, 70.0, 62.0, 41.0, 21.0, 16.0, 11.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.803354263305664, -11.522051811218262, -11.24074935913086, -10.959447860717773, -10.678145408630371, -10.396842956542969, -10.115540504455566, -9.834238052368164, -9.552936553955078, -9.271634101867676, -8.990331649780273, -8.709030151367188, -8.427727699279785, -8.146425247192383, -7.8651227951049805, -7.583820819854736, -7.302518367767334, -7.021215915679932, -6.7399139404296875, -6.458611488342285, -6.177309513092041, -5.896007061004639, -5.6147050857543945, -5.333402633666992, -5.05210018157959, -4.7707977294921875, -4.489495754241943, -4.208193302154541, -3.926891326904297, -3.6455888748168945, -3.3642866611480713, -3.082984447479248, -2.801682472229004, -2.5203802585601807, -2.2390780448913574, -1.9577757120132446, -1.6764734983444214, -1.3951712846755981, -1.1138689517974854, -0.8325667381286621, -0.5512645244598389, -0.26996228098869324, 0.011339962482452393, 0.2926422357559204, 0.5739444494247437, 0.8552466630935669, 1.1365489959716797, 1.417851209640503, 1.6991534233093262, 1.9804556369781494, 2.2617578506469727, 2.543060302734375, 2.824362277984619, 3.1056647300720215, 3.3869669437408447, 3.668269157409668, 3.949571371078491, 4.2308735847473145, 4.512176036834717, 4.793478012084961, 5.074780464172363, 5.356082439422607, 5.63738489151001, 5.918686866760254, 6.199989318847656]}, "eval/loss": 1.7494096755981445, "eval/wer": 1.0532328441094803, "eval/runtime": 1261.3284, "eval/samples_per_second": 2.095, "eval/steps_per_second": 0.262, "train/train_runtime": 115954.4449, "train/train_samples_per_second": 4.922, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 1.0593869240786682} \ No newline at end of file +{"train/loss": 0.3634, "train/learning_rate": 4.750593824228029e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 117895, "_timestamp": 1647711773, "_step": 17848, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [3.0, 6.0, 11.0, 43.0, 105.0, 198.0, 326.0, 195.0, 91.0, 29.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845430850982666, -4.951228618621826, -4.057026386260986, -3.1628243923187256, -2.2686221599578857, -1.374420166015625, -0.48021793365478516, 0.4139842987060547, 1.3081865310668945, 2.2023887634277344, 3.096590995788574, 3.990792989730835, 4.884995460510254, 5.7791972160339355, 6.673399448394775, 7.567601680755615, 8.461803436279297, 9.356005668640137, 10.250207901000977, 11.144410133361816, 12.038612365722656, 12.93281364440918, 13.827016830444336, 14.72121810913086, 15.615421295166016, 16.50962257385254, 17.403825759887695, 18.29802703857422, 19.192230224609375, 20.0864315032959, 20.980634689331055, 21.874835968017578, 22.7690372467041, 23.663238525390625, 24.55744171142578, 25.451642990112305, 26.34584617614746, 27.240047454833984, 28.13425064086914, 29.028451919555664, 29.92265510559082, 30.816856384277344, 31.7110595703125, 32.605262756347656, 33.49946212768555, 34.3936653137207, 35.28786849975586, 36.182071685791016, 37.076271057128906, 37.97047424316406, 38.86467361450195, 39.75887680053711, 40.653079986572266, 41.54728317260742, 42.44148254394531, 43.33568572998047, 44.229888916015625, 45.12409210205078, 46.01829147338867, 46.91249465942383, 47.806697845458984, 48.70090103149414, 49.59510040283203, 50.48930358886719, 51.383506774902344]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 8.0, 12.0, 8.0, 8.0, 12.0, 17.0, 12.0, 24.0, 21.0, 22.0, 31.0, 34.0, 24.0, 27.0, 36.0, 42.0, 46.0, 40.0, 40.0, 44.0, 61.0, 46.0, 41.0, 33.0, 29.0, 41.0, 28.0, 30.0, 15.0, 24.0, 28.0, 18.0, 17.0, 17.0, 7.0, 6.0, 8.0, 8.0, 8.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.530182838439941, -5.347039222717285, -5.163896083831787, -4.980752468109131, -4.797609329223633, -4.614465713500977, -4.43132209777832, -4.248178482055664, -4.065035343170166, -3.881891965866089, -3.6987485885620117, -3.5156049728393555, -3.3324615955352783, -3.149318218231201, -2.966174602508545, -2.7830312252044678, -2.5998878479003906, -2.4167444705963135, -2.2336010932922363, -2.05045747756958, -1.867314100265503, -1.6841707229614258, -1.501027226448059, -1.3178837299346924, -1.1347403526306152, -0.9515969157218933, -0.7684534788131714, -0.5853100419044495, -0.40216660499572754, -0.21902316808700562, -0.03587973117828369, 0.147263765335083, 0.33040761947631836, 0.5135510563850403, 0.6966944932937622, 0.8798379302024841, 1.062981367111206, 1.2461247444152832, 1.42926824092865, 1.6124117374420166, 1.7955551147460938, 1.978698492050171, 2.161841869354248, 2.3449854850769043, 2.5281288623809814, 2.7112722396850586, 2.894415855407715, 3.077559232711792, 3.260702610015869, 3.4438459873199463, 3.6269893646240234, 3.8101329803466797, 3.993276357650757, 4.176419734954834, 4.35956335067749, 4.542706489562988, 4.7258501052856445, 4.908993721008301, 5.092136859893799, 5.275280475616455, 5.458423614501953, 5.641567230224609, 5.824710845947266, 6.007854461669922, 6.19099760055542]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 7.0, 7.0, 10.0, 18.0, 23.0, 18.0, 21.0, 34.0, 36.0, 37.0, 48.0, 45.0, 43.0, 57.0, 65.0, 69.0, 63.0, 51.0, 45.0, 33.0, 39.0, 39.0, 36.0, 28.0, 19.0, 23.0, 15.0, 17.0, 6.0, 6.0, 7.0, 7.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.7312545776367188, -0.7090911865234375, -0.6869277954101562, -0.664764404296875, -0.6426010131835938, -0.6204376220703125, -0.5982742309570312, -0.57611083984375, -0.5539474487304688, -0.5317840576171875, -0.5096206665039062, -0.487457275390625, -0.46529388427734375, -0.4431304931640625, -0.42096710205078125, -0.3988037109375, -0.37664031982421875, -0.3544769287109375, -0.33231353759765625, -0.310150146484375, -0.28798675537109375, -0.2658233642578125, -0.24365997314453125, -0.22149658203125, -0.19933319091796875, -0.1771697998046875, -0.15500640869140625, -0.132843017578125, -0.11067962646484375, -0.0885162353515625, -0.06635284423828125, -0.044189453125, -0.02202606201171875, 0.0001373291015625, 0.02230072021484375, 0.044464111328125, 0.06662750244140625, 0.0887908935546875, 0.11095428466796875, 0.13311767578125, 0.15528106689453125, 0.1774444580078125, 0.19960784912109375, 0.221771240234375, 0.24393463134765625, 0.2660980224609375, 0.28826141357421875, 0.3104248046875, 0.33258819580078125, 0.3547515869140625, 0.37691497802734375, 0.399078369140625, 0.42124176025390625, 0.4434051513671875, 0.46556854248046875, 0.48773193359375, 0.5098953247070312, 0.5320587158203125, 0.5542221069335938, 0.576385498046875, 0.5985488891601562, 0.6207122802734375, 0.6428756713867188, 0.6650390625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 14.0, 19.0, 32.0, 32.0, 49.0, 83.0, 100.0, 146.0, 196.0, 298.0, 475.0, 1167.0, 3939.0, 19260.0, 189804.0, 3827644.0, 128776.0, 16054.0, 3656.0, 1094.0, 489.0, 289.0, 178.0, 127.0, 81.0, 69.0, 61.0, 38.0, 39.0, 18.0, 21.0, 7.0, 8.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.26849365234375, -8.0135498046875, -7.75860595703125, -7.503662109375, -7.24871826171875, -6.9937744140625, -6.73883056640625, -6.48388671875, -6.22894287109375, -5.9739990234375, -5.71905517578125, -5.464111328125, -5.20916748046875, -4.9542236328125, -4.69927978515625, -4.4443359375, -4.18939208984375, -3.9344482421875, -3.67950439453125, -3.424560546875, -3.16961669921875, -2.9146728515625, -2.65972900390625, -2.40478515625, -2.14984130859375, -1.8948974609375, -1.63995361328125, -1.385009765625, -1.13006591796875, -0.8751220703125, -0.62017822265625, -0.365234375, -0.11029052734375, 0.1446533203125, 0.39959716796875, 0.654541015625, 0.90948486328125, 1.1644287109375, 1.41937255859375, 1.67431640625, 1.92926025390625, 2.1842041015625, 2.43914794921875, 2.694091796875, 2.94903564453125, 3.2039794921875, 3.45892333984375, 3.7138671875, 3.96881103515625, 4.2237548828125, 4.47869873046875, 4.733642578125, 4.98858642578125, 5.2435302734375, 5.49847412109375, 5.75341796875, 6.00836181640625, 6.2633056640625, 6.51824951171875, 6.773193359375, 7.02813720703125, 7.2830810546875, 7.53802490234375, 7.79296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 23.0, 63.0, 99.0, 194.0, 527.0, 1662.0, 903.0, 322.0, 141.0, 70.0, 39.0, 19.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.46923828125, -9.2666015625, -9.06396484375, -8.861328125, -8.65869140625, -8.4560546875, -8.25341796875, -8.05078125, -7.84814453125, -7.6455078125, -7.44287109375, -7.240234375, -7.03759765625, -6.8349609375, -6.63232421875, -6.4296875, -6.22705078125, -6.0244140625, -5.82177734375, -5.619140625, -5.41650390625, -5.2138671875, -5.01123046875, -4.80859375, -4.60595703125, -4.4033203125, -4.20068359375, -3.998046875, -3.79541015625, -3.5927734375, -3.39013671875, -3.1875, -2.98486328125, -2.7822265625, -2.57958984375, -2.376953125, -2.17431640625, -1.9716796875, -1.76904296875, -1.56640625, -1.36376953125, -1.1611328125, -0.95849609375, -0.755859375, -0.55322265625, -0.3505859375, -0.14794921875, 0.0546875, 0.25732421875, 0.4599609375, 0.66259765625, 0.865234375, 1.06787109375, 1.2705078125, 1.47314453125, 1.67578125, 1.87841796875, 2.0810546875, 2.28369140625, 2.486328125, 2.68896484375, 2.8916015625, 3.09423828125, 3.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 8.0, 15.0, 31.0, 41.0, 81.0, 160.0, 586.0, 4736.0, 195360.0, 3961587.0, 29464.0, 1617.0, 330.0, 111.0, 62.0, 45.0, 19.0, 15.0, 9.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.904541015625, -34.05908203125, -33.213623046875, -32.3681640625, -31.522705078125, -30.67724609375, -29.831787109375, -28.986328125, -28.140869140625, -27.29541015625, -26.449951171875, -25.6044921875, -24.759033203125, -23.91357421875, -23.068115234375, -22.22265625, -21.377197265625, -20.53173828125, -19.686279296875, -18.8408203125, -17.995361328125, -17.14990234375, -16.304443359375, -15.458984375, -14.613525390625, -13.76806640625, -12.922607421875, -12.0771484375, -11.231689453125, -10.38623046875, -9.540771484375, -8.6953125, -7.849853515625, -7.00439453125, -6.158935546875, -5.3134765625, -4.468017578125, -3.62255859375, -2.777099609375, -1.931640625, -1.086181640625, -0.24072265625, 0.604736328125, 1.4501953125, 2.295654296875, 3.14111328125, 3.986572265625, 4.83203125, 5.677490234375, 6.52294921875, 7.368408203125, 8.2138671875, 9.059326171875, 9.90478515625, 10.750244140625, 11.595703125, 12.441162109375, 13.28662109375, 14.132080078125, 14.9775390625, 15.822998046875, 16.66845703125, 17.513916015625, 18.359375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 12.0, 8.0, 27.0, 35.0, 57.0, 100.0, 99.0, 148.0, 125.0, 134.0, 95.0, 62.0, 49.0, 27.0, 9.0, 10.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.54487419128418, -23.042083740234375, -22.53929328918457, -22.036502838134766, -21.53371238708496, -21.030921936035156, -20.52813148498535, -20.025341033935547, -19.522550582885742, -19.019760131835938, -18.516969680786133, -18.014179229736328, -17.511388778686523, -17.00859832763672, -16.505807876586914, -16.00301742553711, -15.500226020812988, -14.997435569763184, -14.494645118713379, -13.991854667663574, -13.48906421661377, -12.986273765563965, -12.483482360839844, -11.980691909790039, -11.477901458740234, -10.97511100769043, -10.472320556640625, -9.96953010559082, -9.466739654541016, -8.963949203491211, -8.461158752441406, -7.958367824554443, -7.455578804016113, -6.952788352966309, -6.449997901916504, -5.947207450866699, -5.4444169998168945, -4.94162654876709, -4.438835620880127, -3.9360451698303223, -3.4332547187805176, -2.930464267730713, -2.427673816680908, -1.9248831272125244, -1.4220926761627197, -0.919302225112915, -0.41651153564453125, 0.08627891540527344, 0.5890693664550781, 1.0918598175048828, 1.594650387763977, 2.0974409580230713, 2.600231409072876, 3.1030218601226807, 3.6058125495910645, 4.108603000640869, 4.611393451690674, 5.1141839027404785, 5.616974353790283, 6.119765281677246, 6.622555732727051, 7.1253461837768555, 7.62813663482666, 8.130927085876465, 8.63371753692627]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 10.0, 7.0, 7.0, 10.0, 12.0, 9.0, 19.0, 21.0, 25.0, 35.0, 31.0, 45.0, 30.0, 30.0, 34.0, 50.0, 34.0, 47.0, 38.0, 49.0, 44.0, 32.0, 32.0, 35.0, 40.0, 36.0, 24.0, 34.0, 29.0, 30.0, 12.0, 20.0, 10.0, 14.0, 7.0, 7.0, 10.0, 3.0, 5.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.30954647064209, -8.061635971069336, -7.813724994659424, -7.565814018249512, -7.317903518676758, -7.069992542266846, -6.822081565856934, -6.57417106628418, -6.326260089874268, -6.0783491134643555, -5.830438613891602, -5.5825276374816895, -5.334616661071777, -5.086706161499023, -4.838795185089111, -4.590884208679199, -4.342973709106445, -4.095062732696533, -3.8471522331237793, -3.599241256713867, -3.351330518722534, -3.103419780731201, -2.855508804321289, -2.607598066329956, -2.359687328338623, -2.11177659034729, -1.8638657331466675, -1.615954875946045, -1.368044137954712, -1.120133399963379, -0.8722225427627563, -0.6243116855621338, -0.376401424407959, -0.1284906268119812, 0.11942017078399658, 0.36733096837997437, 0.6152417659759521, 0.8631525039672852, 1.1110633611679077, 1.3589742183685303, 1.6068849563598633, 1.8547956943511963, 2.1027064323425293, 2.3506174087524414, 2.5985281467437744, 2.8464388847351074, 3.0943498611450195, 3.3422605991363525, 3.5901713371276855, 3.8380820751190186, 4.085992813110352, 4.333903789520264, 4.581814765930176, 4.82972526550293, 5.077636241912842, 5.325547218322754, 5.573457717895508, 5.82136869430542, 6.069279193878174, 6.317190170288086, 6.56510066986084, 6.813011646270752, 7.060922622680664, 7.308833122253418, 7.55674409866333]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 11.0, 9.0, 10.0, 14.0, 9.0, 18.0, 24.0, 28.0, 29.0, 18.0, 28.0, 36.0, 24.0, 44.0, 35.0, 46.0, 38.0, 54.0, 51.0, 47.0, 44.0, 53.0, 38.0, 34.0, 28.0, 38.0, 41.0, 27.0, 14.0, 24.0, 11.0, 18.0, 13.0, 10.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.78271484375, -0.7615890502929688, -0.7404632568359375, -0.7193374633789062, -0.698211669921875, -0.6770858764648438, -0.6559600830078125, -0.6348342895507812, -0.61370849609375, -0.5925827026367188, -0.5714569091796875, -0.5503311157226562, -0.529205322265625, -0.5080795288085938, -0.4869537353515625, -0.46582794189453125, -0.4447021484375, -0.42357635498046875, -0.4024505615234375, -0.38132476806640625, -0.360198974609375, -0.33907318115234375, -0.3179473876953125, -0.29682159423828125, -0.27569580078125, -0.25457000732421875, -0.2334442138671875, -0.21231842041015625, -0.191192626953125, -0.17006683349609375, -0.1489410400390625, -0.12781524658203125, -0.106689453125, -0.08556365966796875, -0.0644378662109375, -0.04331207275390625, -0.022186279296875, -0.00106048583984375, 0.0200653076171875, 0.04119110107421875, 0.06231689453125, 0.08344268798828125, 0.1045684814453125, 0.12569427490234375, 0.146820068359375, 0.16794586181640625, 0.1890716552734375, 0.21019744873046875, 0.2313232421875, 0.25244903564453125, 0.2735748291015625, 0.29470062255859375, 0.315826416015625, 0.33695220947265625, 0.3580780029296875, 0.37920379638671875, 0.40032958984375, 0.42145538330078125, 0.4425811767578125, 0.46370697021484375, 0.484832763671875, 0.5059585571289062, 0.5270843505859375, 0.5482101440429688, 0.5693359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 8.0, 19.0, 17.0, 37.0, 76.0, 112.0, 150.0, 230.0, 350.0, 544.0, 851.0, 1294.0, 2068.0, 3260.0, 5435.0, 9017.0, 14766.0, 24497.0, 40298.0, 64996.0, 101558.0, 147295.0, 179144.0, 155404.0, 111210.0, 72108.0, 44589.0, 27220.0, 16203.0, 9685.0, 6128.0, 3702.0, 2260.0, 1442.0, 896.0, 594.0, 353.0, 248.0, 169.0, 98.0, 80.0, 43.0, 33.0, 23.0, 14.0, 6.0, 11.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66552734375, -0.645721435546875, -0.62591552734375, -0.606109619140625, -0.5863037109375, -0.566497802734375, -0.54669189453125, -0.526885986328125, -0.507080078125, -0.487274169921875, -0.46746826171875, -0.447662353515625, -0.4278564453125, -0.408050537109375, -0.38824462890625, -0.368438720703125, -0.3486328125, -0.328826904296875, -0.30902099609375, -0.289215087890625, -0.2694091796875, -0.249603271484375, -0.22979736328125, -0.209991455078125, -0.190185546875, -0.170379638671875, -0.15057373046875, -0.130767822265625, -0.1109619140625, -0.091156005859375, -0.07135009765625, -0.051544189453125, -0.03173828125, -0.011932373046875, 0.00787353515625, 0.027679443359375, 0.0474853515625, 0.067291259765625, 0.08709716796875, 0.106903076171875, 0.126708984375, 0.146514892578125, 0.16632080078125, 0.186126708984375, 0.2059326171875, 0.225738525390625, 0.24554443359375, 0.265350341796875, 0.28515625, 0.304962158203125, 0.32476806640625, 0.344573974609375, 0.3643798828125, 0.384185791015625, 0.40399169921875, 0.423797607421875, 0.443603515625, 0.463409423828125, 0.48321533203125, 0.503021240234375, 0.5228271484375, 0.542633056640625, 0.56243896484375, 0.582244873046875, 0.60205078125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 5.0, 5.0, 9.0, 14.0, 9.0, 14.0, 14.0, 22.0, 22.0, 23.0, 28.0, 39.0, 36.0, 35.0, 28.0, 48.0, 48.0, 40.0, 1067.0, 62.0, 42.0, 47.0, 50.0, 30.0, 34.0, 36.0, 29.0, 20.0, 23.0, 29.0, 18.0, 16.0, 13.0, 13.0, 10.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65673828125, -0.635223388671875, -0.61370849609375, -0.592193603515625, -0.5706787109375, -0.549163818359375, -0.52764892578125, -0.506134033203125, -0.484619140625, -0.463104248046875, -0.44158935546875, -0.420074462890625, -0.3985595703125, -0.377044677734375, -0.35552978515625, -0.334014892578125, -0.3125, -0.290985107421875, -0.26947021484375, -0.247955322265625, -0.2264404296875, -0.204925537109375, -0.18341064453125, -0.161895751953125, -0.140380859375, -0.118865966796875, -0.09735107421875, -0.075836181640625, -0.0543212890625, -0.032806396484375, -0.01129150390625, 0.010223388671875, 0.03173828125, 0.053253173828125, 0.07476806640625, 0.096282958984375, 0.1177978515625, 0.139312744140625, 0.16082763671875, 0.182342529296875, 0.203857421875, 0.225372314453125, 0.24688720703125, 0.268402099609375, 0.2899169921875, 0.311431884765625, 0.33294677734375, 0.354461669921875, 0.3759765625, 0.397491455078125, 0.41900634765625, 0.440521240234375, 0.4620361328125, 0.483551025390625, 0.50506591796875, 0.526580810546875, 0.548095703125, 0.569610595703125, 0.59112548828125, 0.612640380859375, 0.6341552734375, 0.655670166015625, 0.67718505859375, 0.698699951171875, 0.72021484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 6.0, 3.0, 5.0, 4.0, 12.0, 15.0, 20.0, 40.0, 59.0, 58.0, 82.0, 133.0, 210.0, 276.0, 378.0, 570.0, 813.0, 1164.0, 1750.0, 2669.0, 3797.0, 5615.0, 8660.0, 13629.0, 22686.0, 45313.0, 175298.0, 1443544.0, 249500.0, 53007.0, 25031.0, 14726.0, 9142.0, 6082.0, 4082.0, 2719.0, 1889.0, 1303.0, 869.0, 630.0, 412.0, 269.0, 208.0, 148.0, 101.0, 65.0, 51.0, 38.0, 16.0, 12.0, 11.0, 9.0, 4.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.59033203125, -0.5710296630859375, -0.551727294921875, -0.5324249267578125, -0.51312255859375, -0.4938201904296875, -0.474517822265625, -0.4552154541015625, -0.4359130859375, -0.4166107177734375, -0.397308349609375, -0.3780059814453125, -0.35870361328125, -0.3394012451171875, -0.320098876953125, -0.3007965087890625, -0.281494140625, -0.2621917724609375, -0.242889404296875, -0.2235870361328125, -0.20428466796875, -0.1849822998046875, -0.165679931640625, -0.1463775634765625, -0.1270751953125, -0.1077728271484375, -0.088470458984375, -0.0691680908203125, -0.04986572265625, -0.0305633544921875, -0.011260986328125, 0.0080413818359375, 0.02734375, 0.0466461181640625, 0.065948486328125, 0.0852508544921875, 0.10455322265625, 0.1238555908203125, 0.143157958984375, 0.1624603271484375, 0.1817626953125, 0.2010650634765625, 0.220367431640625, 0.2396697998046875, 0.25897216796875, 0.2782745361328125, 0.297576904296875, 0.3168792724609375, 0.336181640625, 0.3554840087890625, 0.374786376953125, 0.3940887451171875, 0.41339111328125, 0.4326934814453125, 0.451995849609375, 0.4712982177734375, 0.4906005859375, 0.5099029541015625, 0.529205322265625, 0.5485076904296875, 0.56781005859375, 0.5871124267578125, 0.606414794921875, 0.6257171630859375, 0.64501953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 14.0, 12.0, 15.0, 23.0, 25.0, 35.0, 40.0, 77.0, 105.0, 90.0, 103.0, 93.0, 93.0, 62.0, 55.0, 48.0, 23.0, 21.0, 9.0, 9.0, 11.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.21038246154785156, -0.20372390747070312, -0.1970653533935547, -0.19040679931640625, -0.1837482452392578, -0.17708969116210938, -0.17043113708496094, -0.1637725830078125, -0.15711402893066406, -0.15045547485351562, -0.1437969207763672, -0.13713836669921875, -0.1304798126220703, -0.12382125854492188, -0.11716270446777344, -0.110504150390625, -0.10384559631347656, -0.09718704223632812, -0.09052848815917969, -0.08386993408203125, -0.07721138000488281, -0.07055282592773438, -0.06389427185058594, -0.0572357177734375, -0.05057716369628906, -0.043918609619140625, -0.03726005554199219, -0.03060150146484375, -0.023942947387695312, -0.017284393310546875, -0.010625839233398438, -0.00396728515625, 0.0026912689208984375, 0.009349822998046875, 0.016008377075195312, 0.02266693115234375, 0.029325485229492188, 0.035984039306640625, 0.04264259338378906, 0.0493011474609375, 0.05595970153808594, 0.06261825561523438, 0.06927680969238281, 0.07593536376953125, 0.08259391784667969, 0.08925247192382812, 0.09591102600097656, 0.102569580078125, 0.10922813415527344, 0.11588668823242188, 0.12254524230957031, 0.12920379638671875, 0.1358623504638672, 0.14252090454101562, 0.14917945861816406, 0.1558380126953125, 0.16249656677246094, 0.16915512084960938, 0.1758136749267578, 0.18247222900390625, 0.1891307830810547, 0.19578933715820312, 0.20244789123535156, 0.2091064453125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 11.0, 9.0, 25.0, 16.0, 37.0, 50.0, 52.0, 72.0, 87.0, 143.0, 285.0, 586.0, 1903.0, 13715.0, 671972.0, 347247.0, 9655.0, 1437.0, 482.0, 235.0, 161.0, 108.0, 60.0, 61.0, 42.0, 19.0, 24.0, 14.0, 5.0, 7.0, 11.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3671875, -2.2880859375, -2.208984375, -2.1298828125, -2.05078125, -1.9716796875, -1.892578125, -1.8134765625, -1.734375, -1.6552734375, -1.576171875, -1.4970703125, -1.41796875, -1.3388671875, -1.259765625, -1.1806640625, -1.1015625, -1.0224609375, -0.943359375, -0.8642578125, -0.78515625, -0.7060546875, -0.626953125, -0.5478515625, -0.46875, -0.3896484375, -0.310546875, -0.2314453125, -0.15234375, -0.0732421875, 0.005859375, 0.0849609375, 0.1640625, 0.2431640625, 0.322265625, 0.4013671875, 0.48046875, 0.5595703125, 0.638671875, 0.7177734375, 0.796875, 0.8759765625, 0.955078125, 1.0341796875, 1.11328125, 1.1923828125, 1.271484375, 1.3505859375, 1.4296875, 1.5087890625, 1.587890625, 1.6669921875, 1.74609375, 1.8251953125, 1.904296875, 1.9833984375, 2.0625, 2.1416015625, 2.220703125, 2.2998046875, 2.37890625, 2.4580078125, 2.537109375, 2.6162109375, 2.6953125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 22.0, 20.0, 18.0, 36.0, 47.0, 75.0, 129.0, 177.0, 158.0, 122.0, 66.0, 45.0, 18.0, 19.0, 8.0, 9.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7907149195671082, -0.7484149932861328, -0.7061150670051575, -0.6638151407241821, -0.6215152740478516, -0.5792152881622314, -0.5369154214859009, -0.49461549520492554, -0.4523155689239502, -0.41001564264297485, -0.3677157163619995, -0.32541581988334656, -0.2831158936023712, -0.24081596732139587, -0.19851607084274292, -0.15621614456176758, -0.11391621828079224, -0.07161629945039749, -0.029316380620002747, 0.012983530759811401, 0.05528345704078674, 0.09758338332176208, 0.13988327980041504, 0.18218320608139038, 0.22448313236236572, 0.26678305864334106, 0.3090829849243164, 0.35138288140296936, 0.3936828076839447, 0.43598273396492004, 0.478282630443573, 0.5205825567245483, 0.5628825426101685, 0.6051824688911438, 0.6474823951721191, 0.6897822618484497, 0.7320822477340698, 0.7743821144104004, 0.8166820406913757, 0.8589819669723511, 0.9012818932533264, 0.9435818195343018, 0.9858817458152771, 1.0281816720962524, 1.070481538772583, 1.1127815246582031, 1.1550813913345337, 1.1973812580108643, 1.2396812438964844, 1.281981110572815, 1.324281096458435, 1.3665809631347656, 1.4088809490203857, 1.4511808156967163, 1.4934806823730469, 1.535780668258667, 1.578080654144287, 1.6203805208206177, 1.6626805067062378, 1.7049803733825684, 1.7472803592681885, 1.789580225944519, 1.8318800926208496, 1.8741800785064697, 1.9164799451828003]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 6.0, 1.0, 1.0, 3.0, 9.0, 7.0, 11.0, 16.0, 16.0, 27.0, 20.0, 35.0, 27.0, 36.0, 38.0, 40.0, 43.0, 59.0, 47.0, 53.0, 40.0, 41.0, 53.0, 54.0, 47.0, 41.0, 42.0, 29.0, 30.0, 26.0, 19.0, 21.0, 12.0, 10.0, 10.0, 12.0, 4.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46852099895477295, -0.45353963971138, -0.43855828046798706, -0.4235769212245941, -0.40859556198120117, -0.39361417293548584, -0.3786328434944153, -0.36365145444869995, -0.348670095205307, -0.33368873596191406, -0.3187073767185211, -0.3037260174751282, -0.28874465823173523, -0.2737632989883423, -0.25878190994262695, -0.243800550699234, -0.22881920635700226, -0.21383784711360931, -0.19885648787021637, -0.18387511372566223, -0.1688937544822693, -0.15391239523887634, -0.1389310359954834, -0.12394966930150986, -0.10896831005811691, -0.09398695081472397, -0.07900558412075043, -0.06402422487735748, -0.04904286190867424, -0.034061498939991, -0.019080139696598053, -0.004098773002624512, 0.010882586240768433, 0.025863949209451675, 0.04084531217813492, 0.05582667142152786, 0.0708080381155014, 0.08578939735889435, 0.10077075660228729, 0.11575212329626083, 0.13073348999023438, 0.14571484923362732, 0.16069620847702026, 0.1756775677204132, 0.19065894186496735, 0.2056403011083603, 0.22062166035175323, 0.23560303449630737, 0.25058436393737793, 0.2655657231807709, 0.2805470824241638, 0.29552844166755676, 0.3105098009109497, 0.32549118995666504, 0.3404725193977356, 0.3554539084434509, 0.37043526768684387, 0.3854166269302368, 0.40039798617362976, 0.4153793454170227, 0.43036070466041565, 0.4453420639038086, 0.4603234529495239, 0.47530481219291687, 0.4902861714363098]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 11.0, 3.0, 10.0, 8.0, 11.0, 16.0, 13.0, 12.0, 31.0, 32.0, 18.0, 32.0, 33.0, 38.0, 42.0, 39.0, 37.0, 47.0, 49.0, 55.0, 46.0, 49.0, 56.0, 43.0, 41.0, 43.0, 31.0, 23.0, 17.0, 20.0, 12.0, 18.0, 20.0, 13.0, 12.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.77734375, -0.7553939819335938, -0.7334442138671875, -0.7114944458007812, -0.689544677734375, -0.6675949096679688, -0.6456451416015625, -0.6236953735351562, -0.60174560546875, -0.5797958374023438, -0.5578460693359375, -0.5358963012695312, -0.513946533203125, -0.49199676513671875, -0.4700469970703125, -0.44809722900390625, -0.4261474609375, -0.40419769287109375, -0.3822479248046875, -0.36029815673828125, -0.338348388671875, -0.31639862060546875, -0.2944488525390625, -0.27249908447265625, -0.25054931640625, -0.22859954833984375, -0.2066497802734375, -0.18470001220703125, -0.162750244140625, -0.14080047607421875, -0.1188507080078125, -0.09690093994140625, -0.074951171875, -0.05300140380859375, -0.0310516357421875, -0.00910186767578125, 0.012847900390625, 0.03479766845703125, 0.0567474365234375, 0.07869720458984375, 0.10064697265625, 0.12259674072265625, 0.1445465087890625, 0.16649627685546875, 0.188446044921875, 0.21039581298828125, 0.2323455810546875, 0.25429534912109375, 0.2762451171875, 0.29819488525390625, 0.3201446533203125, 0.34209442138671875, 0.364044189453125, 0.38599395751953125, 0.4079437255859375, 0.42989349365234375, 0.45184326171875, 0.47379302978515625, 0.4957427978515625, 0.5176925659179688, 0.539642333984375, 0.5615921020507812, 0.5835418701171875, 0.6054916381835938, 0.62744140625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 22.0, 23.0, 42.0, 41.0, 63.0, 109.0, 122.0, 219.0, 336.0, 496.0, 756.0, 1183.0, 2094.0, 3478.0, 5824.0, 10793.0, 20451.0, 42165.0, 94178.0, 211628.0, 315258.0, 181151.0, 80677.0, 36428.0, 18022.0, 9609.0, 5262.0, 3079.0, 1811.0, 1094.0, 727.0, 474.0, 304.0, 197.0, 136.0, 91.0, 58.0, 26.0, 32.0, 27.0, 18.0, 11.0, 11.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.861328125, -1.80560302734375, -1.7498779296875, -1.69415283203125, -1.638427734375, -1.58270263671875, -1.5269775390625, -1.47125244140625, -1.41552734375, -1.35980224609375, -1.3040771484375, -1.24835205078125, -1.192626953125, -1.13690185546875, -1.0811767578125, -1.02545166015625, -0.9697265625, -0.91400146484375, -0.8582763671875, -0.80255126953125, -0.746826171875, -0.69110107421875, -0.6353759765625, -0.57965087890625, -0.52392578125, -0.46820068359375, -0.4124755859375, -0.35675048828125, -0.301025390625, -0.24530029296875, -0.1895751953125, -0.13385009765625, -0.078125, -0.02239990234375, 0.0333251953125, 0.08905029296875, 0.144775390625, 0.20050048828125, 0.2562255859375, 0.31195068359375, 0.36767578125, 0.42340087890625, 0.4791259765625, 0.53485107421875, 0.590576171875, 0.64630126953125, 0.7020263671875, 0.75775146484375, 0.8134765625, 0.86920166015625, 0.9249267578125, 0.98065185546875, 1.036376953125, 1.09210205078125, 1.1478271484375, 1.20355224609375, 1.25927734375, 1.31500244140625, 1.3707275390625, 1.42645263671875, 1.482177734375, 1.53790283203125, 1.5936279296875, 1.64935302734375, 1.705078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 6.0, 5.0, 6.0, 21.0, 25.0, 34.0, 38.0, 39.0, 64.0, 84.0, 119.0, 222.0, 866.0, 842.0, 209.0, 126.0, 86.0, 65.0, 46.0, 39.0, 37.0, 28.0, 16.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.625, -3.5, -3.375, -3.25, -3.125, -3.0, -2.875, -2.75, -2.625, -2.5, -2.375, -2.25, -2.125, -2.0, -1.875, -1.75, -1.625, -1.5, -1.375, -1.25, -1.125, -1.0, -0.875, -0.75, -0.625, -0.5, -0.375, -0.25, -0.125, 0.0, 0.125, 0.25, 0.375, 0.5, 0.625, 0.75, 0.875, 1.0, 1.125, 1.25, 1.375, 1.5, 1.625, 1.75, 1.875, 2.0, 2.125, 2.25, 2.375, 2.5, 2.625, 2.75, 2.875, 3.0, 3.125, 3.25, 3.375, 3.5, 3.625, 3.75, 3.875, 4.0, 4.125, 4.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 4.0, 10.0, 10.0, 7.0, 28.0, 30.0, 43.0, 58.0, 94.0, 156.0, 312.0, 485.0, 925.0, 1694.0, 4049.0, 11945.0, 79239.0, 2364643.0, 636204.0, 32461.0, 7375.0, 2822.0, 1386.0, 721.0, 369.0, 225.0, 141.0, 82.0, 57.0, 37.0, 24.0, 22.0, 7.0, 11.0, 8.0, 4.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0625, -7.80078125, -7.5390625, -7.27734375, -7.015625, -6.75390625, -6.4921875, -6.23046875, -5.96875, -5.70703125, -5.4453125, -5.18359375, -4.921875, -4.66015625, -4.3984375, -4.13671875, -3.875, -3.61328125, -3.3515625, -3.08984375, -2.828125, -2.56640625, -2.3046875, -2.04296875, -1.78125, -1.51953125, -1.2578125, -0.99609375, -0.734375, -0.47265625, -0.2109375, 0.05078125, 0.3125, 0.57421875, 0.8359375, 1.09765625, 1.359375, 1.62109375, 1.8828125, 2.14453125, 2.40625, 2.66796875, 2.9296875, 3.19140625, 3.453125, 3.71484375, 3.9765625, 4.23828125, 4.5, 4.76171875, 5.0234375, 5.28515625, 5.546875, 5.80859375, 6.0703125, 6.33203125, 6.59375, 6.85546875, 7.1171875, 7.37890625, 7.640625, 7.90234375, 8.1640625, 8.42578125, 8.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 53.0, 375.0, 507.0, 71.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.940403938293457, -10.264060020446777, -8.587717056274414, -6.911373138427734, -5.235029697418213, -3.5586862564086914, -1.8823423385620117, -0.20599937438964844, 1.4703445434570312, 3.1466879844665527, 4.823031425476074, 6.499375343322754, 8.175718307495117, 9.852062225341797, 11.528406143188477, 13.20474910736084, 14.88109302520752, 16.557435989379883, 18.233779907226562, 19.910123825073242, 21.586467742919922, 23.26280975341797, 24.93915557861328, 26.615497589111328, 28.291841506958008, 29.968185424804688, 31.644529342651367, 33.32087326049805, 34.997215270996094, 36.673561096191406, 38.34990310668945, 40.0262451171875, 41.70258712768555, 43.378929138183594, 45.055274963378906, 46.73161697387695, 48.407962799072266, 50.08430480957031, 51.760650634765625, 53.43699264526367, 55.11333465576172, 56.789676666259766, 58.46602249145508, 60.142364501953125, 61.81871032714844, 63.495052337646484, 65.17139434814453, 66.84774017333984, 68.52408599853516, 70.20043182373047, 71.87677001953125, 73.55311584472656, 75.22946166992188, 76.90580749511719, 78.58214569091797, 80.25849151611328, 81.93482971191406, 83.61117553710938, 85.28751373291016, 86.96385955810547, 88.64020538330078, 90.31654357910156, 91.99288940429688, 93.66923522949219, 95.3455810546875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 12.0, 9.0, 10.0, 8.0, 11.0, 9.0, 18.0, 18.0, 20.0, 31.0, 31.0, 31.0, 41.0, 34.0, 35.0, 42.0, 54.0, 40.0, 52.0, 51.0, 43.0, 48.0, 48.0, 32.0, 43.0, 34.0, 33.0, 32.0, 20.0, 20.0, 13.0, 12.0, 20.0, 13.0, 9.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101920127868652, -8.788911819458008, -8.475902557373047, -8.162894248962402, -7.8498854637146, -7.536876678466797, -7.223868370056152, -6.91085958480835, -6.597850799560547, -6.284842014312744, -5.971833229064941, -5.658824920654297, -5.345816135406494, -5.032807350158691, -4.719799041748047, -4.406790256500244, -4.093781471252441, -3.7807726860046387, -3.467764139175415, -3.1547555923461914, -2.8417468070983887, -2.528738021850586, -2.2157294750213623, -1.9027209281921387, -1.589712142944336, -1.2767034769058228, -0.9636948108673096, -0.6506861448287964, -0.3376774787902832, -0.02466881275177002, 0.28833985328674316, 0.6013484001159668, 0.9143571853637695, 1.2273658514022827, 1.540374517440796, 1.853383183479309, 2.1663918495178223, 2.479400634765625, 2.7924091815948486, 3.1054177284240723, 3.418426513671875, 3.7314352989196777, 4.0444440841674805, 4.357452392578125, 4.670461177825928, 4.9834699630737305, 5.296478271484375, 5.609487056732178, 5.9224958419799805, 6.235504627227783, 6.548513412475586, 6.8615217208862305, 7.174530506134033, 7.487539291381836, 7.8005475997924805, 8.113555908203125, 8.426565170288086, 8.73957347869873, 9.052582740783691, 9.365591049194336, 9.678600311279297, 9.991608619689941, 10.304616928100586, 10.617626190185547, 10.930634498596191]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 10.0, 10.0, 12.0, 17.0, 18.0, 19.0, 23.0, 25.0, 30.0, 29.0, 43.0, 37.0, 34.0, 39.0, 37.0, 46.0, 50.0, 38.0, 33.0, 65.0, 32.0, 38.0, 40.0, 28.0, 32.0, 36.0, 30.0, 20.0, 17.0, 16.0, 11.0, 18.0, 6.0, 11.0, 5.0, 3.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7250900268554688, -0.7016448974609375, -0.6781997680664062, -0.654754638671875, -0.6313095092773438, -0.6078643798828125, -0.5844192504882812, -0.56097412109375, -0.5375289916992188, -0.5140838623046875, -0.49063873291015625, -0.467193603515625, -0.44374847412109375, -0.4203033447265625, -0.39685821533203125, -0.3734130859375, -0.34996795654296875, -0.3265228271484375, -0.30307769775390625, -0.279632568359375, -0.25618743896484375, -0.2327423095703125, -0.20929718017578125, -0.18585205078125, -0.16240692138671875, -0.1389617919921875, -0.11551666259765625, -0.092071533203125, -0.06862640380859375, -0.0451812744140625, -0.02173614501953125, 0.001708984375, 0.02515411376953125, 0.0485992431640625, 0.07204437255859375, 0.095489501953125, 0.11893463134765625, 0.1423797607421875, 0.16582489013671875, 0.18927001953125, 0.21271514892578125, 0.2361602783203125, 0.25960540771484375, 0.283050537109375, 0.30649566650390625, 0.3299407958984375, 0.35338592529296875, 0.3768310546875, 0.40027618408203125, 0.4237213134765625, 0.44716644287109375, 0.470611572265625, 0.49405670166015625, 0.5175018310546875, 0.5409469604492188, 0.56439208984375, 0.5878372192382812, 0.6112823486328125, 0.6347274780273438, 0.658172607421875, 0.6816177368164062, 0.7050628662109375, 0.7285079956054688, 0.751953125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 23.0, 25.0, 35.0, 57.0, 96.0, 116.0, 181.0, 284.0, 495.0, 606.0, 1054.0, 1618.0, 2402.0, 3804.0, 6113.0, 9866.0, 17006.0, 31432.0, 63784.0, 167367.0, 812541.0, 2269823.0, 550536.0, 133501.0, 54398.0, 27436.0, 14985.0, 9047.0, 5436.0, 3512.0, 2340.0, 1412.0, 921.0, 675.0, 455.0, 283.0, 196.0, 121.0, 87.0, 69.0, 49.0, 26.0, 17.0, 14.0, 7.0, 10.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.6441497802734375, -1.590057373046875, -1.5359649658203125, -1.48187255859375, -1.4277801513671875, -1.373687744140625, -1.3195953369140625, -1.2655029296875, -1.2114105224609375, -1.157318115234375, -1.1032257080078125, -1.04913330078125, -0.9950408935546875, -0.940948486328125, -0.8868560791015625, -0.832763671875, -0.7786712646484375, -0.724578857421875, -0.6704864501953125, -0.61639404296875, -0.5623016357421875, -0.508209228515625, -0.4541168212890625, -0.4000244140625, -0.3459320068359375, -0.291839599609375, -0.2377471923828125, -0.18365478515625, -0.1295623779296875, -0.075469970703125, -0.0213775634765625, 0.03271484375, 0.0868072509765625, 0.140899658203125, 0.1949920654296875, 0.24908447265625, 0.3031768798828125, 0.357269287109375, 0.4113616943359375, 0.4654541015625, 0.5195465087890625, 0.573638916015625, 0.6277313232421875, 0.68182373046875, 0.7359161376953125, 0.790008544921875, 0.8441009521484375, 0.898193359375, 0.9522857666015625, 1.006378173828125, 1.0604705810546875, 1.11456298828125, 1.1686553955078125, 1.222747802734375, 1.2768402099609375, 1.3309326171875, 1.3850250244140625, 1.439117431640625, 1.4932098388671875, 1.54730224609375, 1.6013946533203125, 1.655487060546875, 1.7095794677734375, 1.763671875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 8.0, 15.0, 28.0, 38.0, 66.0, 104.0, 215.0, 418.0, 854.0, 1052.0, 537.0, 327.0, 169.0, 93.0, 58.0, 32.0, 19.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.18212890625, -3.0322265625, -2.88232421875, -2.732421875, -2.58251953125, -2.4326171875, -2.28271484375, -2.1328125, -1.98291015625, -1.8330078125, -1.68310546875, -1.533203125, -1.38330078125, -1.2333984375, -1.08349609375, -0.93359375, -0.78369140625, -0.6337890625, -0.48388671875, -0.333984375, -0.18408203125, -0.0341796875, 0.11572265625, 0.265625, 0.41552734375, 0.5654296875, 0.71533203125, 0.865234375, 1.01513671875, 1.1650390625, 1.31494140625, 1.46484375, 1.61474609375, 1.7646484375, 1.91455078125, 2.064453125, 2.21435546875, 2.3642578125, 2.51416015625, 2.6640625, 2.81396484375, 2.9638671875, 3.11376953125, 3.263671875, 3.41357421875, 3.5634765625, 3.71337890625, 3.86328125, 4.01318359375, 4.1630859375, 4.31298828125, 4.462890625, 4.61279296875, 4.7626953125, 4.91259765625, 5.0625, 5.21240234375, 5.3623046875, 5.51220703125, 5.662109375, 5.81201171875, 5.9619140625, 6.11181640625, 6.26171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 20.0, 25.0, 24.0, 45.0, 50.0, 85.0, 136.0, 207.0, 260.0, 534.0, 1127.0, 2912.0, 9388.0, 40953.0, 294113.0, 3348972.0, 426475.0, 51464.0, 11273.0, 3387.0, 1223.0, 593.0, 344.0, 198.0, 143.0, 105.0, 66.0, 45.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.55718994140625, -5.3214111328125, -5.08563232421875, -4.849853515625, -4.61407470703125, -4.3782958984375, -4.14251708984375, -3.90673828125, -3.67095947265625, -3.4351806640625, -3.19940185546875, -2.963623046875, -2.72784423828125, -2.4920654296875, -2.25628662109375, -2.0205078125, -1.78472900390625, -1.5489501953125, -1.31317138671875, -1.077392578125, -0.84161376953125, -0.6058349609375, -0.37005615234375, -0.13427734375, 0.10150146484375, 0.3372802734375, 0.57305908203125, 0.808837890625, 1.04461669921875, 1.2803955078125, 1.51617431640625, 1.751953125, 1.98773193359375, 2.2235107421875, 2.45928955078125, 2.695068359375, 2.93084716796875, 3.1666259765625, 3.40240478515625, 3.63818359375, 3.87396240234375, 4.1097412109375, 4.34552001953125, 4.581298828125, 4.81707763671875, 5.0528564453125, 5.28863525390625, 5.5244140625, 5.76019287109375, 5.9959716796875, 6.23175048828125, 6.467529296875, 6.70330810546875, 6.9390869140625, 7.17486572265625, 7.41064453125, 7.64642333984375, 7.8822021484375, 8.11798095703125, 8.353759765625, 8.58953857421875, 8.8253173828125, 9.06109619140625, 9.296875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 9.0, 3.0, 8.0, 18.0, 24.0, 24.0, 41.0, 44.0, 59.0, 80.0, 87.0, 130.0, 106.0, 87.0, 62.0, 60.0, 53.0, 32.0, 28.0, 14.0, 13.0, 9.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.659172058105469, -15.299201011657715, -14.939230918884277, -14.579259872436523, -14.219289779663086, -13.859318733215332, -13.499347686767578, -13.13937759399414, -12.779406547546387, -12.419435501098633, -12.059465408325195, -11.699494361877441, -11.339523315429688, -10.97955322265625, -10.619582176208496, -10.259611129760742, -9.899641036987305, -9.53966999053955, -9.179699897766113, -8.81972885131836, -8.459758758544922, -8.099787712097168, -7.739816665649414, -7.379846096038818, -7.019875526428223, -6.659904956817627, -6.299934387207031, -5.939963340759277, -5.579992771148682, -5.220022201538086, -4.860051155090332, -4.500080585479736, -4.140110015869141, -3.780139446258545, -3.42016863822937, -3.0601978302001953, -2.7002272605895996, -2.340256690979004, -1.980285882949829, -1.6203150749206543, -1.2603445053100586, -0.9003738164901733, -0.5404031276702881, -0.18043243885040283, 0.17953824996948242, 0.5395089387893677, 0.8994796276092529, 1.2594504356384277, 1.6194210052490234, 1.9793916940689087, 2.339362382888794, 2.6993331909179688, 3.0593037605285645, 3.41927433013916, 3.779245138168335, 4.13921594619751, 4.4991865158081055, 4.859157085418701, 5.219127655029297, 5.579098701477051, 5.9390692710876465, 6.299039840698242, 6.659010887145996, 7.018981456756592, 7.3789520263671875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 9.0, 5.0, 9.0, 13.0, 13.0, 16.0, 18.0, 20.0, 22.0, 26.0, 38.0, 29.0, 30.0, 32.0, 33.0, 35.0, 40.0, 38.0, 42.0, 55.0, 43.0, 33.0, 47.0, 42.0, 40.0, 35.0, 31.0, 25.0, 20.0, 27.0, 17.0, 19.0, 17.0, 17.0, 10.0, 14.0, 9.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.366325378417969, -9.082765579223633, -8.79920482635498, -8.515645027160645, -8.232085227966309, -7.948524475097656, -7.66496467590332, -7.381404399871826, -7.097844123840332, -6.814283847808838, -6.530724048614502, -6.247163772583008, -5.963603496551514, -5.6800432205200195, -5.396483421325684, -5.1129231452941895, -4.8293633460998535, -4.545803070068359, -4.262243270874023, -3.9786829948425293, -3.695122718811035, -3.41156268119812, -3.128002643585205, -2.844442367553711, -2.560882329940796, -2.277322292327881, -1.9937620162963867, -1.7102019786834717, -1.426641821861267, -1.1430816650390625, -0.8595216274261475, -0.5759614706039429, -0.2924013137817383, -0.008841186761856079, 0.2747189402580261, 0.5582790374755859, 0.8418391942977905, 1.1253993511199951, 1.4089593887329102, 1.6925195455551147, 1.9760797023773193, 2.2596397399902344, 2.5432000160217285, 2.8267600536346436, 3.1103200912475586, 3.3938803672790527, 3.6774404048919678, 3.961000442504883, 4.244560718536377, 4.528120994567871, 4.811680793762207, 5.095241069793701, 5.378801345825195, 5.662361145019531, 5.945921421051025, 6.2294816970825195, 6.5130414962768555, 6.79660177230835, 7.0801615715026855, 7.36372184753418, 7.647282123565674, 7.930842399597168, 8.214402198791504, 8.49796199798584, 8.781522750854492]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 11.0, 16.0, 19.0, 22.0, 21.0, 16.0, 35.0, 38.0, 37.0, 30.0, 33.0, 34.0, 40.0, 50.0, 49.0, 52.0, 50.0, 38.0, 39.0, 46.0, 35.0, 34.0, 31.0, 18.0, 32.0, 25.0, 19.0, 24.0, 13.0, 16.0, 10.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7509765625, -0.726806640625, -0.70263671875, -0.678466796875, -0.654296875, -0.630126953125, -0.60595703125, -0.581787109375, -0.5576171875, -0.533447265625, -0.50927734375, -0.485107421875, -0.4609375, -0.436767578125, -0.41259765625, -0.388427734375, -0.3642578125, -0.340087890625, -0.31591796875, -0.291748046875, -0.267578125, -0.243408203125, -0.21923828125, -0.195068359375, -0.1708984375, -0.146728515625, -0.12255859375, -0.098388671875, -0.07421875, -0.050048828125, -0.02587890625, -0.001708984375, 0.0224609375, 0.046630859375, 0.07080078125, 0.094970703125, 0.119140625, 0.143310546875, 0.16748046875, 0.191650390625, 0.2158203125, 0.239990234375, 0.26416015625, 0.288330078125, 0.3125, 0.336669921875, 0.36083984375, 0.385009765625, 0.4091796875, 0.433349609375, 0.45751953125, 0.481689453125, 0.505859375, 0.530029296875, 0.55419921875, 0.578369140625, 0.6025390625, 0.626708984375, 0.65087890625, 0.675048828125, 0.69921875, 0.723388671875, 0.74755859375, 0.771728515625, 0.7958984375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 17.0, 25.0, 29.0, 56.0, 82.0, 136.0, 163.0, 258.0, 364.0, 537.0, 760.0, 1026.0, 1492.0, 2322.0, 3281.0, 4664.0, 6876.0, 10158.0, 14604.0, 21760.0, 32012.0, 46455.0, 66102.0, 89496.0, 112905.0, 130327.0, 125596.0, 105952.0, 81271.0, 59616.0, 41478.0, 28299.0, 19310.0, 12773.0, 8924.0, 6065.0, 4152.0, 2812.0, 2024.0, 1361.0, 872.0, 654.0, 479.0, 319.0, 228.0, 156.0, 109.0, 73.0, 39.0, 27.0, 19.0, 14.0, 9.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.56494140625, -0.5477371215820312, -0.5305328369140625, -0.5133285522460938, -0.496124267578125, -0.47891998291015625, -0.4617156982421875, -0.44451141357421875, -0.42730712890625, -0.41010284423828125, -0.3928985595703125, -0.37569427490234375, -0.358489990234375, -0.34128570556640625, -0.3240814208984375, -0.30687713623046875, -0.2896728515625, -0.27246856689453125, -0.2552642822265625, -0.23805999755859375, -0.220855712890625, -0.20365142822265625, -0.1864471435546875, -0.16924285888671875, -0.15203857421875, -0.13483428955078125, -0.1176300048828125, -0.10042572021484375, -0.083221435546875, -0.06601715087890625, -0.0488128662109375, -0.03160858154296875, -0.014404296875, 0.00279998779296875, 0.0200042724609375, 0.03720855712890625, 0.054412841796875, 0.07161712646484375, 0.0888214111328125, 0.10602569580078125, 0.12322998046875, 0.14043426513671875, 0.1576385498046875, 0.17484283447265625, 0.192047119140625, 0.20925140380859375, 0.2264556884765625, 0.24365997314453125, 0.2608642578125, 0.27806854248046875, 0.2952728271484375, 0.31247711181640625, 0.329681396484375, 0.34688568115234375, 0.3640899658203125, 0.38129425048828125, 0.39849853515625, 0.41570281982421875, 0.4329071044921875, 0.45011138916015625, 0.467315673828125, 0.48451995849609375, 0.5017242431640625, 0.5189285278320312, 0.5361328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 12.0, 5.0, 3.0, 12.0, 11.0, 11.0, 19.0, 12.0, 12.0, 25.0, 23.0, 25.0, 27.0, 31.0, 36.0, 34.0, 34.0, 39.0, 47.0, 44.0, 1067.0, 33.0, 42.0, 36.0, 34.0, 31.0, 39.0, 44.0, 40.0, 26.0, 25.0, 21.0, 35.0, 14.0, 14.0, 11.0, 10.0, 7.0, 4.0, 7.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7138671875, -0.6908111572265625, -0.667755126953125, -0.6446990966796875, -0.62164306640625, -0.5985870361328125, -0.575531005859375, -0.5524749755859375, -0.5294189453125, -0.5063629150390625, -0.483306884765625, -0.4602508544921875, -0.43719482421875, -0.4141387939453125, -0.391082763671875, -0.3680267333984375, -0.344970703125, -0.3219146728515625, -0.298858642578125, -0.2758026123046875, -0.25274658203125, -0.2296905517578125, -0.206634521484375, -0.1835784912109375, -0.1605224609375, -0.1374664306640625, -0.114410400390625, -0.0913543701171875, -0.06829833984375, -0.0452423095703125, -0.022186279296875, 0.0008697509765625, 0.02392578125, 0.0469818115234375, 0.070037841796875, 0.0930938720703125, 0.11614990234375, 0.1392059326171875, 0.162261962890625, 0.1853179931640625, 0.2083740234375, 0.2314300537109375, 0.254486083984375, 0.2775421142578125, 0.30059814453125, 0.3236541748046875, 0.346710205078125, 0.3697662353515625, 0.392822265625, 0.4158782958984375, 0.438934326171875, 0.4619903564453125, 0.48504638671875, 0.5081024169921875, 0.531158447265625, 0.5542144775390625, 0.5772705078125, 0.6003265380859375, 0.623382568359375, 0.6464385986328125, 0.66949462890625, 0.6925506591796875, 0.715606689453125, 0.7386627197265625, 0.76171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 12.0, 10.0, 23.0, 28.0, 63.0, 58.0, 96.0, 131.0, 224.0, 309.0, 515.0, 672.0, 1075.0, 1639.0, 2355.0, 3661.0, 5358.0, 8275.0, 13067.0, 22011.0, 47711.0, 259574.0, 1510294.0, 132842.0, 35779.0, 18520.0, 11449.0, 7214.0, 4671.0, 3221.0, 2039.0, 1405.0, 909.0, 634.0, 401.0, 288.0, 215.0, 127.0, 78.0, 63.0, 29.0, 29.0, 19.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6856231689453125, -0.662261962890625, -0.6389007568359375, -0.61553955078125, -0.5921783447265625, -0.568817138671875, -0.5454559326171875, -0.5220947265625, -0.4987335205078125, -0.475372314453125, -0.4520111083984375, -0.42864990234375, -0.4052886962890625, -0.381927490234375, -0.3585662841796875, -0.335205078125, -0.3118438720703125, -0.288482666015625, -0.2651214599609375, -0.24176025390625, -0.2183990478515625, -0.195037841796875, -0.1716766357421875, -0.1483154296875, -0.1249542236328125, -0.101593017578125, -0.0782318115234375, -0.05487060546875, -0.0315093994140625, -0.008148193359375, 0.0152130126953125, 0.03857421875, 0.0619354248046875, 0.085296630859375, 0.1086578369140625, 0.13201904296875, 0.1553802490234375, 0.178741455078125, 0.2021026611328125, 0.2254638671875, 0.2488250732421875, 0.272186279296875, 0.2955474853515625, 0.31890869140625, 0.3422698974609375, 0.365631103515625, 0.3889923095703125, 0.412353515625, 0.4357147216796875, 0.459075927734375, 0.4824371337890625, 0.50579833984375, 0.5291595458984375, 0.552520751953125, 0.5758819580078125, 0.5992431640625, 0.6226043701171875, 0.645965576171875, 0.6693267822265625, 0.69268798828125, 0.7160491943359375, 0.739410400390625, 0.7627716064453125, 0.7861328125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 12.0, 6.0, 17.0, 15.0, 16.0, 19.0, 39.0, 33.0, 43.0, 53.0, 73.0, 90.0, 85.0, 93.0, 73.0, 62.0, 60.0, 48.0, 39.0, 18.0, 16.0, 11.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14349937438964844, -0.13831710815429688, -0.1331348419189453, -0.12795257568359375, -0.12277030944824219, -0.11758804321289062, -0.11240577697753906, -0.1072235107421875, -0.10204124450683594, -0.09685897827148438, -0.09167671203613281, -0.08649444580078125, -0.08131217956542969, -0.07612991333007812, -0.07094764709472656, -0.065765380859375, -0.06058311462402344, -0.055400848388671875, -0.05021858215332031, -0.04503631591796875, -0.03985404968261719, -0.034671783447265625, -0.029489517211914062, -0.0243072509765625, -0.019124984741210938, -0.013942718505859375, -0.008760452270507812, -0.00357818603515625, 0.0016040802001953125, 0.006786346435546875, 0.011968612670898438, 0.01715087890625, 0.022333145141601562, 0.027515411376953125, 0.03269767761230469, 0.03787994384765625, 0.04306221008300781, 0.048244476318359375, 0.05342674255371094, 0.0586090087890625, 0.06379127502441406, 0.06897354125976562, 0.07415580749511719, 0.07933807373046875, 0.08452033996582031, 0.08970260620117188, 0.09488487243652344, 0.100067138671875, 0.10524940490722656, 0.11043167114257812, 0.11561393737792969, 0.12079620361328125, 0.1259784698486328, 0.13116073608398438, 0.13634300231933594, 0.1415252685546875, 0.14670753479003906, 0.15188980102539062, 0.1570720672607422, 0.16225433349609375, 0.1674365997314453, 0.17261886596679688, 0.17780113220214844, 0.1829833984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 8.0, 6.0, 14.0, 10.0, 18.0, 27.0, 31.0, 43.0, 58.0, 60.0, 95.0, 121.0, 171.0, 354.0, 1555.0, 12829.0, 849159.0, 176536.0, 5651.0, 878.0, 262.0, 157.0, 129.0, 82.0, 46.0, 41.0, 43.0, 26.0, 28.0, 11.0, 19.0, 15.0, 8.0, 6.0, 5.0, 10.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.53515625, -2.45794677734375, -2.3807373046875, -2.30352783203125, -2.226318359375, -2.14910888671875, -2.0718994140625, -1.99468994140625, -1.91748046875, -1.84027099609375, -1.7630615234375, -1.68585205078125, -1.608642578125, -1.53143310546875, -1.4542236328125, -1.37701416015625, -1.2998046875, -1.22259521484375, -1.1453857421875, -1.06817626953125, -0.990966796875, -0.91375732421875, -0.8365478515625, -0.75933837890625, -0.68212890625, -0.60491943359375, -0.5277099609375, -0.45050048828125, -0.373291015625, -0.29608154296875, -0.2188720703125, -0.14166259765625, -0.064453125, 0.01275634765625, 0.0899658203125, 0.16717529296875, 0.244384765625, 0.32159423828125, 0.3988037109375, 0.47601318359375, 0.55322265625, 0.63043212890625, 0.7076416015625, 0.78485107421875, 0.862060546875, 0.93927001953125, 1.0164794921875, 1.09368896484375, 1.1708984375, 1.24810791015625, 1.3253173828125, 1.40252685546875, 1.479736328125, 1.55694580078125, 1.6341552734375, 1.71136474609375, 1.78857421875, 1.86578369140625, 1.9429931640625, 2.02020263671875, 2.097412109375, 2.17462158203125, 2.2518310546875, 2.32904052734375, 2.40625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 13.0, 22.0, 69.0, 168.0, 420.0, 187.0, 70.0, 34.0, 15.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123091459274292, -3.029902696609497, -2.936713933944702, -2.8435251712799072, -2.750336170196533, -2.6571474075317383, -2.5639586448669434, -2.4707698822021484, -2.3775811195373535, -2.2843923568725586, -2.1912035942077637, -2.0980148315429688, -2.004826068878174, -1.9116371870040894, -1.8184483051300049, -1.72525954246521, -1.632070779800415, -1.5388820171356201, -1.4456932544708252, -1.3525043725967407, -1.2593156099319458, -1.1661268472671509, -1.0729379653930664, -0.9797492027282715, -0.8865604400634766, -0.7933716773986816, -0.7001828551292419, -0.6069940328598022, -0.5138052701950073, -0.42061647772789, -0.3274276852607727, -0.234238862991333, -0.1410503387451172, -0.04786154627799988, 0.04532724618911743, 0.13851603865623474, 0.23170483112335205, 0.32489362359046936, 0.41808241605758667, 0.5112712383270264, 0.6044600009918213, 0.6976487636566162, 0.7908375859260559, 0.8840264081954956, 0.9772151708602905, 1.0704039335250854, 1.16359281539917, 1.2567815780639648, 1.3499703407287598, 1.4431591033935547, 1.5363478660583496, 1.629536747932434, 1.722725510597229, 1.815914273262024, 1.9091031551361084, 2.0022919178009033, 2.0954806804656982, 2.188669443130493, 2.281858205795288, 2.375046968460083, 2.468235969543457, 2.561424732208252, 2.654613494873047, 2.747802257537842, 2.8409910202026367]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 3.0, 9.0, 14.0, 12.0, 21.0, 28.0, 27.0, 50.0, 31.0, 42.0, 47.0, 48.0, 66.0, 46.0, 59.0, 76.0, 54.0, 49.0, 42.0, 48.0, 40.0, 36.0, 28.0, 23.0, 17.0, 18.0, 20.0, 13.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.011688232421875, -0.9810954928398132, -0.9505027532577515, -0.9199100136756897, -0.8893172740936279, -0.8587245345115662, -0.8281317949295044, -0.7975390553474426, -0.7669463157653809, -0.7363535761833191, -0.7057608366012573, -0.6751680970191956, -0.6445753574371338, -0.613982617855072, -0.5833898782730103, -0.5527971386909485, -0.5222043991088867, -0.49161165952682495, -0.4610189199447632, -0.4304261803627014, -0.39983344078063965, -0.3692407011985779, -0.3386479616165161, -0.30805522203445435, -0.2774624228477478, -0.24686968326568604, -0.21627694368362427, -0.1856842041015625, -0.15509146451950073, -0.12449871003627777, -0.093905970454216, -0.06331323087215424, -0.03272050619125366, -0.0021277647465467453, 0.02846497669816017, 0.05905772000551224, 0.089650459587574, 0.12024320662021637, 0.15083594620227814, 0.1814286857843399, 0.21202142536640167, 0.24261416494846344, 0.2732069194316864, 0.30379965901374817, 0.33439239859580994, 0.3649851381778717, 0.39557787775993347, 0.42617061734199524, 0.456763356924057, 0.4873560965061188, 0.5179488658905029, 0.5485416054725647, 0.5791343450546265, 0.6097270846366882, 0.64031982421875, 0.6709125638008118, 0.7015053033828735, 0.7320980429649353, 0.7626907825469971, 0.7932835221290588, 0.8238762617111206, 0.8544690012931824, 0.8850617408752441, 0.9156544804573059, 0.9462472200393677]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 11.0, 10.0, 10.0, 8.0, 19.0, 22.0, 25.0, 20.0, 18.0, 29.0, 28.0, 29.0, 37.0, 39.0, 43.0, 45.0, 44.0, 36.0, 41.0, 56.0, 38.0, 46.0, 29.0, 32.0, 32.0, 27.0, 30.0, 31.0, 30.0, 22.0, 15.0, 22.0, 17.0, 8.0, 8.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.728515625, -0.7051010131835938, -0.6816864013671875, -0.6582717895507812, -0.634857177734375, -0.6114425659179688, -0.5880279541015625, -0.5646133422851562, -0.54119873046875, -0.5177841186523438, -0.4943695068359375, -0.47095489501953125, -0.447540283203125, -0.42412567138671875, -0.4007110595703125, -0.37729644775390625, -0.3538818359375, -0.33046722412109375, -0.3070526123046875, -0.28363800048828125, -0.260223388671875, -0.23680877685546875, -0.2133941650390625, -0.18997955322265625, -0.16656494140625, -0.14315032958984375, -0.1197357177734375, -0.09632110595703125, -0.072906494140625, -0.04949188232421875, -0.0260772705078125, -0.00266265869140625, 0.020751953125, 0.04416656494140625, 0.0675811767578125, 0.09099578857421875, 0.114410400390625, 0.13782501220703125, 0.1612396240234375, 0.18465423583984375, 0.20806884765625, 0.23148345947265625, 0.2548980712890625, 0.27831268310546875, 0.301727294921875, 0.32514190673828125, 0.3485565185546875, 0.37197113037109375, 0.3953857421875, 0.41880035400390625, 0.4422149658203125, 0.46562957763671875, 0.489044189453125, 0.5124588012695312, 0.5358734130859375, 0.5592880249023438, 0.58270263671875, 0.6061172485351562, 0.6295318603515625, 0.6529464721679688, 0.676361083984375, 0.6997756958007812, 0.7231903076171875, 0.7466049194335938, 0.77001953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 7.0, 15.0, 29.0, 43.0, 55.0, 72.0, 112.0, 129.0, 185.0, 274.0, 443.0, 622.0, 1015.0, 1688.0, 2751.0, 4800.0, 8589.0, 15805.0, 31266.0, 64796.0, 134919.0, 241006.0, 251144.0, 145474.0, 70452.0, 34012.0, 16913.0, 8908.0, 5084.0, 2884.0, 1742.0, 1119.0, 696.0, 486.0, 325.0, 202.0, 161.0, 111.0, 82.0, 32.0, 28.0, 16.0, 13.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.833038330078125, -0.80621337890625, -0.779388427734375, -0.7525634765625, -0.725738525390625, -0.69891357421875, -0.672088623046875, -0.645263671875, -0.618438720703125, -0.59161376953125, -0.564788818359375, -0.5379638671875, -0.511138916015625, -0.48431396484375, -0.457489013671875, -0.4306640625, -0.403839111328125, -0.37701416015625, -0.350189208984375, -0.3233642578125, -0.296539306640625, -0.26971435546875, -0.242889404296875, -0.216064453125, -0.189239501953125, -0.16241455078125, -0.135589599609375, -0.1087646484375, -0.081939697265625, -0.05511474609375, -0.028289794921875, -0.00146484375, 0.025360107421875, 0.05218505859375, 0.079010009765625, 0.1058349609375, 0.132659912109375, 0.15948486328125, 0.186309814453125, 0.213134765625, 0.239959716796875, 0.26678466796875, 0.293609619140625, 0.3204345703125, 0.347259521484375, 0.37408447265625, 0.400909423828125, 0.427734375, 0.454559326171875, 0.48138427734375, 0.508209228515625, 0.5350341796875, 0.561859130859375, 0.58868408203125, 0.615509033203125, 0.642333984375, 0.669158935546875, 0.69598388671875, 0.722808837890625, 0.7496337890625, 0.776458740234375, 0.80328369140625, 0.830108642578125, 0.85693359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 12.0, 9.0, 10.0, 3.0, 13.0, 19.0, 16.0, 29.0, 18.0, 35.0, 35.0, 31.0, 48.0, 47.0, 62.0, 77.0, 118.0, 237.0, 1343.0, 278.0, 124.0, 75.0, 60.0, 48.0, 39.0, 43.0, 36.0, 32.0, 24.0, 23.0, 17.0, 21.0, 12.0, 11.0, 13.0, 8.0, 2.0, 6.0, 2.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.928375244140625, -2.82940673828125, -2.730438232421875, -2.6314697265625, -2.532501220703125, -2.43353271484375, -2.334564208984375, -2.235595703125, -2.136627197265625, -2.03765869140625, -1.938690185546875, -1.8397216796875, -1.740753173828125, -1.64178466796875, -1.542816162109375, -1.44384765625, -1.344879150390625, -1.24591064453125, -1.146942138671875, -1.0479736328125, -0.949005126953125, -0.85003662109375, -0.751068115234375, -0.652099609375, -0.553131103515625, -0.45416259765625, -0.355194091796875, -0.2562255859375, -0.157257080078125, -0.05828857421875, 0.040679931640625, 0.1396484375, 0.238616943359375, 0.33758544921875, 0.436553955078125, 0.5355224609375, 0.634490966796875, 0.73345947265625, 0.832427978515625, 0.931396484375, 1.030364990234375, 1.12933349609375, 1.228302001953125, 1.3272705078125, 1.426239013671875, 1.52520751953125, 1.624176025390625, 1.72314453125, 1.822113037109375, 1.92108154296875, 2.020050048828125, 2.1190185546875, 2.217987060546875, 2.31695556640625, 2.415924072265625, 2.514892578125, 2.613861083984375, 2.71282958984375, 2.811798095703125, 2.9107666015625, 3.009735107421875, 3.10870361328125, 3.207672119140625, 3.306640625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 14.0, 20.0, 37.0, 48.0, 75.0, 97.0, 124.0, 182.0, 260.0, 421.0, 584.0, 880.0, 1239.0, 1890.0, 2877.0, 4601.0, 8254.0, 19370.0, 106836.0, 2439924.0, 494116.0, 35411.0, 11747.0, 5978.0, 3565.0, 2277.0, 1501.0, 1047.0, 741.0, 475.0, 336.0, 209.0, 151.0, 114.0, 92.0, 55.0, 42.0, 24.0, 21.0, 12.0, 10.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.33984375, -5.17669677734375, -5.0135498046875, -4.85040283203125, -4.687255859375, -4.52410888671875, -4.3609619140625, -4.19781494140625, -4.03466796875, -3.87152099609375, -3.7083740234375, -3.54522705078125, -3.382080078125, -3.21893310546875, -3.0557861328125, -2.89263916015625, -2.7294921875, -2.56634521484375, -2.4031982421875, -2.24005126953125, -2.076904296875, -1.91375732421875, -1.7506103515625, -1.58746337890625, -1.42431640625, -1.26116943359375, -1.0980224609375, -0.93487548828125, -0.771728515625, -0.60858154296875, -0.4454345703125, -0.28228759765625, -0.119140625, 0.04400634765625, 0.2071533203125, 0.37030029296875, 0.533447265625, 0.69659423828125, 0.8597412109375, 1.02288818359375, 1.18603515625, 1.34918212890625, 1.5123291015625, 1.67547607421875, 1.838623046875, 2.00177001953125, 2.1649169921875, 2.32806396484375, 2.4912109375, 2.65435791015625, 2.8175048828125, 2.98065185546875, 3.143798828125, 3.30694580078125, 3.4700927734375, 3.63323974609375, 3.79638671875, 3.95953369140625, 4.1226806640625, 4.28582763671875, 4.448974609375, 4.61212158203125, 4.7752685546875, 4.93841552734375, 5.1015625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 11.0, 25.0, 34.0, 92.0, 186.0, 277.0, 207.0, 105.0, 46.0, 17.0, 6.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.837425231933594, -10.219122886657715, -9.600820541381836, -8.98251724243164, -8.364214897155762, -7.745912551879883, -7.127609729766846, -6.509306907653809, -5.89100456237793, -5.272702217102051, -4.654399394989014, -4.036096572875977, -3.4177942276000977, -2.7994916439056396, -2.1811890602111816, -1.5628862380981445, -0.9445838928222656, -0.3262813091278076, 0.2920212745666504, 0.9103238582611084, 1.5286264419555664, 2.1469290256500244, 2.7652316093444824, 3.3835344314575195, 4.001836776733398, 4.620139122009277, 5.2384419441223145, 5.856744766235352, 6.4750471115112305, 7.093349456787109, 7.7116522789001465, 8.329955101013184, 8.94825553894043, 9.566557884216309, 10.184860229492188, 10.803163528442383, 11.421465873718262, 12.03976821899414, 12.658071517944336, 13.276373863220215, 13.894676208496094, 14.512978553771973, 15.131280899047852, 15.749584197998047, 16.36788558959961, 16.986188888549805, 17.6044921875, 18.222793579101562, 18.841096878051758, 19.459400177001953, 20.077701568603516, 20.69600486755371, 21.314308166503906, 21.93260955810547, 22.550912857055664, 23.16921615600586, 23.787517547607422, 24.405820846557617, 25.02412223815918, 25.642425537109375, 26.260726928710938, 26.879030227661133, 27.497333526611328, 28.11563491821289, 28.733938217163086]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 9.0, 8.0, 7.0, 15.0, 8.0, 14.0, 16.0, 17.0, 26.0, 33.0, 29.0, 36.0, 33.0, 46.0, 39.0, 43.0, 47.0, 49.0, 42.0, 54.0, 45.0, 39.0, 45.0, 52.0, 31.0, 32.0, 19.0, 25.0, 23.0, 27.0, 24.0, 11.0, 13.0, 11.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.091780662536621, -10.756503105163574, -10.421225547790527, -10.08594799041748, -9.750670433044434, -9.415392875671387, -9.08011531829834, -8.744837760925293, -8.409560203552246, -8.0742826461792, -7.739005088806152, -7.4037275314331055, -7.068449974060059, -6.733172416687012, -6.397894859313965, -6.062617301940918, -5.727339744567871, -5.392062187194824, -5.056784629821777, -4.7215070724487305, -4.386229515075684, -4.050951957702637, -3.71567440032959, -3.380396842956543, -3.045119285583496, -2.709841728210449, -2.3745641708374023, -2.0392866134643555, -1.7040090560913086, -1.3687314987182617, -1.0334539413452148, -0.698176383972168, -0.3628978729248047, -0.027620315551757812, 0.30765724182128906, 0.6429347991943359, 0.9782123565673828, 1.3134899139404297, 1.6487674713134766, 1.9840450286865234, 2.3193225860595703, 2.654600143432617, 2.989877700805664, 3.325155258178711, 3.660432815551758, 3.9957103729248047, 4.330987930297852, 4.666265487670898, 5.001543045043945, 5.336820602416992, 5.672098159790039, 6.007375717163086, 6.342653274536133, 6.67793083190918, 7.013208389282227, 7.348485946655273, 7.68376350402832, 8.019041061401367, 8.354318618774414, 8.689596176147461, 9.024873733520508, 9.360151290893555, 9.695428848266602, 10.030706405639648, 10.365983963012695]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 9.0, 19.0, 20.0, 18.0, 23.0, 21.0, 18.0, 28.0, 26.0, 42.0, 41.0, 37.0, 36.0, 51.0, 36.0, 53.0, 41.0, 51.0, 46.0, 46.0, 27.0, 36.0, 35.0, 35.0, 31.0, 24.0, 22.0, 18.0, 13.0, 16.0, 10.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.84814453125, -0.8229598999023438, -0.7977752685546875, -0.7725906372070312, -0.747406005859375, -0.7222213745117188, -0.6970367431640625, -0.6718521118164062, -0.64666748046875, -0.6214828491210938, -0.5962982177734375, -0.5711135864257812, -0.545928955078125, -0.5207443237304688, -0.4955596923828125, -0.47037506103515625, -0.4451904296875, -0.42000579833984375, -0.3948211669921875, -0.36963653564453125, -0.344451904296875, -0.31926727294921875, -0.2940826416015625, -0.26889801025390625, -0.24371337890625, -0.21852874755859375, -0.1933441162109375, -0.16815948486328125, -0.142974853515625, -0.11779022216796875, -0.0926055908203125, -0.06742095947265625, -0.042236328125, -0.01705169677734375, 0.0081329345703125, 0.03331756591796875, 0.058502197265625, 0.08368682861328125, 0.1088714599609375, 0.13405609130859375, 0.15924072265625, 0.18442535400390625, 0.2096099853515625, 0.23479461669921875, 0.259979248046875, 0.28516387939453125, 0.3103485107421875, 0.33553314208984375, 0.3607177734375, 0.38590240478515625, 0.4110870361328125, 0.43627166748046875, 0.461456298828125, 0.48664093017578125, 0.5118255615234375, 0.5370101928710938, 0.56219482421875, 0.5873794555664062, 0.6125640869140625, 0.6377487182617188, 0.662933349609375, 0.6881179809570312, 0.7133026123046875, 0.7384872436523438, 0.763671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 12.0, 6.0, 11.0, 14.0, 21.0, 20.0, 37.0, 38.0, 56.0, 72.0, 106.0, 158.0, 215.0, 375.0, 646.0, 1144.0, 2439.0, 5458.0, 12773.0, 33926.0, 115156.0, 977435.0, 2678846.0, 269561.0, 59791.0, 20303.0, 8006.0, 3651.0, 1724.0, 868.0, 457.0, 277.0, 182.0, 126.0, 82.0, 61.0, 57.0, 35.0, 24.0, 14.0, 16.0, 10.0, 12.0, 13.0, 12.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.890625, -2.80621337890625, -2.7218017578125, -2.63739013671875, -2.552978515625, -2.46856689453125, -2.3841552734375, -2.29974365234375, -2.21533203125, -2.13092041015625, -2.0465087890625, -1.96209716796875, -1.877685546875, -1.79327392578125, -1.7088623046875, -1.62445068359375, -1.5400390625, -1.45562744140625, -1.3712158203125, -1.28680419921875, -1.202392578125, -1.11798095703125, -1.0335693359375, -0.94915771484375, -0.86474609375, -0.78033447265625, -0.6959228515625, -0.61151123046875, -0.527099609375, -0.44268798828125, -0.3582763671875, -0.27386474609375, -0.189453125, -0.10504150390625, -0.0206298828125, 0.06378173828125, 0.148193359375, 0.23260498046875, 0.3170166015625, 0.40142822265625, 0.48583984375, 0.57025146484375, 0.6546630859375, 0.73907470703125, 0.823486328125, 0.90789794921875, 0.9923095703125, 1.07672119140625, 1.1611328125, 1.24554443359375, 1.3299560546875, 1.41436767578125, 1.498779296875, 1.58319091796875, 1.6676025390625, 1.75201416015625, 1.83642578125, 1.92083740234375, 2.0052490234375, 2.08966064453125, 2.174072265625, 2.25848388671875, 2.3428955078125, 2.42730712890625, 2.51171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 14.0, 16.0, 17.0, 35.0, 36.0, 46.0, 64.0, 84.0, 142.0, 190.0, 325.0, 493.0, 664.0, 628.0, 433.0, 258.0, 181.0, 129.0, 84.0, 61.0, 44.0, 31.0, 34.0, 17.0, 13.0, 11.0, 4.0, 0.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.234466552734375, -2.13690185546875, -2.039337158203125, -1.9417724609375, -1.844207763671875, -1.74664306640625, -1.649078369140625, -1.551513671875, -1.453948974609375, -1.35638427734375, -1.258819580078125, -1.1612548828125, -1.063690185546875, -0.96612548828125, -0.868560791015625, -0.77099609375, -0.673431396484375, -0.57586669921875, -0.478302001953125, -0.3807373046875, -0.283172607421875, -0.18560791015625, -0.088043212890625, 0.009521484375, 0.107086181640625, 0.20465087890625, 0.302215576171875, 0.3997802734375, 0.497344970703125, 0.59490966796875, 0.692474365234375, 0.7900390625, 0.887603759765625, 0.98516845703125, 1.082733154296875, 1.1802978515625, 1.277862548828125, 1.37542724609375, 1.472991943359375, 1.570556640625, 1.668121337890625, 1.76568603515625, 1.863250732421875, 1.9608154296875, 2.058380126953125, 2.15594482421875, 2.253509521484375, 2.35107421875, 2.448638916015625, 2.54620361328125, 2.643768310546875, 2.7413330078125, 2.838897705078125, 2.93646240234375, 3.034027099609375, 3.131591796875, 3.229156494140625, 3.32672119140625, 3.424285888671875, 3.5218505859375, 3.619415283203125, 3.71697998046875, 3.814544677734375, 3.912109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 11.0, 17.0, 8.0, 15.0, 8.0, 17.0, 37.0, 50.0, 66.0, 130.0, 189.0, 305.0, 630.0, 1157.0, 2445.0, 5030.0, 11419.0, 28302.0, 79707.0, 298029.0, 2020611.0, 1412923.0, 225708.0, 64939.0, 23794.0, 9840.0, 4430.0, 2061.0, 1052.0, 535.0, 281.0, 177.0, 114.0, 51.0, 46.0, 36.0, 43.0, 23.0, 13.0, 5.0, 9.0, 3.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.02734375, -3.901123046875, -3.77490234375, -3.648681640625, -3.5224609375, -3.396240234375, -3.27001953125, -3.143798828125, -3.017578125, -2.891357421875, -2.76513671875, -2.638916015625, -2.5126953125, -2.386474609375, -2.26025390625, -2.134033203125, -2.0078125, -1.881591796875, -1.75537109375, -1.629150390625, -1.5029296875, -1.376708984375, -1.25048828125, -1.124267578125, -0.998046875, -0.871826171875, -0.74560546875, -0.619384765625, -0.4931640625, -0.366943359375, -0.24072265625, -0.114501953125, 0.01171875, 0.137939453125, 0.26416015625, 0.390380859375, 0.5166015625, 0.642822265625, 0.76904296875, 0.895263671875, 1.021484375, 1.147705078125, 1.27392578125, 1.400146484375, 1.5263671875, 1.652587890625, 1.77880859375, 1.905029296875, 2.03125, 2.157470703125, 2.28369140625, 2.409912109375, 2.5361328125, 2.662353515625, 2.78857421875, 2.914794921875, 3.041015625, 3.167236328125, 3.29345703125, 3.419677734375, 3.5458984375, 3.672119140625, 3.79833984375, 3.924560546875, 4.05078125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 9.0, 20.0, 44.0, 69.0, 99.0, 122.0, 145.0, 161.0, 114.0, 93.0, 56.0, 36.0, 13.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96290111541748, -15.368990898132324, -14.775080680847168, -14.181170463562012, -13.587259292602539, -12.993349075317383, -12.399438858032227, -11.80552864074707, -11.211618423461914, -10.617708206176758, -10.023797988891602, -9.429887771606445, -8.835977554321289, -8.242067337036133, -7.64815616607666, -7.054245948791504, -6.460335731506348, -5.866425514221191, -5.272515296936035, -4.678604602813721, -4.0846943855285645, -3.490784168243408, -2.896873712539673, -2.3029632568359375, -1.7090530395507812, -1.1151427030563354, -0.5212323665618896, 0.07267796993255615, 0.666588306427002, 1.2604985237121582, 1.8544089794158936, 2.448319435119629, 3.0422306060791016, 3.636140823364258, 4.230051040649414, 4.8239617347717285, 5.417871952056885, 6.011782169342041, 6.6056928634643555, 7.199603080749512, 7.793513298034668, 8.387423515319824, 8.98133373260498, 9.575243949890137, 10.16915512084961, 10.763065338134766, 11.356975555419922, 11.950885772705078, 12.544795989990234, 13.13870620727539, 13.732616424560547, 14.326526641845703, 14.92043685913086, 15.514347076416016, 16.108257293701172, 16.702167510986328, 17.296077728271484, 17.88998794555664, 18.483898162841797, 19.077808380126953, 19.67171859741211, 20.265628814697266, 20.859539031982422, 21.453449249267578, 22.047361373901367]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 7.0, 11.0, 5.0, 12.0, 16.0, 16.0, 13.0, 23.0, 24.0, 31.0, 34.0, 41.0, 35.0, 31.0, 38.0, 42.0, 46.0, 35.0, 37.0, 33.0, 42.0, 30.0, 49.0, 39.0, 26.0, 31.0, 32.0, 25.0, 31.0, 19.0, 23.0, 16.0, 24.0, 19.0, 9.0, 7.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.851471900939941, -6.5974884033203125, -6.343504428863525, -6.0895209312438965, -5.835537433624268, -5.5815534591674805, -5.327569961547852, -5.073586463928223, -4.819602966308594, -4.565619468688965, -4.311635494232178, -4.057651996612549, -3.80366849899292, -3.549684762954712, -3.295701026916504, -3.041717529296875, -2.787733554840088, -2.53374981880188, -2.279766321182251, -2.025782585144043, -1.7717989683151245, -1.517815351486206, -1.263831615447998, -1.0098479986190796, -0.7558643817901611, -0.5018807649612427, -0.24789708852767944, 0.006086587905883789, 0.26007020473480225, 0.5140538215637207, 0.7680375576019287, 1.0220211744308472, 1.2760047912597656, 1.529988408088684, 1.7839720249176025, 2.0379557609558105, 2.2919392585754395, 2.5459229946136475, 2.7999067306518555, 3.0538902282714844, 3.3078739643096924, 3.5618577003479004, 3.8158411979675293, 4.069825172424316, 4.323808670043945, 4.577792167663574, 4.831775665283203, 5.08575963973999, 5.339743137359619, 5.593726634979248, 5.847710609436035, 6.101694107055664, 6.355677604675293, 6.609661102294922, 6.863645076751709, 7.117628574371338, 7.371612548828125, 7.625596046447754, 7.879580020904541, 8.133563995361328, 8.387547492980957, 8.641530990600586, 8.895514488220215, 9.149497985839844, 9.403481483459473]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 3.0, 7.0, 12.0, 15.0, 9.0, 9.0, 16.0, 24.0, 21.0, 14.0, 30.0, 24.0, 25.0, 31.0, 38.0, 42.0, 44.0, 41.0, 43.0, 46.0, 41.0, 46.0, 39.0, 44.0, 44.0, 40.0, 33.0, 30.0, 34.0, 24.0, 18.0, 19.0, 14.0, 8.0, 19.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7783203125, -0.75238037109375, -0.7264404296875, -0.70050048828125, -0.674560546875, -0.64862060546875, -0.6226806640625, -0.59674072265625, -0.57080078125, -0.54486083984375, -0.5189208984375, -0.49298095703125, -0.467041015625, -0.44110107421875, -0.4151611328125, -0.38922119140625, -0.36328125, -0.33734130859375, -0.3114013671875, -0.28546142578125, -0.259521484375, -0.23358154296875, -0.2076416015625, -0.18170166015625, -0.15576171875, -0.12982177734375, -0.1038818359375, -0.07794189453125, -0.052001953125, -0.02606201171875, -0.0001220703125, 0.02581787109375, 0.0517578125, 0.07769775390625, 0.1036376953125, 0.12957763671875, 0.155517578125, 0.18145751953125, 0.2073974609375, 0.23333740234375, 0.25927734375, 0.28521728515625, 0.3111572265625, 0.33709716796875, 0.363037109375, 0.38897705078125, 0.4149169921875, 0.44085693359375, 0.466796875, 0.49273681640625, 0.5186767578125, 0.54461669921875, 0.570556640625, 0.59649658203125, 0.6224365234375, 0.64837646484375, 0.67431640625, 0.70025634765625, 0.7261962890625, 0.75213623046875, 0.778076171875, 0.80401611328125, 0.8299560546875, 0.85589599609375, 0.8818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 18.0, 21.0, 31.0, 58.0, 82.0, 113.0, 184.0, 259.0, 444.0, 631.0, 954.0, 1429.0, 2164.0, 3414.0, 5425.0, 8236.0, 12632.0, 19416.0, 29741.0, 45241.0, 66463.0, 92575.0, 119479.0, 136570.0, 132476.0, 111489.0, 84564.0, 59404.0, 39763.0, 26397.0, 17096.0, 11185.0, 7032.0, 4720.0, 2951.0, 2027.0, 1289.0, 912.0, 556.0, 349.0, 247.0, 183.0, 108.0, 64.0, 44.0, 24.0, 27.0, 18.0, 14.0, 12.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.58642578125, -0.5667800903320312, -0.5471343994140625, -0.5274887084960938, -0.507843017578125, -0.48819732666015625, -0.4685516357421875, -0.44890594482421875, -0.42926025390625, -0.40961456298828125, -0.3899688720703125, -0.37032318115234375, -0.350677490234375, -0.33103179931640625, -0.3113861083984375, -0.29174041748046875, -0.2720947265625, -0.25244903564453125, -0.2328033447265625, -0.21315765380859375, -0.193511962890625, -0.17386627197265625, -0.1542205810546875, -0.13457489013671875, -0.11492919921875, -0.09528350830078125, -0.0756378173828125, -0.05599212646484375, -0.036346435546875, -0.01670074462890625, 0.0029449462890625, 0.02259063720703125, 0.042236328125, 0.06188201904296875, 0.0815277099609375, 0.10117340087890625, 0.120819091796875, 0.14046478271484375, 0.1601104736328125, 0.17975616455078125, 0.19940185546875, 0.21904754638671875, 0.2386932373046875, 0.25833892822265625, 0.277984619140625, 0.29763031005859375, 0.3172760009765625, 0.33692169189453125, 0.3565673828125, 0.37621307373046875, 0.3958587646484375, 0.41550445556640625, 0.435150146484375, 0.45479583740234375, 0.4744415283203125, 0.49408721923828125, 0.51373291015625, 0.5333786010742188, 0.5530242919921875, 0.5726699829101562, 0.592315673828125, 0.6119613647460938, 0.6316070556640625, 0.6512527465820312, 0.6708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 7.0, 13.0, 14.0, 9.0, 11.0, 13.0, 29.0, 18.0, 19.0, 24.0, 34.0, 27.0, 32.0, 39.0, 32.0, 32.0, 31.0, 36.0, 42.0, 1058.0, 40.0, 27.0, 51.0, 29.0, 48.0, 36.0, 30.0, 26.0, 19.0, 26.0, 24.0, 31.0, 19.0, 13.0, 17.0, 8.0, 10.0, 6.0, 7.0, 5.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74951171875, -0.7255325317382812, -0.7015533447265625, -0.6775741577148438, -0.653594970703125, -0.6296157836914062, -0.6056365966796875, -0.5816574096679688, -0.55767822265625, -0.5336990356445312, -0.5097198486328125, -0.48574066162109375, -0.461761474609375, -0.43778228759765625, -0.4138031005859375, -0.38982391357421875, -0.3658447265625, -0.34186553955078125, -0.3178863525390625, -0.29390716552734375, -0.269927978515625, -0.24594879150390625, -0.2219696044921875, -0.19799041748046875, -0.17401123046875, -0.15003204345703125, -0.1260528564453125, -0.10207366943359375, -0.078094482421875, -0.05411529541015625, -0.0301361083984375, -0.00615692138671875, 0.017822265625, 0.04180145263671875, 0.0657806396484375, 0.08975982666015625, 0.113739013671875, 0.13771820068359375, 0.1616973876953125, 0.18567657470703125, 0.20965576171875, 0.23363494873046875, 0.2576141357421875, 0.28159332275390625, 0.305572509765625, 0.32955169677734375, 0.3535308837890625, 0.37751007080078125, 0.4014892578125, 0.42546844482421875, 0.4494476318359375, 0.47342681884765625, 0.497406005859375, 0.5213851928710938, 0.5453643798828125, 0.5693435668945312, 0.59332275390625, 0.6173019409179688, 0.6412811279296875, 0.6652603149414062, 0.689239501953125, 0.7132186889648438, 0.7371978759765625, 0.7611770629882812, 0.78515625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 9.0, 9.0, 14.0, 32.0, 37.0, 52.0, 101.0, 121.0, 223.0, 324.0, 469.0, 721.0, 1018.0, 1628.0, 2409.0, 3501.0, 5202.0, 8208.0, 12561.0, 20015.0, 40649.0, 185192.0, 1544069.0, 174861.0, 40004.0, 20008.0, 12235.0, 7756.0, 5101.0, 3461.0, 2401.0, 1550.0, 1056.0, 697.0, 489.0, 318.0, 211.0, 126.0, 91.0, 71.0, 42.0, 33.0, 13.0, 15.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.86669921875, -0.8415679931640625, -0.816436767578125, -0.7913055419921875, -0.76617431640625, -0.7410430908203125, -0.715911865234375, -0.6907806396484375, -0.6656494140625, -0.6405181884765625, -0.615386962890625, -0.5902557373046875, -0.56512451171875, -0.5399932861328125, -0.514862060546875, -0.4897308349609375, -0.464599609375, -0.4394683837890625, -0.414337158203125, -0.3892059326171875, -0.36407470703125, -0.3389434814453125, -0.313812255859375, -0.2886810302734375, -0.2635498046875, -0.2384185791015625, -0.213287353515625, -0.1881561279296875, -0.16302490234375, -0.1378936767578125, -0.112762451171875, -0.0876312255859375, -0.0625, -0.0373687744140625, -0.012237548828125, 0.0128936767578125, 0.03802490234375, 0.0631561279296875, 0.088287353515625, 0.1134185791015625, 0.1385498046875, 0.1636810302734375, 0.188812255859375, 0.2139434814453125, 0.23907470703125, 0.2642059326171875, 0.289337158203125, 0.3144683837890625, 0.339599609375, 0.3647308349609375, 0.389862060546875, 0.4149932861328125, 0.44012451171875, 0.4652557373046875, 0.490386962890625, 0.5155181884765625, 0.5406494140625, 0.5657806396484375, 0.590911865234375, 0.6160430908203125, 0.64117431640625, 0.6663055419921875, 0.691436767578125, 0.7165679931640625, 0.74169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 11.0, 7.0, 5.0, 14.0, 7.0, 17.0, 27.0, 32.0, 31.0, 45.0, 41.0, 43.0, 58.0, 84.0, 86.0, 69.0, 72.0, 72.0, 43.0, 45.0, 33.0, 24.0, 20.0, 19.0, 11.0, 12.0, 11.0, 10.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.125244140625, -0.12112998962402344, -0.11701583862304688, -0.11290168762207031, -0.10878753662109375, -0.10467338562011719, -0.10055923461914062, -0.09644508361816406, -0.0923309326171875, -0.08821678161621094, -0.08410263061523438, -0.07998847961425781, -0.07587432861328125, -0.07176017761230469, -0.06764602661132812, -0.06353187561035156, -0.059417724609375, -0.05530357360839844, -0.051189422607421875, -0.04707527160644531, -0.04296112060546875, -0.03884696960449219, -0.034732818603515625, -0.030618667602539062, -0.0265045166015625, -0.022390365600585938, -0.018276214599609375, -0.014162063598632812, -0.01004791259765625, -0.0059337615966796875, -0.001819610595703125, 0.0022945404052734375, 0.00640869140625, 0.010522842407226562, 0.014636993408203125, 0.018751144409179688, 0.02286529541015625, 0.026979446411132812, 0.031093597412109375, 0.03520774841308594, 0.0393218994140625, 0.04343605041503906, 0.047550201416015625, 0.05166435241699219, 0.05577850341796875, 0.05989265441894531, 0.06400680541992188, 0.06812095642089844, 0.072235107421875, 0.07634925842285156, 0.08046340942382812, 0.08457756042480469, 0.08869171142578125, 0.09280586242675781, 0.09692001342773438, 0.10103416442871094, 0.1051483154296875, 0.10926246643066406, 0.11337661743164062, 0.11749076843261719, 0.12160491943359375, 0.1257190704345703, 0.12983322143554688, 0.13394737243652344, 0.1380615234375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 14.0, 10.0, 11.0, 18.0, 27.0, 24.0, 35.0, 36.0, 60.0, 82.0, 132.0, 188.0, 312.0, 895.0, 5953.0, 161862.0, 855148.0, 20580.0, 1879.0, 445.0, 221.0, 141.0, 113.0, 67.0, 61.0, 38.0, 27.0, 18.0, 23.0, 14.0, 19.0, 11.0, 10.0, 12.0, 7.0, 7.0, 4.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.1171875, -2.055328369140625, -1.99346923828125, -1.931610107421875, -1.8697509765625, -1.807891845703125, -1.74603271484375, -1.684173583984375, -1.622314453125, -1.560455322265625, -1.49859619140625, -1.436737060546875, -1.3748779296875, -1.313018798828125, -1.25115966796875, -1.189300537109375, -1.12744140625, -1.065582275390625, -1.00372314453125, -0.941864013671875, -0.8800048828125, -0.818145751953125, -0.75628662109375, -0.694427490234375, -0.632568359375, -0.570709228515625, -0.50885009765625, -0.446990966796875, -0.3851318359375, -0.323272705078125, -0.26141357421875, -0.199554443359375, -0.1376953125, -0.075836181640625, -0.01397705078125, 0.047882080078125, 0.1097412109375, 0.171600341796875, 0.23345947265625, 0.295318603515625, 0.357177734375, 0.419036865234375, 0.48089599609375, 0.542755126953125, 0.6046142578125, 0.666473388671875, 0.72833251953125, 0.790191650390625, 0.85205078125, 0.913909912109375, 0.97576904296875, 1.037628173828125, 1.0994873046875, 1.161346435546875, 1.22320556640625, 1.285064697265625, 1.346923828125, 1.408782958984375, 1.47064208984375, 1.532501220703125, 1.5943603515625, 1.656219482421875, 1.71807861328125, 1.779937744140625, 1.841796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 22.0, 61.0, 133.0, 251.0, 304.0, 146.0, 47.0, 26.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1922073364257812, -2.1312191486358643, -2.0702309608459473, -2.0092427730560303, -1.9482544660568237, -1.8872662782669067, -1.8262780904769897, -1.7652899026870728, -1.7043017148971558, -1.6433135271072388, -1.5823253393173218, -1.5213370323181152, -1.4603488445281982, -1.3993606567382812, -1.3383724689483643, -1.2773842811584473, -1.2163960933685303, -1.1554079055786133, -1.0944197177886963, -1.0334315299987793, -0.9724432826042175, -0.9114550352096558, -0.8504668474197388, -0.7894786596298218, -0.7284903526306152, -0.6675021648406982, -0.6065139174461365, -0.5455257296562195, -0.4845375418663025, -0.4235493242740631, -0.36256110668182373, -0.30157291889190674, -0.24058473110198975, -0.17959652841091156, -0.11860831826925278, -0.057620108127593994, 0.003368094563484192, 0.06435629725456238, 0.12534451484680176, 0.18633270263671875, 0.24732092022895813, 0.3083091378211975, 0.3692973256111145, 0.4302855432033539, 0.49127376079559326, 0.5522619485855103, 0.6132501363754272, 0.6742383241653442, 0.735226571559906, 0.796214759349823, 0.8572030067443848, 0.9181911945343018, 0.9791793823242188, 1.0401675701141357, 1.1011557579040527, 1.1621439456939697, 1.2231322526931763, 1.2841204404830933, 1.3451086282730103, 1.4060969352722168, 1.4670851230621338, 1.5280733108520508, 1.5890614986419678, 1.6500496864318848, 1.7110378742218018]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 6.0, 12.0, 9.0, 10.0, 11.0, 9.0, 17.0, 11.0, 21.0, 28.0, 25.0, 33.0, 20.0, 32.0, 35.0, 27.0, 31.0, 37.0, 51.0, 45.0, 30.0, 48.0, 46.0, 32.0, 37.0, 27.0, 27.0, 33.0, 19.0, 26.0, 25.0, 25.0, 15.0, 20.0, 26.0, 13.0, 12.0, 6.0, 8.0, 9.0, 9.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.42906856536865234, -0.41569530963897705, -0.40232208371162415, -0.38894882798194885, -0.37557557225227356, -0.36220234632492065, -0.34882909059524536, -0.33545583486557007, -0.3220825791358948, -0.3087093234062195, -0.2953360974788666, -0.2819628417491913, -0.268589586019516, -0.2552163600921631, -0.2418431043624878, -0.2284698486328125, -0.2150966078042984, -0.2017233669757843, -0.188350111246109, -0.1749768704175949, -0.16160361468791962, -0.14823037385940552, -0.13485711812973022, -0.12148387730121613, -0.10811062902212143, -0.09473738074302673, -0.08136413246393204, -0.06799088418483734, -0.054617639631032944, -0.041244395077228546, -0.02787114679813385, -0.014497898519039154, -0.001124650239944458, 0.012248597107827663, 0.025621844455599785, 0.03899509087204933, 0.05236833915114403, 0.06574158370494843, 0.07911483198404312, 0.09248808026313782, 0.10586132854223251, 0.11923457682132721, 0.1326078176498413, 0.1459810733795166, 0.1593543142080307, 0.1727275550365448, 0.1861008107662201, 0.19947406649589539, 0.21284730732440948, 0.22622054815292358, 0.23959380388259888, 0.25296705961227417, 0.2663402855396271, 0.27971354126930237, 0.29308679699897766, 0.30646002292633057, 0.31983327865600586, 0.33320653438568115, 0.34657976031303406, 0.35995301604270935, 0.37332627177238464, 0.38669949769973755, 0.40007275342941284, 0.41344600915908813, 0.4268192648887634]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 7.0, 11.0, 9.0, 11.0, 19.0, 16.0, 12.0, 31.0, 27.0, 28.0, 21.0, 36.0, 30.0, 35.0, 35.0, 49.0, 38.0, 55.0, 55.0, 41.0, 54.0, 45.0, 47.0, 36.0, 33.0, 46.0, 32.0, 17.0, 14.0, 18.0, 13.0, 8.0, 19.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7777786254882812, -0.7508697509765625, -0.7239608764648438, -0.697052001953125, -0.6701431274414062, -0.6432342529296875, -0.6163253784179688, -0.58941650390625, -0.5625076293945312, -0.5355987548828125, -0.5086898803710938, -0.481781005859375, -0.45487213134765625, -0.4279632568359375, -0.40105438232421875, -0.3741455078125, -0.34723663330078125, -0.3203277587890625, -0.29341888427734375, -0.266510009765625, -0.23960113525390625, -0.2126922607421875, -0.18578338623046875, -0.15887451171875, -0.13196563720703125, -0.1050567626953125, -0.07814788818359375, -0.051239013671875, -0.02433013916015625, 0.0025787353515625, 0.02948760986328125, 0.056396484375, 0.08330535888671875, 0.1102142333984375, 0.13712310791015625, 0.164031982421875, 0.19094085693359375, 0.2178497314453125, 0.24475860595703125, 0.27166748046875, 0.29857635498046875, 0.3254852294921875, 0.35239410400390625, 0.379302978515625, 0.40621185302734375, 0.4331207275390625, 0.46002960205078125, 0.4869384765625, 0.5138473510742188, 0.5407562255859375, 0.5676651000976562, 0.594573974609375, 0.6214828491210938, 0.6483917236328125, 0.6753005981445312, 0.70220947265625, 0.7291183471679688, 0.7560272216796875, 0.7829360961914062, 0.809844970703125, 0.8367538452148438, 0.8636627197265625, 0.8905715942382812, 0.91748046875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 8.0, 29.0, 28.0, 31.0, 68.0, 88.0, 134.0, 221.0, 361.0, 613.0, 905.0, 1573.0, 2632.0, 4708.0, 8804.0, 17789.0, 47584.0, 220570.0, 556553.0, 122001.0, 32949.0, 14145.0, 6978.0, 3970.0, 2200.0, 1363.0, 838.0, 499.0, 307.0, 216.0, 135.0, 89.0, 47.0, 27.0, 24.0, 13.0, 15.0, 4.0, 7.0, 5.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.052734375, -1.992950439453125, -1.93316650390625, -1.873382568359375, -1.8135986328125, -1.753814697265625, -1.69403076171875, -1.634246826171875, -1.574462890625, -1.514678955078125, -1.45489501953125, -1.395111083984375, -1.3353271484375, -1.275543212890625, -1.21575927734375, -1.155975341796875, -1.09619140625, -1.036407470703125, -0.97662353515625, -0.916839599609375, -0.8570556640625, -0.797271728515625, -0.73748779296875, -0.677703857421875, -0.617919921875, -0.558135986328125, -0.49835205078125, -0.438568115234375, -0.3787841796875, -0.319000244140625, -0.25921630859375, -0.199432373046875, -0.1396484375, -0.079864501953125, -0.02008056640625, 0.039703369140625, 0.0994873046875, 0.159271240234375, 0.21905517578125, 0.278839111328125, 0.338623046875, 0.398406982421875, 0.45819091796875, 0.517974853515625, 0.5777587890625, 0.637542724609375, 0.69732666015625, 0.757110595703125, 0.81689453125, 0.876678466796875, 0.93646240234375, 0.996246337890625, 1.0560302734375, 1.115814208984375, 1.17559814453125, 1.235382080078125, 1.295166015625, 1.354949951171875, 1.41473388671875, 1.474517822265625, 1.5343017578125, 1.594085693359375, 1.65386962890625, 1.713653564453125, 1.7734375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 5.0, 8.0, 13.0, 13.0, 11.0, 16.0, 22.0, 24.0, 19.0, 25.0, 35.0, 28.0, 32.0, 38.0, 37.0, 57.0, 61.0, 103.0, 142.0, 1422.0, 276.0, 127.0, 80.0, 66.0, 48.0, 59.0, 26.0, 40.0, 24.0, 23.0, 24.0, 17.0, 16.0, 24.0, 15.0, 14.0, 5.0, 11.0, 13.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.162109375, -3.071197509765625, -2.98028564453125, -2.889373779296875, -2.7984619140625, -2.707550048828125, -2.61663818359375, -2.525726318359375, -2.434814453125, -2.343902587890625, -2.25299072265625, -2.162078857421875, -2.0711669921875, -1.980255126953125, -1.88934326171875, -1.798431396484375, -1.70751953125, -1.616607666015625, -1.52569580078125, -1.434783935546875, -1.3438720703125, -1.252960205078125, -1.16204833984375, -1.071136474609375, -0.980224609375, -0.889312744140625, -0.79840087890625, -0.707489013671875, -0.6165771484375, -0.525665283203125, -0.43475341796875, -0.343841552734375, -0.2529296875, -0.162017822265625, -0.07110595703125, 0.019805908203125, 0.1107177734375, 0.201629638671875, 0.29254150390625, 0.383453369140625, 0.474365234375, 0.565277099609375, 0.65618896484375, 0.747100830078125, 0.8380126953125, 0.928924560546875, 1.01983642578125, 1.110748291015625, 1.20166015625, 1.292572021484375, 1.38348388671875, 1.474395751953125, 1.5653076171875, 1.656219482421875, 1.74713134765625, 1.838043212890625, 1.928955078125, 2.019866943359375, 2.11077880859375, 2.201690673828125, 2.2926025390625, 2.383514404296875, 2.47442626953125, 2.565338134765625, 2.65625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 5.0, 8.0, 10.0, 15.0, 18.0, 17.0, 23.0, 33.0, 36.0, 35.0, 79.0, 109.0, 155.0, 317.0, 591.0, 1229.0, 2450.0, 5828.0, 16060.0, 56597.0, 407071.0, 2397243.0, 200157.0, 37258.0, 11767.0, 4407.0, 1977.0, 921.0, 461.0, 265.0, 166.0, 96.0, 64.0, 47.0, 38.0, 30.0, 28.0, 25.0, 13.0, 12.0, 11.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.28515625, -3.173248291015625, -3.06134033203125, -2.949432373046875, -2.8375244140625, -2.725616455078125, -2.61370849609375, -2.501800537109375, -2.389892578125, -2.277984619140625, -2.16607666015625, -2.054168701171875, -1.9422607421875, -1.830352783203125, -1.71844482421875, -1.606536865234375, -1.49462890625, -1.382720947265625, -1.27081298828125, -1.158905029296875, -1.0469970703125, -0.935089111328125, -0.82318115234375, -0.711273193359375, -0.599365234375, -0.487457275390625, -0.37554931640625, -0.263641357421875, -0.1517333984375, -0.039825439453125, 0.07208251953125, 0.183990478515625, 0.2958984375, 0.407806396484375, 0.51971435546875, 0.631622314453125, 0.7435302734375, 0.855438232421875, 0.96734619140625, 1.079254150390625, 1.191162109375, 1.303070068359375, 1.41497802734375, 1.526885986328125, 1.6387939453125, 1.750701904296875, 1.86260986328125, 1.974517822265625, 2.08642578125, 2.198333740234375, 2.31024169921875, 2.422149658203125, 2.5340576171875, 2.645965576171875, 2.75787353515625, 2.869781494140625, 2.981689453125, 3.093597412109375, 3.20550537109375, 3.317413330078125, 3.4293212890625, 3.541229248046875, 3.65313720703125, 3.765045166015625, 3.876953125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 58.0, 290.0, 442.0, 176.0, 39.0, 3.0], "bins": [-55.20594787597656, -54.29047775268555, -53.3750114440918, -52.45954132080078, -51.54407501220703, -50.628604888916016, -49.713134765625, -48.79766845703125, -47.882198333740234, -46.96672821044922, -46.05126190185547, -45.13579177856445, -44.2203254699707, -43.30485534667969, -42.38938903808594, -41.47391891479492, -40.55845260620117, -39.642982482910156, -38.727516174316406, -37.81204605102539, -36.89657974243164, -35.981109619140625, -35.065643310546875, -34.15017318725586, -33.234703063964844, -32.31923294067383, -31.403766632080078, -30.488296508789062, -29.57282829284668, -28.657360076904297, -27.741891860961914, -26.82642364501953, -25.91095542907715, -24.995487213134766, -24.080018997192383, -23.16455078125, -22.249080657958984, -21.3336124420166, -20.41814422607422, -19.502676010131836, -18.587207794189453, -17.67173957824707, -16.756271362304688, -15.840802192687988, -14.925333976745605, -14.009864807128906, -13.094396591186523, -12.17892837524414, -11.263458251953125, -10.347990036010742, -9.432520866394043, -8.51705265045166, -7.601584434509277, -6.686115741729736, -5.770647048950195, -4.8551788330078125, -3.9397106170654297, -3.0242421627044678, -2.108773708343506, -1.1933050155639648, -0.27783656120300293, 0.637631893157959, 1.5531005859375, 2.468568801879883, 3.384037494659424]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 3.0, 11.0, 9.0, 14.0, 30.0, 37.0, 22.0, 39.0, 32.0, 28.0, 42.0, 50.0, 39.0, 32.0, 49.0, 59.0, 49.0, 53.0, 50.0, 34.0, 32.0, 45.0, 39.0, 32.0, 15.0, 27.0, 27.0, 11.0, 19.0, 13.0, 8.0, 9.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.994815826416016, -8.629061698913574, -8.26330852508545, -7.897554397583008, -7.531800746917725, -7.166047096252441, -6.80029296875, -6.434539318084717, -6.068785667419434, -5.70303201675415, -5.337277889251709, -4.971524238586426, -4.605770587921143, -4.240016937255859, -3.874262809753418, -3.5085091590881348, -3.1427550315856934, -2.777001142501831, -2.411247491836548, -2.0454936027526855, -1.6797398328781128, -1.31398606300354, -0.9482321739196777, -0.5824785232543945, -0.21672463417053223, 0.14902916550636292, 0.5147829651832581, 0.8805367946624756, 1.2462905645370483, 1.612044334411621, 1.9777982234954834, 2.3435518741607666, 2.709305763244629, 3.075059652328491, 3.4408133029937744, 3.8065671920776367, 4.17232084274292, 4.538074493408203, 4.9038286209106445, 5.269582271575928, 5.635335922241211, 6.001089572906494, 6.3668437004089355, 6.732597351074219, 7.098351001739502, 7.464104652404785, 7.829858779907227, 8.195611953735352, 8.56136703491211, 8.92712116241455, 9.292874336242676, 9.658628463745117, 10.024382591247559, 10.390135765075684, 10.755889892578125, 11.12164306640625, 11.487397193908691, 11.853151321411133, 12.218904495239258, 12.5846586227417, 12.95041275024414, 13.316165924072266, 13.681920051574707, 14.047674179077148, 14.413427352905273]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 10.0, 16.0, 16.0, 20.0, 28.0, 29.0, 24.0, 30.0, 33.0, 40.0, 45.0, 43.0, 40.0, 50.0, 41.0, 54.0, 36.0, 53.0, 47.0, 45.0, 40.0, 33.0, 32.0, 30.0, 25.0, 21.0, 14.0, 15.0, 8.0, 13.0, 12.0, 4.0, 3.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84423828125, -0.8149337768554688, -0.7856292724609375, -0.7563247680664062, -0.727020263671875, -0.6977157592773438, -0.6684112548828125, -0.6391067504882812, -0.60980224609375, -0.5804977416992188, -0.5511932373046875, -0.5218887329101562, -0.492584228515625, -0.46327972412109375, -0.4339752197265625, -0.40467071533203125, -0.3753662109375, -0.34606170654296875, -0.3167572021484375, -0.28745269775390625, -0.258148193359375, -0.22884368896484375, -0.1995391845703125, -0.17023468017578125, -0.14093017578125, -0.11162567138671875, -0.0823211669921875, -0.05301666259765625, -0.023712158203125, 0.00559234619140625, 0.0348968505859375, 0.06420135498046875, 0.093505859375, 0.12281036376953125, 0.1521148681640625, 0.18141937255859375, 0.210723876953125, 0.24002838134765625, 0.2693328857421875, 0.29863739013671875, 0.32794189453125, 0.35724639892578125, 0.3865509033203125, 0.41585540771484375, 0.445159912109375, 0.47446441650390625, 0.5037689208984375, 0.5330734252929688, 0.5623779296875, 0.5916824340820312, 0.6209869384765625, 0.6502914428710938, 0.679595947265625, 0.7089004516601562, 0.7382049560546875, 0.7675094604492188, 0.79681396484375, 0.8261184692382812, 0.8554229736328125, 0.8847274780273438, 0.914031982421875, 0.9433364868164062, 0.9726409912109375, 1.0019454956054688, 1.03125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 2.0, 12.0, 14.0, 21.0, 23.0, 42.0, 53.0, 105.0, 174.0, 330.0, 644.0, 1500.0, 3719.0, 9061.0, 26064.0, 108975.0, 2121047.0, 1785596.0, 97908.0, 24040.0, 8580.0, 3326.0, 1466.0, 705.0, 363.0, 177.0, 104.0, 64.0, 47.0, 27.0, 19.0, 21.0, 13.0, 5.0, 7.0, 9.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.496612548828125, -3.37994384765625, -3.263275146484375, -3.1466064453125, -3.029937744140625, -2.91326904296875, -2.796600341796875, -2.679931640625, -2.563262939453125, -2.44659423828125, -2.329925537109375, -2.2132568359375, -2.096588134765625, -1.97991943359375, -1.863250732421875, -1.74658203125, -1.629913330078125, -1.51324462890625, -1.396575927734375, -1.2799072265625, -1.163238525390625, -1.04656982421875, -0.929901123046875, -0.813232421875, -0.696563720703125, -0.57989501953125, -0.463226318359375, -0.3465576171875, -0.229888916015625, -0.11322021484375, 0.003448486328125, 0.1201171875, 0.236785888671875, 0.35345458984375, 0.470123291015625, 0.5867919921875, 0.703460693359375, 0.82012939453125, 0.936798095703125, 1.053466796875, 1.170135498046875, 1.28680419921875, 1.403472900390625, 1.5201416015625, 1.636810302734375, 1.75347900390625, 1.870147705078125, 1.98681640625, 2.103485107421875, 2.22015380859375, 2.336822509765625, 2.4534912109375, 2.570159912109375, 2.68682861328125, 2.803497314453125, 2.920166015625, 3.036834716796875, 3.15350341796875, 3.270172119140625, 3.3868408203125, 3.503509521484375, 3.62017822265625, 3.736846923828125, 3.853515625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 11.0, 10.0, 21.0, 37.0, 54.0, 98.0, 171.0, 339.0, 710.0, 1096.0, 748.0, 351.0, 177.0, 111.0, 65.0, 26.0, 21.0, 13.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.375, -7.213134765625, -7.05126953125, -6.889404296875, -6.7275390625, -6.565673828125, -6.40380859375, -6.241943359375, -6.080078125, -5.918212890625, -5.75634765625, -5.594482421875, -5.4326171875, -5.270751953125, -5.10888671875, -4.947021484375, -4.78515625, -4.623291015625, -4.46142578125, -4.299560546875, -4.1376953125, -3.975830078125, -3.81396484375, -3.652099609375, -3.490234375, -3.328369140625, -3.16650390625, -3.004638671875, -2.8427734375, -2.680908203125, -2.51904296875, -2.357177734375, -2.1953125, -2.033447265625, -1.87158203125, -1.709716796875, -1.5478515625, -1.385986328125, -1.22412109375, -1.062255859375, -0.900390625, -0.738525390625, -0.57666015625, -0.414794921875, -0.2529296875, -0.091064453125, 0.07080078125, 0.232666015625, 0.39453125, 0.556396484375, 0.71826171875, 0.880126953125, 1.0419921875, 1.203857421875, 1.36572265625, 1.527587890625, 1.689453125, 1.851318359375, 2.01318359375, 2.175048828125, 2.3369140625, 2.498779296875, 2.66064453125, 2.822509765625, 2.984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 10.0, 23.0, 22.0, 24.0, 27.0, 43.0, 70.0, 119.0, 219.0, 663.0, 2083.0, 8485.0, 54974.0, 1118586.0, 2898624.0, 93448.0, 12587.0, 2711.0, 835.0, 320.0, 155.0, 71.0, 45.0, 27.0, 30.0, 15.0, 22.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.39447021484375, -6.1053466796875, -5.81622314453125, -5.527099609375, -5.23797607421875, -4.9488525390625, -4.65972900390625, -4.37060546875, -4.08148193359375, -3.7923583984375, -3.50323486328125, -3.214111328125, -2.92498779296875, -2.6358642578125, -2.34674072265625, -2.0576171875, -1.76849365234375, -1.4793701171875, -1.19024658203125, -0.901123046875, -0.61199951171875, -0.3228759765625, -0.03375244140625, 0.25537109375, 0.54449462890625, 0.8336181640625, 1.12274169921875, 1.411865234375, 1.70098876953125, 1.9901123046875, 2.27923583984375, 2.568359375, 2.85748291015625, 3.1466064453125, 3.43572998046875, 3.724853515625, 4.01397705078125, 4.3031005859375, 4.59222412109375, 4.88134765625, 5.17047119140625, 5.4595947265625, 5.74871826171875, 6.037841796875, 6.32696533203125, 6.6160888671875, 6.90521240234375, 7.1943359375, 7.48345947265625, 7.7725830078125, 8.06170654296875, 8.350830078125, 8.63995361328125, 8.9290771484375, 9.21820068359375, 9.50732421875, 9.79644775390625, 10.0855712890625, 10.37469482421875, 10.663818359375, 10.95294189453125, 11.2420654296875, 11.53118896484375, 11.8203125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 19.0, 44.0, 61.0, 129.0, 201.0, 194.0, 166.0, 105.0, 46.0, 20.0, 9.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.7143669128418, -35.8249397277832, -34.93551254272461, -34.046085357666016, -33.15665817260742, -32.26723098754883, -31.377803802490234, -30.488378524780273, -29.59895133972168, -28.709524154663086, -27.820096969604492, -26.9306697845459, -26.041242599487305, -25.151817321777344, -24.26239013671875, -23.372962951660156, -22.483535766601562, -21.59410858154297, -20.704681396484375, -19.81525421142578, -18.925827026367188, -18.036399841308594, -17.14697265625, -16.25754737854004, -15.368118286132812, -14.478691101074219, -13.589263916015625, -12.699836730957031, -11.810410499572754, -10.92098331451416, -10.031556129455566, -9.142129898071289, -8.252702713012695, -7.363275527954102, -6.473848819732666, -5.584421634674072, -4.694994926452637, -3.805567741394043, -2.916140556335449, -2.0267138481140137, -1.13728666305542, -0.2478596568107605, 0.6415673494338989, 1.5309944152832031, 2.4204213619232178, 3.3098483085632324, 4.199275493621826, 5.088702201843262, 5.9781293869018555, 6.867556571960449, 7.756983280181885, 8.64640998840332, 9.535837173461914, 10.425264358520508, 11.314691543579102, 12.204118728637695, 13.093545913696289, 13.982973098754883, 14.872400283813477, 15.76182746887207, 16.651254653930664, 17.540679931640625, 18.43010711669922, 19.319534301757812, 20.208961486816406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 13.0, 10.0, 15.0, 20.0, 18.0, 21.0, 21.0, 28.0, 24.0, 34.0, 33.0, 53.0, 35.0, 36.0, 35.0, 41.0, 58.0, 38.0, 31.0, 31.0, 33.0, 40.0, 28.0, 33.0, 32.0, 28.0, 28.0, 28.0, 16.0, 15.0, 13.0, 12.0, 9.0, 12.0, 5.0, 5.0, 12.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.801793098449707, -8.55057144165039, -8.29935073852539, -8.048129081726074, -7.796907424926758, -7.5456862449646, -7.294465065002441, -7.043243408203125, -6.792022228240967, -6.540801048278809, -6.289579391479492, -6.038358211517334, -5.787137031555176, -5.535915374755859, -5.284694194793701, -5.033473014831543, -4.782251358032227, -4.531030178070068, -4.279808521270752, -4.028587341308594, -3.7773659229278564, -3.526144504547119, -3.274923324584961, -3.0237019062042236, -2.7724804878234863, -2.521259069442749, -2.2700376510620117, -2.0188164710998535, -1.7675950527191162, -1.516373634338379, -1.2651523351669312, -1.0139310359954834, -0.7627086639404297, -0.5114873051643372, -0.26026594638824463, -0.0090445876121521, 0.24217677116394043, 0.49339818954467773, 0.7446194887161255, 0.9958407878875732, 1.2470622062683105, 1.4982836246490479, 1.7495049238204956, 2.0007262229919434, 2.2519476413726807, 2.503169059753418, 2.754390239715576, 3.0056116580963135, 3.256833076477051, 3.508054494857788, 3.7592759132385254, 4.010497093200684, 4.26171875, 4.512939929962158, 4.764161109924316, 5.015382766723633, 5.266603946685791, 5.517825126647949, 5.769046783447266, 6.020267963409424, 6.271489143371582, 6.522710800170898, 6.773931980133057, 7.025153160095215, 7.276374816894531]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 12.0, 10.0, 16.0, 16.0, 20.0, 24.0, 19.0, 27.0, 22.0, 18.0, 29.0, 31.0, 28.0, 34.0, 38.0, 40.0, 48.0, 42.0, 53.0, 43.0, 50.0, 42.0, 33.0, 39.0, 36.0, 31.0, 23.0, 18.0, 23.0, 15.0, 17.0, 16.0, 13.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87744140625, -0.8497467041015625, -0.822052001953125, -0.7943572998046875, -0.76666259765625, -0.7389678955078125, -0.711273193359375, -0.6835784912109375, -0.6558837890625, -0.6281890869140625, -0.600494384765625, -0.5727996826171875, -0.54510498046875, -0.5174102783203125, -0.489715576171875, -0.4620208740234375, -0.434326171875, -0.4066314697265625, -0.378936767578125, -0.3512420654296875, -0.32354736328125, -0.2958526611328125, -0.268157958984375, -0.2404632568359375, -0.2127685546875, -0.1850738525390625, -0.157379150390625, -0.1296844482421875, -0.10198974609375, -0.0742950439453125, -0.046600341796875, -0.0189056396484375, 0.0087890625, 0.0364837646484375, 0.064178466796875, 0.0918731689453125, 0.11956787109375, 0.1472625732421875, 0.174957275390625, 0.2026519775390625, 0.2303466796875, 0.2580413818359375, 0.285736083984375, 0.3134307861328125, 0.34112548828125, 0.3688201904296875, 0.396514892578125, 0.4242095947265625, 0.451904296875, 0.4795989990234375, 0.507293701171875, 0.5349884033203125, 0.56268310546875, 0.5903778076171875, 0.618072509765625, 0.6457672119140625, 0.6734619140625, 0.7011566162109375, 0.728851318359375, 0.7565460205078125, 0.78424072265625, 0.8119354248046875, 0.839630126953125, 0.8673248291015625, 0.89501953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 12.0, 17.0, 36.0, 46.0, 49.0, 109.0, 145.0, 265.0, 332.0, 508.0, 825.0, 1226.0, 1761.0, 2665.0, 4020.0, 5901.0, 8889.0, 13255.0, 19568.0, 29233.0, 42656.0, 60681.0, 84802.0, 111115.0, 133089.0, 134891.0, 112511.0, 85538.0, 61731.0, 42538.0, 29630.0, 19618.0, 13538.0, 8966.0, 6126.0, 4103.0, 2752.0, 1815.0, 1193.0, 850.0, 516.0, 342.0, 230.0, 170.0, 95.0, 75.0, 38.0, 37.0, 20.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.68701171875, -0.6668167114257812, -0.6466217041015625, -0.6264266967773438, -0.606231689453125, -0.5860366821289062, -0.5658416748046875, -0.5456466674804688, -0.52545166015625, -0.5052566528320312, -0.4850616455078125, -0.46486663818359375, -0.444671630859375, -0.42447662353515625, -0.4042816162109375, -0.38408660888671875, -0.3638916015625, -0.34369659423828125, -0.3235015869140625, -0.30330657958984375, -0.283111572265625, -0.26291656494140625, -0.2427215576171875, -0.22252655029296875, -0.20233154296875, -0.18213653564453125, -0.1619415283203125, -0.14174652099609375, -0.121551513671875, -0.10135650634765625, -0.0811614990234375, -0.06096649169921875, -0.040771484375, -0.02057647705078125, -0.0003814697265625, 0.01981353759765625, 0.040008544921875, 0.06020355224609375, 0.0803985595703125, 0.10059356689453125, 0.12078857421875, 0.14098358154296875, 0.1611785888671875, 0.18137359619140625, 0.201568603515625, 0.22176361083984375, 0.2419586181640625, 0.26215362548828125, 0.2823486328125, 0.30254364013671875, 0.3227386474609375, 0.34293365478515625, 0.363128662109375, 0.38332366943359375, 0.4035186767578125, 0.42371368408203125, 0.44390869140625, 0.46410369873046875, 0.4842987060546875, 0.5044937133789062, 0.524688720703125, 0.5448837280273438, 0.5650787353515625, 0.5852737426757812, 0.60546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 14.0, 21.0, 21.0, 21.0, 21.0, 25.0, 36.0, 47.0, 26.0, 49.0, 38.0, 43.0, 38.0, 47.0, 1068.0, 42.0, 43.0, 46.0, 46.0, 36.0, 42.0, 47.0, 28.0, 24.0, 27.0, 26.0, 17.0, 9.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.255859375, -1.2216720581054688, -1.1874847412109375, -1.1532974243164062, -1.119110107421875, -1.0849227905273438, -1.0507354736328125, -1.0165481567382812, -0.98236083984375, -0.9481735229492188, -0.9139862060546875, -0.8797988891601562, -0.845611572265625, -0.8114242553710938, -0.7772369384765625, -0.7430496215820312, -0.7088623046875, -0.6746749877929688, -0.6404876708984375, -0.6063003540039062, -0.572113037109375, -0.5379257202148438, -0.5037384033203125, -0.46955108642578125, -0.43536376953125, -0.40117645263671875, -0.3669891357421875, -0.33280181884765625, -0.298614501953125, -0.26442718505859375, -0.2302398681640625, -0.19605255126953125, -0.161865234375, -0.12767791748046875, -0.0934906005859375, -0.05930328369140625, -0.025115966796875, 0.00907135009765625, 0.0432586669921875, 0.07744598388671875, 0.11163330078125, 0.14582061767578125, 0.1800079345703125, 0.21419525146484375, 0.248382568359375, 0.28256988525390625, 0.3167572021484375, 0.35094451904296875, 0.3851318359375, 0.41931915283203125, 0.4535064697265625, 0.48769378662109375, 0.521881103515625, 0.5560684204101562, 0.5902557373046875, 0.6244430541992188, 0.65863037109375, 0.6928176879882812, 0.7270050048828125, 0.7611923217773438, 0.795379638671875, 0.8295669555664062, 0.8637542724609375, 0.8979415893554688, 0.93212890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 7.0, 5.0, 9.0, 20.0, 28.0, 46.0, 85.0, 120.0, 169.0, 279.0, 435.0, 683.0, 1038.0, 1751.0, 2729.0, 4218.0, 7153.0, 11815.0, 21167.0, 46316.0, 256580.0, 1551521.0, 114898.0, 33507.0, 16922.0, 9815.0, 5820.0, 3649.0, 2376.0, 1460.0, 925.0, 591.0, 368.0, 211.0, 133.0, 110.0, 70.0, 44.0, 24.0, 14.0, 9.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99072265625, -0.9557418823242188, -0.9207611083984375, -0.8857803344726562, -0.850799560546875, -0.8158187866210938, -0.7808380126953125, -0.7458572387695312, -0.71087646484375, -0.6758956909179688, -0.6409149169921875, -0.6059341430664062, -0.570953369140625, -0.5359725952148438, -0.5009918212890625, -0.46601104736328125, -0.4310302734375, -0.39604949951171875, -0.3610687255859375, -0.32608795166015625, -0.291107177734375, -0.25612640380859375, -0.2211456298828125, -0.18616485595703125, -0.15118408203125, -0.11620330810546875, -0.0812225341796875, -0.04624176025390625, -0.011260986328125, 0.02371978759765625, 0.0587005615234375, 0.09368133544921875, 0.128662109375, 0.16364288330078125, 0.1986236572265625, 0.23360443115234375, 0.268585205078125, 0.30356597900390625, 0.3385467529296875, 0.37352752685546875, 0.40850830078125, 0.44348907470703125, 0.4784698486328125, 0.5134506225585938, 0.548431396484375, 0.5834121704101562, 0.6183929443359375, 0.6533737182617188, 0.6883544921875, 0.7233352661132812, 0.7583160400390625, 0.7932968139648438, 0.828277587890625, 0.8632583618164062, 0.8982391357421875, 0.9332199096679688, 0.96820068359375, 1.0031814575195312, 1.0381622314453125, 1.0731430053710938, 1.108123779296875, 1.1431045532226562, 1.1780853271484375, 1.2130661010742188, 1.248046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 6.0, 7.0, 7.0, 4.0, 12.0, 18.0, 9.0, 17.0, 35.0, 33.0, 41.0, 45.0, 52.0, 68.0, 86.0, 72.0, 88.0, 52.0, 50.0, 45.0, 46.0, 35.0, 36.0, 22.0, 19.0, 18.0, 15.0, 13.0, 6.0, 8.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207763671875, -0.2004852294921875, -0.193206787109375, -0.1859283447265625, -0.17864990234375, -0.1713714599609375, -0.164093017578125, -0.1568145751953125, -0.1495361328125, -0.1422576904296875, -0.134979248046875, -0.1277008056640625, -0.12042236328125, -0.1131439208984375, -0.105865478515625, -0.0985870361328125, -0.09130859375, -0.0840301513671875, -0.076751708984375, -0.0694732666015625, -0.06219482421875, -0.0549163818359375, -0.047637939453125, -0.0403594970703125, -0.0330810546875, -0.0258026123046875, -0.018524169921875, -0.0112457275390625, -0.00396728515625, 0.0033111572265625, 0.010589599609375, 0.0178680419921875, 0.025146484375, 0.0324249267578125, 0.039703369140625, 0.0469818115234375, 0.05426025390625, 0.0615386962890625, 0.068817138671875, 0.0760955810546875, 0.0833740234375, 0.0906524658203125, 0.097930908203125, 0.1052093505859375, 0.11248779296875, 0.1197662353515625, 0.127044677734375, 0.1343231201171875, 0.1416015625, 0.1488800048828125, 0.156158447265625, 0.1634368896484375, 0.17071533203125, 0.1779937744140625, 0.185272216796875, 0.1925506591796875, 0.1998291015625, 0.2071075439453125, 0.214385986328125, 0.2216644287109375, 0.22894287109375, 0.2362213134765625, 0.243499755859375, 0.2507781982421875, 0.258056640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 7.0, 12.0, 9.0, 18.0, 21.0, 37.0, 49.0, 46.0, 73.0, 126.0, 163.0, 282.0, 798.0, 3332.0, 26636.0, 744937.0, 255586.0, 12958.0, 2079.0, 559.0, 263.0, 197.0, 87.0, 79.0, 51.0, 35.0, 28.0, 16.0, 12.0, 8.0, 9.0, 10.0, 6.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4921875, -3.394775390625, -3.29736328125, -3.199951171875, -3.1025390625, -3.005126953125, -2.90771484375, -2.810302734375, -2.712890625, -2.615478515625, -2.51806640625, -2.420654296875, -2.3232421875, -2.225830078125, -2.12841796875, -2.031005859375, -1.93359375, -1.836181640625, -1.73876953125, -1.641357421875, -1.5439453125, -1.446533203125, -1.34912109375, -1.251708984375, -1.154296875, -1.056884765625, -0.95947265625, -0.862060546875, -0.7646484375, -0.667236328125, -0.56982421875, -0.472412109375, -0.375, -0.277587890625, -0.18017578125, -0.082763671875, 0.0146484375, 0.112060546875, 0.20947265625, 0.306884765625, 0.404296875, 0.501708984375, 0.59912109375, 0.696533203125, 0.7939453125, 0.891357421875, 0.98876953125, 1.086181640625, 1.18359375, 1.281005859375, 1.37841796875, 1.475830078125, 1.5732421875, 1.670654296875, 1.76806640625, 1.865478515625, 1.962890625, 2.060302734375, 2.15771484375, 2.255126953125, 2.3525390625, 2.449951171875, 2.54736328125, 2.644775390625, 2.7421875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 16.0, 20.0, 44.0, 129.0, 431.0, 243.0, 81.0, 28.0, 10.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.804503440856934, -6.6024394035339355, -6.400374889373779, -6.198310852050781, -5.996246814727783, -5.794182777404785, -5.592118263244629, -5.390054225921631, -5.187990188598633, -4.985926151275635, -4.7838616371154785, -4.5817975997924805, -4.379733562469482, -4.177669525146484, -3.975605010986328, -3.77354097366333, -3.571476459503174, -3.3694121837615967, -3.1673481464385986, -2.9652838706970215, -2.7632198333740234, -2.5611555576324463, -2.359091281890869, -2.157027244567871, -1.954962968826294, -1.7528988122940063, -1.5508346557617188, -1.3487703800201416, -1.146706223487854, -0.9446420669555664, -0.7425777912139893, -0.5405136346817017, -0.33844995498657227, -0.13638576865196228, 0.0656784176826477, 0.2677426338195801, 0.4698067903518677, 0.6718709468841553, 0.8739352226257324, 1.07599937915802, 1.2780635356903076, 1.4801276922225952, 1.6821918487548828, 1.88425612449646, 2.086320400238037, 2.288384437561035, 2.4904487133026123, 2.6925129890441895, 2.8945770263671875, 3.0966413021087646, 3.2987053394317627, 3.50076961517334, 3.702833652496338, 3.904897928237915, 4.106962203979492, 4.30902624130249, 4.511090278625488, 4.713154315948486, 4.915218830108643, 5.117282867431641, 5.319346904754639, 5.521410942077637, 5.723475456237793, 5.925539493560791, 6.127604007720947]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 4.0, 5.0, 11.0, 18.0, 13.0, 22.0, 25.0, 33.0, 28.0, 44.0, 30.0, 62.0, 51.0, 33.0, 54.0, 38.0, 66.0, 58.0, 48.0, 46.0, 48.0, 35.0, 48.0, 40.0, 18.0, 21.0, 18.0, 9.0, 12.0, 13.0, 15.0, 7.0, 5.0, 9.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5857336521148682, -1.539997935295105, -1.4942622184753418, -1.448526382446289, -1.4027906656265259, -1.3570549488067627, -1.3113192319869995, -1.2655835151672363, -1.2198477983474731, -1.17411208152771, -1.1283763647079468, -1.0826406478881836, -1.0369048118591309, -0.9911690950393677, -0.9454333782196045, -0.8996976613998413, -0.8539618849754333, -0.8082261681556702, -0.7624903917312622, -0.716754674911499, -0.6710189580917358, -0.6252832412719727, -0.5795474648475647, -0.5338117480278015, -0.48807600140571594, -0.44234025478363037, -0.3966045379638672, -0.3508687913417816, -0.30513304471969604, -0.25939732789993286, -0.2136615812778473, -0.1679258644580841, -0.12219011783599854, -0.07645438611507416, -0.030718646943569183, 0.015017092227935791, 0.06075282394886017, 0.10648855566978455, 0.15222430229187012, 0.1979600191116333, 0.24369576573371887, 0.28943151235580444, 0.3351672291755676, 0.3809029757976532, 0.42663872241973877, 0.47237443923950195, 0.5181101560592651, 0.5638458728790283, 0.6095816493034363, 0.6553173661231995, 0.7010531425476074, 0.7467888593673706, 0.7925245761871338, 0.838260293006897, 0.8839960694313049, 0.9297317862510681, 0.9754675626754761, 1.0212032794952393, 1.0669389963150024, 1.1126747131347656, 1.1584105491638184, 1.2041462659835815, 1.2498819828033447, 1.295617699623108, 1.341353416442871]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 0.0, 4.0, 10.0, 4.0, 9.0, 12.0, 19.0, 16.0, 15.0, 21.0, 24.0, 23.0, 31.0, 37.0, 27.0, 31.0, 31.0, 38.0, 32.0, 52.0, 42.0, 57.0, 49.0, 48.0, 51.0, 44.0, 35.0, 39.0, 15.0, 24.0, 26.0, 22.0, 13.0, 19.0, 19.0, 12.0, 11.0, 10.0, 9.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89697265625, -0.8680572509765625, -0.839141845703125, -0.8102264404296875, -0.78131103515625, -0.7523956298828125, -0.723480224609375, -0.6945648193359375, -0.6656494140625, -0.6367340087890625, -0.607818603515625, -0.5789031982421875, -0.54998779296875, -0.5210723876953125, -0.492156982421875, -0.4632415771484375, -0.434326171875, -0.4054107666015625, -0.376495361328125, -0.3475799560546875, -0.31866455078125, -0.2897491455078125, -0.260833740234375, -0.2319183349609375, -0.2030029296875, -0.1740875244140625, -0.145172119140625, -0.1162567138671875, -0.08734130859375, -0.0584259033203125, -0.029510498046875, -0.0005950927734375, 0.0283203125, 0.0572357177734375, 0.086151123046875, 0.1150665283203125, 0.14398193359375, 0.1728973388671875, 0.201812744140625, 0.2307281494140625, 0.2596435546875, 0.2885589599609375, 0.317474365234375, 0.3463897705078125, 0.37530517578125, 0.4042205810546875, 0.433135986328125, 0.4620513916015625, 0.490966796875, 0.5198822021484375, 0.548797607421875, 0.5777130126953125, 0.60662841796875, 0.6355438232421875, 0.664459228515625, 0.6933746337890625, 0.7222900390625, 0.7512054443359375, 0.780120849609375, 0.8090362548828125, 0.83795166015625, 0.8668670654296875, 0.895782470703125, 0.9246978759765625, 0.95361328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 12.0, 14.0, 28.0, 41.0, 51.0, 75.0, 113.0, 181.0, 233.0, 361.0, 608.0, 917.0, 1413.0, 2222.0, 3779.0, 6946.0, 13770.0, 31347.0, 89323.0, 327926.0, 389574.0, 108639.0, 36866.0, 15361.0, 7689.0, 4245.0, 2541.0, 1480.0, 970.0, 606.0, 417.0, 243.0, 181.0, 125.0, 73.0, 45.0, 46.0, 30.0, 16.0, 15.0, 7.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.449920654296875, -1.40472412109375, -1.359527587890625, -1.3143310546875, -1.269134521484375, -1.22393798828125, -1.178741455078125, -1.133544921875, -1.088348388671875, -1.04315185546875, -0.997955322265625, -0.9527587890625, -0.907562255859375, -0.86236572265625, -0.817169189453125, -0.77197265625, -0.726776123046875, -0.68157958984375, -0.636383056640625, -0.5911865234375, -0.545989990234375, -0.50079345703125, -0.455596923828125, -0.410400390625, -0.365203857421875, -0.32000732421875, -0.274810791015625, -0.2296142578125, -0.184417724609375, -0.13922119140625, -0.094024658203125, -0.048828125, -0.003631591796875, 0.04156494140625, 0.086761474609375, 0.1319580078125, 0.177154541015625, 0.22235107421875, 0.267547607421875, 0.312744140625, 0.357940673828125, 0.40313720703125, 0.448333740234375, 0.4935302734375, 0.538726806640625, 0.58392333984375, 0.629119873046875, 0.67431640625, 0.719512939453125, 0.76470947265625, 0.809906005859375, 0.8551025390625, 0.900299072265625, 0.94549560546875, 0.990692138671875, 1.035888671875, 1.081085205078125, 1.12628173828125, 1.171478271484375, 1.2166748046875, 1.261871337890625, 1.30706787109375, 1.352264404296875, 1.3974609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 2.0, 10.0, 14.0, 10.0, 16.0, 17.0, 23.0, 17.0, 29.0, 29.0, 24.0, 37.0, 33.0, 39.0, 56.0, 52.0, 80.0, 103.0, 230.0, 1429.0, 194.0, 104.0, 64.0, 67.0, 44.0, 35.0, 48.0, 32.0, 34.0, 33.0, 22.0, 21.0, 17.0, 15.0, 10.0, 7.0, 13.0, 6.0, 6.0, 11.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.443359375, -3.3404541015625, -3.237548828125, -3.1346435546875, -3.03173828125, -2.9288330078125, -2.825927734375, -2.7230224609375, -2.6201171875, -2.5172119140625, -2.414306640625, -2.3114013671875, -2.20849609375, -2.1055908203125, -2.002685546875, -1.8997802734375, -1.796875, -1.6939697265625, -1.591064453125, -1.4881591796875, -1.38525390625, -1.2823486328125, -1.179443359375, -1.0765380859375, -0.9736328125, -0.8707275390625, -0.767822265625, -0.6649169921875, -0.56201171875, -0.4591064453125, -0.356201171875, -0.2532958984375, -0.150390625, -0.0474853515625, 0.055419921875, 0.1583251953125, 0.26123046875, 0.3641357421875, 0.467041015625, 0.5699462890625, 0.6728515625, 0.7757568359375, 0.878662109375, 0.9815673828125, 1.08447265625, 1.1873779296875, 1.290283203125, 1.3931884765625, 1.49609375, 1.5989990234375, 1.701904296875, 1.8048095703125, 1.90771484375, 2.0106201171875, 2.113525390625, 2.2164306640625, 2.3193359375, 2.4222412109375, 2.525146484375, 2.6280517578125, 2.73095703125, 2.8338623046875, 2.936767578125, 3.0396728515625, 3.142578125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 10.0, 12.0, 11.0, 16.0, 29.0, 32.0, 50.0, 87.0, 175.0, 218.0, 478.0, 933.0, 2067.0, 5096.0, 13941.0, 57559.0, 1167102.0, 1800036.0, 71611.0, 16121.0, 5619.0, 2255.0, 1040.0, 485.0, 244.0, 170.0, 105.0, 73.0, 42.0, 28.0, 19.0, 22.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.955078125, -3.797210693359375, -3.63934326171875, -3.481475830078125, -3.3236083984375, -3.165740966796875, -3.00787353515625, -2.850006103515625, -2.692138671875, -2.534271240234375, -2.37640380859375, -2.218536376953125, -2.0606689453125, -1.902801513671875, -1.74493408203125, -1.587066650390625, -1.42919921875, -1.271331787109375, -1.11346435546875, -0.955596923828125, -0.7977294921875, -0.639862060546875, -0.48199462890625, -0.324127197265625, -0.166259765625, -0.008392333984375, 0.14947509765625, 0.307342529296875, 0.4652099609375, 0.623077392578125, 0.78094482421875, 0.938812255859375, 1.0966796875, 1.254547119140625, 1.41241455078125, 1.570281982421875, 1.7281494140625, 1.886016845703125, 2.04388427734375, 2.201751708984375, 2.359619140625, 2.517486572265625, 2.67535400390625, 2.833221435546875, 2.9910888671875, 3.148956298828125, 3.30682373046875, 3.464691162109375, 3.62255859375, 3.780426025390625, 3.93829345703125, 4.096160888671875, 4.2540283203125, 4.411895751953125, 4.56976318359375, 4.727630615234375, 4.885498046875, 5.043365478515625, 5.20123291015625, 5.359100341796875, 5.5169677734375, 5.674835205078125, 5.83270263671875, 5.990570068359375, 6.1484375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 237.0, 698.0, 69.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.47452735900879, -15.380653381347656, -13.286779403686523, -11.192906379699707, -9.099032402038574, -7.005158424377441, -4.911285400390625, -2.817411422729492, -0.7235374450683594, 1.3703362941741943, 3.464210033416748, 5.558083534240723, 7.6519575119018555, 9.745831489562988, 11.839704513549805, 13.933578491210938, 16.02745246887207, 18.121326446533203, 20.215200424194336, 22.30907440185547, 24.40294647216797, 26.496822357177734, 28.590694427490234, 30.684568405151367, 32.7784423828125, 34.872314453125, 36.966190338134766, 39.060062408447266, 41.15393829345703, 43.24781036376953, 45.34168243408203, 47.4355583190918, 49.52942657470703, 51.62329864501953, 53.7171745300293, 55.8110466003418, 57.90492248535156, 59.99879455566406, 62.09266662597656, 64.18653869628906, 66.2804183959961, 68.3742904663086, 70.4681625366211, 72.56204223632812, 74.65591430664062, 76.74978637695312, 78.84365844726562, 80.93753051757812, 83.03140258789062, 85.12527465820312, 87.21914672851562, 89.31302642822266, 91.40689849853516, 93.50077056884766, 95.59464263916016, 97.68852233886719, 99.78239440917969, 101.87626647949219, 103.97013854980469, 106.06401824951172, 108.15789031982422, 110.25176239013672, 112.34563446044922, 114.43951416015625, 116.53338623046875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 4.0, 1.0, 7.0, 3.0, 2.0, 11.0, 6.0, 15.0, 14.0, 14.0, 14.0, 21.0, 18.0, 31.0, 28.0, 28.0, 22.0, 26.0, 38.0, 37.0, 33.0, 33.0, 50.0, 44.0, 37.0, 31.0, 30.0, 27.0, 27.0, 39.0, 29.0, 34.0, 25.0, 28.0, 29.0, 23.0, 17.0, 19.0, 12.0, 10.0, 11.0, 7.0, 18.0, 8.0, 6.0, 8.0, 3.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.972294807434082, -9.66366958618164, -9.355045318603516, -9.046420097351074, -8.737794876098633, -8.429170608520508, -8.120545387268066, -7.811920642852783, -7.5032958984375, -7.194671154022217, -6.886046409606934, -6.577421188354492, -6.268796443939209, -5.960171699523926, -5.651546478271484, -5.342921733856201, -5.034296989440918, -4.725672245025635, -4.417047500610352, -4.10842227935791, -3.799797534942627, -3.4911727905273438, -3.1825478076934814, -2.873922824859619, -2.565298080444336, -2.2566733360290527, -1.9480483531951904, -1.6394234895706177, -1.330798625946045, -1.0221737623214722, -0.7135488986968994, -0.4049239158630371, -0.09630012512207031, 0.21232473850250244, 0.5209496021270752, 0.829574465751648, 1.1381993293762207, 1.4468241930007935, 1.7554490566253662, 2.0640740394592285, 2.3726987838745117, 2.681323528289795, 2.9899485111236572, 3.2985734939575195, 3.6071982383728027, 3.915822982788086, 4.224448204040527, 4.5330729484558105, 4.841697692871094, 5.150322437286377, 5.45894718170166, 5.767572402954102, 6.076197147369385, 6.384821891784668, 6.693447113037109, 7.002071857452393, 7.310696601867676, 7.619321346282959, 7.927946090698242, 8.236571311950684, 8.545196533203125, 8.85382080078125, 9.162446022033691, 9.471071243286133, 9.779695510864258]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 16.0, 17.0, 20.0, 16.0, 15.0, 29.0, 31.0, 26.0, 31.0, 35.0, 44.0, 34.0, 32.0, 48.0, 45.0, 37.0, 46.0, 40.0, 54.0, 42.0, 34.0, 33.0, 29.0, 29.0, 25.0, 20.0, 14.0, 23.0, 22.0, 7.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.89208984375, -0.8633270263671875, -0.834564208984375, -0.8058013916015625, -0.77703857421875, -0.7482757568359375, -0.719512939453125, -0.6907501220703125, -0.6619873046875, -0.6332244873046875, -0.604461669921875, -0.5756988525390625, -0.54693603515625, -0.5181732177734375, -0.489410400390625, -0.4606475830078125, -0.431884765625, -0.4031219482421875, -0.374359130859375, -0.3455963134765625, -0.31683349609375, -0.2880706787109375, -0.259307861328125, -0.2305450439453125, -0.2017822265625, -0.1730194091796875, -0.144256591796875, -0.1154937744140625, -0.08673095703125, -0.0579681396484375, -0.029205322265625, -0.0004425048828125, 0.0283203125, 0.0570831298828125, 0.085845947265625, 0.1146087646484375, 0.14337158203125, 0.1721343994140625, 0.200897216796875, 0.2296600341796875, 0.2584228515625, 0.2871856689453125, 0.315948486328125, 0.3447113037109375, 0.37347412109375, 0.4022369384765625, 0.430999755859375, 0.4597625732421875, 0.488525390625, 0.5172882080078125, 0.546051025390625, 0.5748138427734375, 0.60357666015625, 0.6323394775390625, 0.661102294921875, 0.6898651123046875, 0.7186279296875, 0.7473907470703125, 0.776153564453125, 0.8049163818359375, 0.83367919921875, 0.8624420166015625, 0.891204833984375, 0.9199676513671875, 0.94873046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 3.0, 10.0, 10.0, 19.0, 27.0, 39.0, 52.0, 72.0, 149.0, 170.0, 297.0, 440.0, 748.0, 1189.0, 1945.0, 3506.0, 6274.0, 11672.0, 23980.0, 56294.0, 208923.0, 1593136.0, 1908752.0, 258490.0, 64149.0, 25703.0, 12244.0, 6603.0, 3783.0, 2063.0, 1304.0, 769.0, 525.0, 315.0, 186.0, 147.0, 98.0, 58.0, 40.0, 29.0, 18.0, 17.0, 11.0, 10.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.09844970703125, -2.0308837890625, -1.96331787109375, -1.895751953125, -1.82818603515625, -1.7606201171875, -1.69305419921875, -1.62548828125, -1.55792236328125, -1.4903564453125, -1.42279052734375, -1.355224609375, -1.28765869140625, -1.2200927734375, -1.15252685546875, -1.0849609375, -1.01739501953125, -0.9498291015625, -0.88226318359375, -0.814697265625, -0.74713134765625, -0.6795654296875, -0.61199951171875, -0.54443359375, -0.47686767578125, -0.4093017578125, -0.34173583984375, -0.274169921875, -0.20660400390625, -0.1390380859375, -0.07147216796875, -0.00390625, 0.06365966796875, 0.1312255859375, 0.19879150390625, 0.266357421875, 0.33392333984375, 0.4014892578125, 0.46905517578125, 0.53662109375, 0.60418701171875, 0.6717529296875, 0.73931884765625, 0.806884765625, 0.87445068359375, 0.9420166015625, 1.00958251953125, 1.0771484375, 1.14471435546875, 1.2122802734375, 1.27984619140625, 1.347412109375, 1.41497802734375, 1.4825439453125, 1.55010986328125, 1.61767578125, 1.68524169921875, 1.7528076171875, 1.82037353515625, 1.887939453125, 1.95550537109375, 2.0230712890625, 2.09063720703125, 2.158203125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 8.0, 14.0, 17.0, 24.0, 34.0, 36.0, 39.0, 53.0, 60.0, 94.0, 125.0, 157.0, 227.0, 297.0, 422.0, 462.0, 481.0, 386.0, 241.0, 194.0, 148.0, 117.0, 83.0, 67.0, 61.0, 51.0, 26.0, 24.0, 27.0, 16.0, 7.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9228515625, -1.8535919189453125, -1.784332275390625, -1.7150726318359375, -1.64581298828125, -1.5765533447265625, -1.507293701171875, -1.4380340576171875, -1.3687744140625, -1.2995147705078125, -1.230255126953125, -1.1609954833984375, -1.09173583984375, -1.0224761962890625, -0.953216552734375, -0.8839569091796875, -0.814697265625, -0.7454376220703125, -0.676177978515625, -0.6069183349609375, -0.53765869140625, -0.4683990478515625, -0.399139404296875, -0.3298797607421875, -0.2606201171875, -0.1913604736328125, -0.122100830078125, -0.0528411865234375, 0.01641845703125, 0.0856781005859375, 0.154937744140625, 0.2241973876953125, 0.29345703125, 0.3627166748046875, 0.431976318359375, 0.5012359619140625, 0.57049560546875, 0.6397552490234375, 0.709014892578125, 0.7782745361328125, 0.8475341796875, 0.9167938232421875, 0.986053466796875, 1.0553131103515625, 1.12457275390625, 1.1938323974609375, 1.263092041015625, 1.3323516845703125, 1.401611328125, 1.4708709716796875, 1.540130615234375, 1.6093902587890625, 1.67864990234375, 1.7479095458984375, 1.817169189453125, 1.8864288330078125, 1.9556884765625, 2.0249481201171875, 2.094207763671875, 2.1634674072265625, 2.23272705078125, 2.3019866943359375, 2.371246337890625, 2.4405059814453125, 2.509765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 12.0, 28.0, 37.0, 45.0, 57.0, 115.0, 142.0, 238.0, 344.0, 588.0, 885.0, 1455.0, 2413.0, 4178.0, 7796.0, 14583.0, 30127.0, 67535.0, 179436.0, 688019.0, 2230790.0, 661475.0, 176247.0, 66039.0, 29367.0, 14375.0, 7553.0, 4124.0, 2400.0, 1408.0, 903.0, 560.0, 351.0, 199.0, 146.0, 109.0, 71.0, 42.0, 31.0, 16.0, 17.0, 9.0, 6.0, 4.0, 2.0, 2.0], "bins": [-3.423828125, -3.334869384765625, -3.24591064453125, -3.156951904296875, -3.0679931640625, -2.979034423828125, -2.89007568359375, -2.801116943359375, -2.712158203125, -2.623199462890625, -2.53424072265625, -2.445281982421875, -2.3563232421875, -2.267364501953125, -2.17840576171875, -2.089447021484375, -2.00048828125, -1.911529541015625, -1.82257080078125, -1.733612060546875, -1.6446533203125, -1.555694580078125, -1.46673583984375, -1.377777099609375, -1.288818359375, -1.199859619140625, -1.11090087890625, -1.021942138671875, -0.9329833984375, -0.844024658203125, -0.75506591796875, -0.666107177734375, -0.5771484375, -0.488189697265625, -0.39923095703125, -0.310272216796875, -0.2213134765625, -0.132354736328125, -0.04339599609375, 0.045562744140625, 0.134521484375, 0.223480224609375, 0.31243896484375, 0.401397705078125, 0.4903564453125, 0.579315185546875, 0.66827392578125, 0.757232666015625, 0.84619140625, 0.935150146484375, 1.02410888671875, 1.113067626953125, 1.2020263671875, 1.290985107421875, 1.37994384765625, 1.468902587890625, 1.557861328125, 1.646820068359375, 1.73577880859375, 1.824737548828125, 1.9136962890625, 2.002655029296875, 2.09161376953125, 2.180572509765625, 2.26953125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 23.0, 20.0, 41.0, 68.0, 82.0, 125.0, 119.0, 123.0, 120.0, 73.0, 49.0, 58.0, 36.0, 18.0, 15.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.158880233764648, -9.64907455444336, -9.13926887512207, -8.629462242126465, -8.119656562805176, -7.609850883483887, -7.1000447273254395, -6.590238571166992, -6.080432891845703, -5.570627212524414, -5.060821056365967, -4.5510149002075195, -4.0412092208862305, -3.5314033031463623, -3.021597385406494, -2.511791467666626, -2.001985549926758, -1.4921796321868896, -0.9823737144470215, -0.4725677967071533, 0.037238121032714844, 0.547044038772583, 1.0568499565124512, 1.5666558742523193, 2.0764617919921875, 2.5862677097320557, 3.096073627471924, 3.605879545211792, 4.11568546295166, 4.625491142272949, 5.1352972984313965, 5.645103454589844, 6.154909133911133, 6.664714813232422, 7.174520969390869, 7.684327125549316, 8.194132804870605, 8.703938484191895, 9.2137451171875, 9.723550796508789, 10.233356475830078, 10.743162155151367, 11.252967834472656, 11.762774467468262, 12.27258014678955, 12.78238582611084, 13.292192459106445, 13.801998138427734, 14.311803817749023, 14.821609497070312, 15.331415176391602, 15.841221809387207, 16.351028442382812, 16.8608341217041, 17.37063980102539, 17.88044548034668, 18.39025115966797, 18.900056838989258, 19.409862518310547, 19.919668197631836, 20.429473876953125, 20.939281463623047, 21.449087142944336, 21.958892822265625, 22.468698501586914]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 7.0, 5.0, 7.0, 4.0, 18.0, 15.0, 11.0, 13.0, 21.0, 21.0, 27.0, 20.0, 31.0, 35.0, 34.0, 26.0, 34.0, 30.0, 43.0, 35.0, 46.0, 48.0, 40.0, 36.0, 37.0, 37.0, 34.0, 31.0, 29.0, 24.0, 36.0, 25.0, 24.0, 19.0, 17.0, 12.0, 13.0, 11.0, 10.0, 13.0, 12.0, 3.0, 2.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.297189712524414, -8.033828735351562, -7.7704668045043945, -7.507105350494385, -7.243743896484375, -6.980382442474365, -6.7170209884643555, -6.453659534454346, -6.190298080444336, -5.926936626434326, -5.663575172424316, -5.400213718414307, -5.136852264404297, -4.873490810394287, -4.610129356384277, -4.346767902374268, -4.083406448364258, -3.820044994354248, -3.5566835403442383, -3.2933220863342285, -3.0299606323242188, -2.766599178314209, -2.503237724304199, -2.2398762702941895, -1.9765148162841797, -1.71315336227417, -1.4497919082641602, -1.1864304542541504, -0.9230690002441406, -0.6597075462341309, -0.3963460922241211, -0.13298463821411133, 0.13037681579589844, 0.3937382698059082, 0.657099723815918, 0.9204611778259277, 1.1838226318359375, 1.4471840858459473, 1.710545539855957, 1.9739069938659668, 2.2372684478759766, 2.5006299018859863, 2.763991355895996, 3.027352809906006, 3.2907142639160156, 3.5540757179260254, 3.817437171936035, 4.080798625946045, 4.344160079956055, 4.6075215339660645, 4.870882987976074, 5.134244441986084, 5.397605895996094, 5.6609673500061035, 5.924328804016113, 6.187690258026123, 6.451051712036133, 6.714413166046143, 6.977774620056152, 7.241136074066162, 7.504497528076172, 7.767858982086182, 8.031220436096191, 8.29458236694336, 8.557943344116211]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 18.0, 18.0, 22.0, 23.0, 32.0, 19.0, 44.0, 32.0, 47.0, 38.0, 52.0, 43.0, 51.0, 28.0, 50.0, 45.0, 46.0, 39.0, 35.0, 44.0, 34.0, 27.0, 33.0, 16.0, 15.0, 20.0, 17.0, 11.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.92041015625, -0.8886947631835938, -0.8569793701171875, -0.8252639770507812, -0.793548583984375, -0.7618331909179688, -0.7301177978515625, -0.6984024047851562, -0.66668701171875, -0.6349716186523438, -0.6032562255859375, -0.5715408325195312, -0.539825439453125, -0.5081100463867188, -0.4763946533203125, -0.44467926025390625, -0.4129638671875, -0.38124847412109375, -0.3495330810546875, -0.31781768798828125, -0.286102294921875, -0.25438690185546875, -0.2226715087890625, -0.19095611572265625, -0.15924072265625, -0.12752532958984375, -0.0958099365234375, -0.06409454345703125, -0.032379150390625, -0.00066375732421875, 0.0310516357421875, 0.06276702880859375, 0.094482421875, 0.12619781494140625, 0.1579132080078125, 0.18962860107421875, 0.221343994140625, 0.25305938720703125, 0.2847747802734375, 0.31649017333984375, 0.34820556640625, 0.37992095947265625, 0.4116363525390625, 0.44335174560546875, 0.475067138671875, 0.5067825317382812, 0.5384979248046875, 0.5702133178710938, 0.6019287109375, 0.6336441040039062, 0.6653594970703125, 0.6970748901367188, 0.728790283203125, 0.7605056762695312, 0.7922210693359375, 0.8239364624023438, 0.85565185546875, 0.8873672485351562, 0.9190826416015625, 0.9507980346679688, 0.982513427734375, 1.0142288208007812, 1.0459442138671875, 1.0776596069335938, 1.109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 7.0, 7.0, 10.0, 23.0, 37.0, 56.0, 85.0, 135.0, 198.0, 258.0, 420.0, 667.0, 959.0, 1429.0, 2127.0, 3114.0, 4687.0, 6912.0, 10416.0, 15600.0, 23313.0, 34231.0, 48904.0, 69049.0, 91918.0, 114413.0, 127329.0, 122600.0, 103637.0, 80122.0, 58694.0, 40957.0, 28154.0, 19317.0, 12832.0, 8631.0, 5709.0, 3852.0, 2520.0, 1745.0, 1216.0, 798.0, 546.0, 329.0, 222.0, 131.0, 85.0, 55.0, 33.0, 29.0, 16.0, 14.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62158203125, -0.6013717651367188, -0.5811614990234375, -0.5609512329101562, -0.540740966796875, -0.5205307006835938, -0.5003204345703125, -0.48011016845703125, -0.45989990234375, -0.43968963623046875, -0.4194793701171875, -0.39926910400390625, -0.379058837890625, -0.35884857177734375, -0.3386383056640625, -0.31842803955078125, -0.2982177734375, -0.27800750732421875, -0.2577972412109375, -0.23758697509765625, -0.217376708984375, -0.19716644287109375, -0.1769561767578125, -0.15674591064453125, -0.13653564453125, -0.11632537841796875, -0.0961151123046875, -0.07590484619140625, -0.055694580078125, -0.03548431396484375, -0.0152740478515625, 0.00493621826171875, 0.025146484375, 0.04535675048828125, 0.0655670166015625, 0.08577728271484375, 0.105987548828125, 0.12619781494140625, 0.1464080810546875, 0.16661834716796875, 0.18682861328125, 0.20703887939453125, 0.2272491455078125, 0.24745941162109375, 0.267669677734375, 0.28787994384765625, 0.3080902099609375, 0.32830047607421875, 0.3485107421875, 0.36872100830078125, 0.3889312744140625, 0.40914154052734375, 0.429351806640625, 0.44956207275390625, 0.4697723388671875, 0.48998260498046875, 0.51019287109375, 0.5304031372070312, 0.5506134033203125, 0.5708236694335938, 0.591033935546875, 0.6112442016601562, 0.6314544677734375, 0.6516647338867188, 0.671875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 3.0, 4.0, 13.0, 10.0, 14.0, 16.0, 13.0, 24.0, 23.0, 29.0, 25.0, 30.0, 32.0, 33.0, 41.0, 40.0, 43.0, 41.0, 44.0, 1075.0, 38.0, 43.0, 43.0, 35.0, 46.0, 25.0, 38.0, 21.0, 23.0, 32.0, 27.0, 16.0, 10.0, 14.0, 15.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0751953125, -1.0427398681640625, -1.010284423828125, -0.9778289794921875, -0.94537353515625, -0.9129180908203125, -0.880462646484375, -0.8480072021484375, -0.8155517578125, -0.7830963134765625, -0.750640869140625, -0.7181854248046875, -0.68572998046875, -0.6532745361328125, -0.620819091796875, -0.5883636474609375, -0.555908203125, -0.5234527587890625, -0.490997314453125, -0.4585418701171875, -0.42608642578125, -0.3936309814453125, -0.361175537109375, -0.3287200927734375, -0.2962646484375, -0.2638092041015625, -0.231353759765625, -0.1988983154296875, -0.16644287109375, -0.1339874267578125, -0.101531982421875, -0.0690765380859375, -0.03662109375, -0.0041656494140625, 0.028289794921875, 0.0607452392578125, 0.09320068359375, 0.1256561279296875, 0.158111572265625, 0.1905670166015625, 0.2230224609375, 0.2554779052734375, 0.287933349609375, 0.3203887939453125, 0.35284423828125, 0.3852996826171875, 0.417755126953125, 0.4502105712890625, 0.482666015625, 0.5151214599609375, 0.547576904296875, 0.5800323486328125, 0.61248779296875, 0.6449432373046875, 0.677398681640625, 0.7098541259765625, 0.7423095703125, 0.7747650146484375, 0.807220458984375, 0.8396759033203125, 0.87213134765625, 0.9045867919921875, 0.937042236328125, 0.9694976806640625, 1.001953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 18.0, 8.0, 19.0, 17.0, 27.0, 38.0, 58.0, 75.0, 133.0, 176.0, 269.0, 395.0, 554.0, 787.0, 1112.0, 1637.0, 2394.0, 3290.0, 4898.0, 7296.0, 10887.0, 16828.0, 30406.0, 97177.0, 1360538.0, 428095.0, 61016.0, 24392.0, 14692.0, 9414.0, 6463.0, 4323.0, 2975.0, 1984.0, 1421.0, 1054.0, 680.0, 472.0, 319.0, 246.0, 162.0, 114.0, 89.0, 56.0, 42.0, 31.0, 18.0, 11.0, 9.0, 6.0, 8.0, 0.0, 0.0, 6.0, 1.0, 2.0], "bins": [-0.9150390625, -0.887176513671875, -0.85931396484375, -0.831451416015625, -0.8035888671875, -0.775726318359375, -0.74786376953125, -0.720001220703125, -0.692138671875, -0.664276123046875, -0.63641357421875, -0.608551025390625, -0.5806884765625, -0.552825927734375, -0.52496337890625, -0.497100830078125, -0.46923828125, -0.441375732421875, -0.41351318359375, -0.385650634765625, -0.3577880859375, -0.329925537109375, -0.30206298828125, -0.274200439453125, -0.246337890625, -0.218475341796875, -0.19061279296875, -0.162750244140625, -0.1348876953125, -0.107025146484375, -0.07916259765625, -0.051300048828125, -0.0234375, 0.004425048828125, 0.03228759765625, 0.060150146484375, 0.0880126953125, 0.115875244140625, 0.14373779296875, 0.171600341796875, 0.199462890625, 0.227325439453125, 0.25518798828125, 0.283050537109375, 0.3109130859375, 0.338775634765625, 0.36663818359375, 0.394500732421875, 0.42236328125, 0.450225830078125, 0.47808837890625, 0.505950927734375, 0.5338134765625, 0.561676025390625, 0.58953857421875, 0.617401123046875, 0.645263671875, 0.673126220703125, 0.70098876953125, 0.728851318359375, 0.7567138671875, 0.784576416015625, 0.81243896484375, 0.840301513671875, 0.8681640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 3.0, 2.0, 10.0, 8.0, 9.0, 15.0, 16.0, 19.0, 24.0, 24.0, 17.0, 29.0, 30.0, 40.0, 39.0, 52.0, 44.0, 51.0, 62.0, 50.0, 49.0, 57.0, 38.0, 51.0, 35.0, 28.0, 32.0, 27.0, 23.0, 17.0, 19.0, 14.0, 8.0, 3.0, 11.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.096923828125, -0.09407997131347656, -0.09123611450195312, -0.08839225769042969, -0.08554840087890625, -0.08270454406738281, -0.07986068725585938, -0.07701683044433594, -0.0741729736328125, -0.07132911682128906, -0.06848526000976562, -0.06564140319824219, -0.06279754638671875, -0.05995368957519531, -0.057109832763671875, -0.05426597595214844, -0.051422119140625, -0.04857826232910156, -0.045734405517578125, -0.04289054870605469, -0.04004669189453125, -0.03720283508300781, -0.034358978271484375, -0.03151512145996094, -0.0286712646484375, -0.025827407836914062, -0.022983551025390625, -0.020139694213867188, -0.01729583740234375, -0.014451980590820312, -0.011608123779296875, -0.008764266967773438, -0.00592041015625, -0.0030765533447265625, -0.000232696533203125, 0.0026111602783203125, 0.00545501708984375, 0.008298873901367188, 0.011142730712890625, 0.013986587524414062, 0.0168304443359375, 0.019674301147460938, 0.022518157958984375, 0.025362014770507812, 0.02820587158203125, 0.031049728393554688, 0.033893585205078125, 0.03673744201660156, 0.039581298828125, 0.04242515563964844, 0.045269012451171875, 0.04811286926269531, 0.05095672607421875, 0.05380058288574219, 0.056644439697265625, 0.05948829650878906, 0.0623321533203125, 0.06517601013183594, 0.06801986694335938, 0.07086372375488281, 0.07370758056640625, 0.07655143737792969, 0.07939529418945312, 0.08223915100097656, 0.0850830078125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 4.0, 4.0, 10.0, 11.0, 18.0, 20.0, 36.0, 50.0, 69.0, 86.0, 139.0, 225.0, 307.0, 874.0, 7375.0, 373159.0, 652254.0, 11751.0, 1052.0, 403.0, 211.0, 151.0, 92.0, 64.0, 51.0, 23.0, 31.0, 22.0, 15.0, 7.0, 12.0, 8.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5576171875, -1.50213623046875, -1.4466552734375, -1.39117431640625, -1.335693359375, -1.28021240234375, -1.2247314453125, -1.16925048828125, -1.11376953125, -1.05828857421875, -1.0028076171875, -0.94732666015625, -0.891845703125, -0.83636474609375, -0.7808837890625, -0.72540283203125, -0.669921875, -0.61444091796875, -0.5589599609375, -0.50347900390625, -0.447998046875, -0.39251708984375, -0.3370361328125, -0.28155517578125, -0.22607421875, -0.17059326171875, -0.1151123046875, -0.05963134765625, -0.004150390625, 0.05133056640625, 0.1068115234375, 0.16229248046875, 0.2177734375, 0.27325439453125, 0.3287353515625, 0.38421630859375, 0.439697265625, 0.49517822265625, 0.5506591796875, 0.60614013671875, 0.66162109375, 0.71710205078125, 0.7725830078125, 0.82806396484375, 0.883544921875, 0.93902587890625, 0.9945068359375, 1.04998779296875, 1.10546875, 1.16094970703125, 1.2164306640625, 1.27191162109375, 1.327392578125, 1.38287353515625, 1.4383544921875, 1.49383544921875, 1.54931640625, 1.60479736328125, 1.6602783203125, 1.71575927734375, 1.771240234375, 1.82672119140625, 1.8822021484375, 1.93768310546875, 1.9931640625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 28.0, 78.0, 281.0, 417.0, 146.0, 45.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.656111478805542, -3.5602521896362305, -3.464393138885498, -3.3685338497161865, -3.272674560546875, -3.1768155097961426, -3.080956220626831, -2.9850969314575195, -2.889237880706787, -2.7933785915374756, -2.697519540786743, -2.6016602516174316, -2.50580096244812, -2.4099416732788086, -2.314082622528076, -2.2182233333587646, -2.122364044189453, -2.0265047550201416, -1.9306455850601196, -1.8347864151000977, -1.7389271259307861, -1.6430679559707642, -1.5472087860107422, -1.4513494968414307, -1.3554903268814087, -1.2596311569213867, -1.1637718677520752, -1.0679126977920532, -0.9720534682273865, -0.8761942386627197, -0.7803350687026978, -0.684475839138031, -0.5886166095733643, -0.4927573800086975, -0.39689818024635315, -0.3010389804840088, -0.20517975091934204, -0.10932052135467529, -0.01346135139465332, 0.08239787817001343, 0.17825710773468018, 0.2741163372993469, 0.3699755370616913, 0.46583473682403564, 0.5616939663887024, 0.6575531959533691, 0.7534123659133911, 0.8492715954780579, 0.9451308250427246, 1.0409899950027466, 1.136849284172058, 1.23270845413208, 1.3285677433013916, 1.4244269132614136, 1.5202860832214355, 1.616145372390747, 1.712004542350769, 1.807863712310791, 1.9037230014801025, 1.9995821714401245, 2.0954413414001465, 2.191300630569458, 2.2871599197387695, 2.383018970489502, 2.4788782596588135]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 4.0, 12.0, 6.0, 9.0, 18.0, 14.0, 13.0, 16.0, 23.0, 24.0, 32.0, 28.0, 34.0, 30.0, 40.0, 42.0, 45.0, 55.0, 43.0, 40.0, 43.0, 35.0, 31.0, 35.0, 33.0, 32.0, 37.0, 23.0, 31.0, 33.0, 18.0, 20.0, 15.0, 15.0, 8.0, 11.0, 9.0, 6.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.5994930267333984, -0.582394540309906, -0.5652959942817688, -0.5481975078582764, -0.5310989618301392, -0.5140004754066467, -0.4969019591808319, -0.4798034429550171, -0.46270492672920227, -0.44560641050338745, -0.42850789427757263, -0.4114093780517578, -0.3943108916282654, -0.3772123456001282, -0.36011385917663574, -0.3430153429508209, -0.3259168267250061, -0.3088183104991913, -0.29171979427337646, -0.27462127804756165, -0.2575227618217468, -0.2404242604970932, -0.22332575917243958, -0.20622724294662476, -0.18912872672080994, -0.17203021049499512, -0.1549316942691803, -0.13783319294452667, -0.12073467671871185, -0.10363616049289703, -0.08653765171766281, -0.06943914294242859, -0.05234062671661377, -0.03524211421608925, -0.018143601715564728, -0.001045089215040207, 0.016053423285484314, 0.03315193951129913, 0.050250448286533356, 0.06734895706176758, 0.0844474732875824, 0.10154598951339722, 0.11864449828863144, 0.13574300706386566, 0.15284152328968048, 0.1699400395154953, 0.18703854084014893, 0.20413705706596375, 0.22123557329177856, 0.23833408951759338, 0.2554326057434082, 0.272531121969223, 0.28962963819503784, 0.3067281246185303, 0.3238266408443451, 0.3409251570701599, 0.35802367329597473, 0.37512218952178955, 0.39222070574760437, 0.4093192219734192, 0.4264177083969116, 0.44351625442504883, 0.46061474084854126, 0.4777132570743561, 0.4948117733001709]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 7.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 13.0, 20.0, 30.0, 19.0, 31.0, 21.0, 37.0, 34.0, 37.0, 41.0, 32.0, 49.0, 43.0, 41.0, 47.0, 49.0, 40.0, 40.0, 45.0, 49.0, 40.0, 33.0, 44.0, 21.0, 16.0, 22.0, 15.0, 10.0, 8.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96875, -0.9354248046875, -0.902099609375, -0.8687744140625, -0.83544921875, -0.8021240234375, -0.768798828125, -0.7354736328125, -0.7021484375, -0.6688232421875, -0.635498046875, -0.6021728515625, -0.56884765625, -0.5355224609375, -0.502197265625, -0.4688720703125, -0.435546875, -0.4022216796875, -0.368896484375, -0.3355712890625, -0.30224609375, -0.2689208984375, -0.235595703125, -0.2022705078125, -0.1689453125, -0.1356201171875, -0.102294921875, -0.0689697265625, -0.03564453125, -0.0023193359375, 0.031005859375, 0.0643310546875, 0.09765625, 0.1309814453125, 0.164306640625, 0.1976318359375, 0.23095703125, 0.2642822265625, 0.297607421875, 0.3309326171875, 0.3642578125, 0.3975830078125, 0.430908203125, 0.4642333984375, 0.49755859375, 0.5308837890625, 0.564208984375, 0.5975341796875, 0.630859375, 0.6641845703125, 0.697509765625, 0.7308349609375, 0.76416015625, 0.7974853515625, 0.830810546875, 0.8641357421875, 0.8974609375, 0.9307861328125, 0.964111328125, 0.9974365234375, 1.03076171875, 1.0640869140625, 1.097412109375, 1.1307373046875, 1.1640625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 13.0, 19.0, 25.0, 50.0, 55.0, 103.0, 157.0, 221.0, 357.0, 596.0, 992.0, 1591.0, 2735.0, 5050.0, 9717.0, 23035.0, 67715.0, 257324.0, 463169.0, 142015.0, 41156.0, 15790.0, 7183.0, 3918.0, 2208.0, 1223.0, 798.0, 483.0, 289.0, 193.0, 112.0, 87.0, 55.0, 35.0, 24.0, 14.0, 15.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5534210205078125, -1.496490478515625, -1.4395599365234375, -1.38262939453125, -1.3256988525390625, -1.268768310546875, -1.2118377685546875, -1.1549072265625, -1.0979766845703125, -1.041046142578125, -0.9841156005859375, -0.92718505859375, -0.8702545166015625, -0.813323974609375, -0.7563934326171875, -0.699462890625, -0.6425323486328125, -0.585601806640625, -0.5286712646484375, -0.47174072265625, -0.4148101806640625, -0.357879638671875, -0.3009490966796875, -0.2440185546875, -0.1870880126953125, -0.130157470703125, -0.0732269287109375, -0.01629638671875, 0.0406341552734375, 0.097564697265625, 0.1544952392578125, 0.21142578125, 0.2683563232421875, 0.325286865234375, 0.3822174072265625, 0.43914794921875, 0.4960784912109375, 0.553009033203125, 0.6099395751953125, 0.6668701171875, 0.7238006591796875, 0.780731201171875, 0.8376617431640625, 0.89459228515625, 0.9515228271484375, 1.008453369140625, 1.0653839111328125, 1.122314453125, 1.1792449951171875, 1.236175537109375, 1.2931060791015625, 1.35003662109375, 1.4069671630859375, 1.463897705078125, 1.5208282470703125, 1.5777587890625, 1.6346893310546875, 1.691619873046875, 1.7485504150390625, 1.80548095703125, 1.8624114990234375, 1.919342041015625, 1.9762725830078125, 2.033203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 10.0, 13.0, 11.0, 13.0, 25.0, 28.0, 12.0, 32.0, 20.0, 36.0, 30.0, 31.0, 50.0, 64.0, 78.0, 143.0, 239.0, 1362.0, 196.0, 147.0, 73.0, 59.0, 44.0, 50.0, 45.0, 26.0, 30.0, 23.0, 16.0, 16.0, 15.0, 16.0, 12.0, 13.0, 7.0, 9.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.625, -3.516693115234375, -3.40838623046875, -3.300079345703125, -3.1917724609375, -3.083465576171875, -2.97515869140625, -2.866851806640625, -2.758544921875, -2.650238037109375, -2.54193115234375, -2.433624267578125, -2.3253173828125, -2.217010498046875, -2.10870361328125, -2.000396728515625, -1.89208984375, -1.783782958984375, -1.67547607421875, -1.567169189453125, -1.4588623046875, -1.350555419921875, -1.24224853515625, -1.133941650390625, -1.025634765625, -0.917327880859375, -0.80902099609375, -0.700714111328125, -0.5924072265625, -0.484100341796875, -0.37579345703125, -0.267486572265625, -0.1591796875, -0.050872802734375, 0.05743408203125, 0.165740966796875, 0.2740478515625, 0.382354736328125, 0.49066162109375, 0.598968505859375, 0.707275390625, 0.815582275390625, 0.92388916015625, 1.032196044921875, 1.1405029296875, 1.248809814453125, 1.35711669921875, 1.465423583984375, 1.57373046875, 1.682037353515625, 1.79034423828125, 1.898651123046875, 2.0069580078125, 2.115264892578125, 2.22357177734375, 2.331878662109375, 2.440185546875, 2.548492431640625, 2.65679931640625, 2.765106201171875, 2.8734130859375, 2.981719970703125, 3.09002685546875, 3.198333740234375, 3.306640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 7.0, 14.0, 10.0, 20.0, 22.0, 21.0, 32.0, 41.0, 60.0, 92.0, 154.0, 268.0, 424.0, 850.0, 1761.0, 3741.0, 9865.0, 32905.0, 204838.0, 2303098.0, 507858.0, 55198.0, 14339.0, 5381.0, 2254.0, 1052.0, 541.0, 297.0, 158.0, 99.0, 73.0, 48.0, 42.0, 26.0, 20.0, 19.0, 12.0, 17.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.892578125, -3.765655517578125, -3.63873291015625, -3.511810302734375, -3.3848876953125, -3.257965087890625, -3.13104248046875, -3.004119873046875, -2.877197265625, -2.750274658203125, -2.62335205078125, -2.496429443359375, -2.3695068359375, -2.242584228515625, -2.11566162109375, -1.988739013671875, -1.86181640625, -1.734893798828125, -1.60797119140625, -1.481048583984375, -1.3541259765625, -1.227203369140625, -1.10028076171875, -0.973358154296875, -0.846435546875, -0.719512939453125, -0.59259033203125, -0.465667724609375, -0.3387451171875, -0.211822509765625, -0.08489990234375, 0.042022705078125, 0.1689453125, 0.295867919921875, 0.42279052734375, 0.549713134765625, 0.6766357421875, 0.803558349609375, 0.93048095703125, 1.057403564453125, 1.184326171875, 1.311248779296875, 1.43817138671875, 1.565093994140625, 1.6920166015625, 1.818939208984375, 1.94586181640625, 2.072784423828125, 2.19970703125, 2.326629638671875, 2.45355224609375, 2.580474853515625, 2.7073974609375, 2.834320068359375, 2.96124267578125, 3.088165283203125, 3.215087890625, 3.342010498046875, 3.46893310546875, 3.595855712890625, 3.7227783203125, 3.849700927734375, 3.97662353515625, 4.103546142578125, 4.23046875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 82.0, 669.0, 249.0, 10.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.73983001708984, -111.76908874511719, -109.79834747314453, -107.82760620117188, -105.85686492919922, -103.88612365722656, -101.9153823852539, -99.94464111328125, -97.9738998413086, -96.00315856933594, -94.03241729736328, -92.06167602539062, -90.09093475341797, -88.12019348144531, -86.14945220947266, -84.1787109375, -82.20796966552734, -80.23722839355469, -78.26648712158203, -76.29574584960938, -74.32500457763672, -72.35426330566406, -70.3835220336914, -68.41278076171875, -66.4420394897461, -64.47129821777344, -62.50055694580078, -60.529815673828125, -58.55907440185547, -56.58833312988281, -54.617591857910156, -52.6468505859375, -50.67610549926758, -48.70536422729492, -46.734622955322266, -44.76388168334961, -42.79314041137695, -40.8223991394043, -38.85165786743164, -36.880916595458984, -34.91017532348633, -32.93943405151367, -30.968692779541016, -28.99795150756836, -27.027210235595703, -25.056468963623047, -23.08572769165039, -21.114986419677734, -19.144245147705078, -17.173503875732422, -15.202762603759766, -13.23202133178711, -11.261280059814453, -9.290538787841797, -7.319797515869141, -5.349056243896484, -3.3783159255981445, -1.4075746536254883, 0.563166618347168, 2.533907890319824, 4.5046491622924805, 6.475390434265137, 8.446131706237793, 10.41687297821045, 12.387614250183105]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 9.0, 6.0, 9.0, 4.0, 12.0, 21.0, 9.0, 20.0, 20.0, 26.0, 32.0, 24.0, 39.0, 33.0, 39.0, 43.0, 35.0, 36.0, 44.0, 33.0, 44.0, 44.0, 38.0, 37.0, 32.0, 32.0, 42.0, 30.0, 36.0, 24.0, 28.0, 21.0, 24.0, 8.0, 12.0, 11.0, 9.0, 6.0, 5.0, 10.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.440852165222168, -12.071533203125, -11.702214241027832, -11.332895278930664, -10.963577270507812, -10.594258308410645, -10.224939346313477, -9.855620384216309, -9.48630142211914, -9.116982460021973, -8.747663497924805, -8.378344535827637, -8.009025573730469, -7.639707088470459, -7.270388603210449, -6.901069641113281, -6.531750679016113, -6.162431716918945, -5.793112754821777, -5.423794269561768, -5.0544753074646, -4.685156345367432, -4.315837860107422, -3.946518898010254, -3.577199935913086, -3.207880973815918, -2.838562250137329, -2.4692435264587402, -2.0999245643615723, -1.7306057214736938, -1.3612868785858154, -0.9919681549072266, -0.6226482391357422, -0.25332939624786377, 0.11598944664001465, 0.48530828952789307, 0.8546271324157715, 1.22394597530365, 1.5932648181915283, 1.9625835418701172, 2.331902503967285, 2.701221466064453, 3.070540189743042, 3.439858913421631, 3.809177875518799, 4.178496837615967, 4.547815322875977, 4.9171342849731445, 5.2864532470703125, 5.6557722091674805, 6.025091171264648, 6.394409656524658, 6.763728618621826, 7.133047580718994, 7.502366065979004, 7.871685028076172, 8.24100399017334, 8.610322952270508, 8.979641914367676, 9.348960876464844, 9.718278884887695, 10.087597846984863, 10.456916809082031, 10.8262357711792, 11.195554733276367]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 11.0, 15.0, 19.0, 25.0, 27.0, 21.0, 38.0, 29.0, 30.0, 33.0, 40.0, 38.0, 45.0, 43.0, 44.0, 47.0, 46.0, 41.0, 44.0, 51.0, 41.0, 32.0, 33.0, 30.0, 15.0, 17.0, 12.0, 14.0, 21.0, 9.0, 9.0, 9.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0078125, -0.97503662109375, -0.9422607421875, -0.90948486328125, -0.876708984375, -0.84393310546875, -0.8111572265625, -0.77838134765625, -0.74560546875, -0.71282958984375, -0.6800537109375, -0.64727783203125, -0.614501953125, -0.58172607421875, -0.5489501953125, -0.51617431640625, -0.4833984375, -0.45062255859375, -0.4178466796875, -0.38507080078125, -0.352294921875, -0.31951904296875, -0.2867431640625, -0.25396728515625, -0.22119140625, -0.18841552734375, -0.1556396484375, -0.12286376953125, -0.090087890625, -0.05731201171875, -0.0245361328125, 0.00823974609375, 0.041015625, 0.07379150390625, 0.1065673828125, 0.13934326171875, 0.172119140625, 0.20489501953125, 0.2376708984375, 0.27044677734375, 0.30322265625, 0.33599853515625, 0.3687744140625, 0.40155029296875, 0.434326171875, 0.46710205078125, 0.4998779296875, 0.53265380859375, 0.5654296875, 0.59820556640625, 0.6309814453125, 0.66375732421875, 0.696533203125, 0.72930908203125, 0.7620849609375, 0.79486083984375, 0.82763671875, 0.86041259765625, 0.8931884765625, 0.92596435546875, 0.958740234375, 0.99151611328125, 1.0242919921875, 1.05706787109375, 1.08984375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 13.0, 16.0, 29.0, 48.0, 52.0, 91.0, 107.0, 147.0, 193.0, 313.0, 457.0, 688.0, 1040.0, 1656.0, 2636.0, 4007.0, 7034.0, 12270.0, 23191.0, 50251.0, 150293.0, 769396.0, 2213201.0, 726171.0, 134561.0, 46485.0, 21691.0, 11340.0, 6365.0, 3867.0, 2316.0, 1469.0, 975.0, 625.0, 406.0, 279.0, 195.0, 131.0, 83.0, 62.0, 45.0, 31.0, 19.0, 13.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7407379150390625, -1.681671142578125, -1.6226043701171875, -1.56353759765625, -1.5044708251953125, -1.445404052734375, -1.3863372802734375, -1.3272705078125, -1.2682037353515625, -1.209136962890625, -1.1500701904296875, -1.09100341796875, -1.0319366455078125, -0.972869873046875, -0.9138031005859375, -0.854736328125, -0.7956695556640625, -0.736602783203125, -0.6775360107421875, -0.61846923828125, -0.5594024658203125, -0.500335693359375, -0.4412689208984375, -0.3822021484375, -0.3231353759765625, -0.264068603515625, -0.2050018310546875, -0.14593505859375, -0.0868682861328125, -0.027801513671875, 0.0312652587890625, 0.09033203125, 0.1493988037109375, 0.208465576171875, 0.2675323486328125, 0.32659912109375, 0.3856658935546875, 0.444732666015625, 0.5037994384765625, 0.5628662109375, 0.6219329833984375, 0.680999755859375, 0.7400665283203125, 0.79913330078125, 0.8582000732421875, 0.917266845703125, 0.9763336181640625, 1.035400390625, 1.0944671630859375, 1.153533935546875, 1.2126007080078125, 1.27166748046875, 1.3307342529296875, 1.389801025390625, 1.4488677978515625, 1.5079345703125, 1.5670013427734375, 1.626068115234375, 1.6851348876953125, 1.74420166015625, 1.8032684326171875, 1.862335205078125, 1.9214019775390625, 1.98046875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 19.0, 12.0, 22.0, 30.0, 41.0, 58.0, 94.0, 136.0, 224.0, 360.0, 523.0, 732.0, 598.0, 412.0, 263.0, 171.0, 111.0, 68.0, 64.0, 35.0, 26.0, 18.0, 12.0, 4.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.2109375, -4.104766845703125, -3.99859619140625, -3.892425537109375, -3.7862548828125, -3.680084228515625, -3.57391357421875, -3.467742919921875, -3.361572265625, -3.255401611328125, -3.14923095703125, -3.043060302734375, -2.9368896484375, -2.830718994140625, -2.72454833984375, -2.618377685546875, -2.51220703125, -2.406036376953125, -2.29986572265625, -2.193695068359375, -2.0875244140625, -1.981353759765625, -1.87518310546875, -1.769012451171875, -1.662841796875, -1.556671142578125, -1.45050048828125, -1.344329833984375, -1.2381591796875, -1.131988525390625, -1.02581787109375, -0.919647216796875, -0.8134765625, -0.707305908203125, -0.60113525390625, -0.494964599609375, -0.3887939453125, -0.282623291015625, -0.17645263671875, -0.070281982421875, 0.035888671875, 0.142059326171875, 0.24822998046875, 0.354400634765625, 0.4605712890625, 0.566741943359375, 0.67291259765625, 0.779083251953125, 0.88525390625, 0.991424560546875, 1.09759521484375, 1.203765869140625, 1.3099365234375, 1.416107177734375, 1.52227783203125, 1.628448486328125, 1.734619140625, 1.840789794921875, 1.94696044921875, 2.053131103515625, 2.1593017578125, 2.265472412109375, 2.37164306640625, 2.477813720703125, 2.583984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 7.0, 16.0, 22.0, 18.0, 35.0, 50.0, 61.0, 100.0, 191.0, 334.0, 591.0, 1238.0, 2586.0, 6091.0, 15722.0, 48124.0, 209905.0, 2057751.0, 1609329.0, 175012.0, 42706.0, 14157.0, 5472.0, 2316.0, 1071.0, 573.0, 275.0, 152.0, 128.0, 81.0, 50.0, 32.0, 22.0, 13.0, 10.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.76129150390625, -3.6163330078125, -3.47137451171875, -3.326416015625, -3.18145751953125, -3.0364990234375, -2.89154052734375, -2.74658203125, -2.60162353515625, -2.4566650390625, -2.31170654296875, -2.166748046875, -2.02178955078125, -1.8768310546875, -1.73187255859375, -1.5869140625, -1.44195556640625, -1.2969970703125, -1.15203857421875, -1.007080078125, -0.86212158203125, -0.7171630859375, -0.57220458984375, -0.42724609375, -0.28228759765625, -0.1373291015625, 0.00762939453125, 0.152587890625, 0.29754638671875, 0.4425048828125, 0.58746337890625, 0.732421875, 0.87738037109375, 1.0223388671875, 1.16729736328125, 1.312255859375, 1.45721435546875, 1.6021728515625, 1.74713134765625, 1.89208984375, 2.03704833984375, 2.1820068359375, 2.32696533203125, 2.471923828125, 2.61688232421875, 2.7618408203125, 2.90679931640625, 3.0517578125, 3.19671630859375, 3.3416748046875, 3.48663330078125, 3.631591796875, 3.77655029296875, 3.9215087890625, 4.06646728515625, 4.21142578125, 4.35638427734375, 4.5013427734375, 4.64630126953125, 4.791259765625, 4.93621826171875, 5.0811767578125, 5.22613525390625, 5.37109375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 20.0, 54.0, 119.0, 223.0, 229.0, 194.0, 94.0, 45.0, 12.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.313840866088867, -15.250967979431152, -14.188094139099121, -13.125221252441406, -12.062347412109375, -10.99947452545166, -9.936601638793945, -8.873727798461914, -7.810854911804199, -6.747981548309326, -5.685108184814453, -4.622235298156738, -3.5593619346618652, -2.496488571166992, -1.4336156845092773, -0.3707423210144043, 0.6921310424804688, 1.7550042867660522, 2.8178775310516357, 3.8807506561279297, 4.943624019622803, 6.006497383117676, 7.069370269775391, 8.132244110107422, 9.195116996765137, 10.257989883422852, 11.320863723754883, 12.383736610412598, 13.446609497070312, 14.509483337402344, 15.572356224060059, 16.635229110717773, 17.698101043701172, 18.760974884033203, 19.8238468170166, 20.886720657348633, 21.949594497680664, 23.012466430664062, 24.075340270996094, 25.138214111328125, 26.201087951660156, 27.263961791992188, 28.326833724975586, 29.389707565307617, 30.45258140563965, 31.515453338623047, 32.57832717895508, 33.64120101928711, 34.704071044921875, 35.766944885253906, 36.82981872558594, 37.89269256591797, 38.955562591552734, 40.018436431884766, 41.0813102722168, 42.14418411254883, 43.20705795288086, 44.26993179321289, 45.33280563354492, 46.39567565917969, 47.45854949951172, 48.52142333984375, 49.58429718017578, 50.64717102050781, 51.710044860839844]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 4.0, 4.0, 13.0, 15.0, 9.0, 13.0, 12.0, 13.0, 16.0, 17.0, 21.0, 28.0, 37.0, 48.0, 34.0, 39.0, 31.0, 22.0, 42.0, 53.0, 32.0, 32.0, 36.0, 30.0, 37.0, 41.0, 29.0, 25.0, 32.0, 27.0, 24.0, 18.0, 24.0, 18.0, 24.0, 18.0, 13.0, 8.0, 10.0, 10.0, 9.0, 2.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.24605941772461, -7.991235733032227, -7.7364115715026855, -7.4815874099731445, -7.226763725280762, -6.971940040588379, -6.717115879058838, -6.462291717529297, -6.207468032836914, -5.952644348144531, -5.69782018661499, -5.442996025085449, -5.188172340393066, -4.933348655700684, -4.678524494171143, -4.423700332641602, -4.168876647949219, -3.914052724838257, -3.659228801727295, -3.404404878616333, -3.149580955505371, -2.894757032394409, -2.6399331092834473, -2.3851091861724854, -2.1302852630615234, -1.8754613399505615, -1.6206374168395996, -1.3658134937286377, -1.1109895706176758, -0.8561656475067139, -0.601341724395752, -0.34651780128479004, -0.09169387817382812, 0.1631300449371338, 0.4179539680480957, 0.6727778911590576, 0.9276018142700195, 1.1824257373809814, 1.4372496604919434, 1.6920735836029053, 1.9468975067138672, 2.201721429824829, 2.456545352935791, 2.711369276046753, 2.966193199157715, 3.2210171222686768, 3.4758410453796387, 3.7306649684906006, 3.9854888916015625, 4.240312576293945, 4.495136737823486, 4.749960899353027, 5.00478458404541, 5.259608268737793, 5.514432430267334, 5.769256591796875, 6.024080276489258, 6.278903961181641, 6.533728122711182, 6.788552284240723, 7.0433759689331055, 7.298199653625488, 7.553023815155029, 7.80784797668457, 8.062671661376953]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 14.0, 9.0, 14.0, 21.0, 27.0, 17.0, 25.0, 30.0, 34.0, 22.0, 44.0, 39.0, 52.0, 36.0, 43.0, 48.0, 46.0, 49.0, 50.0, 40.0, 43.0, 39.0, 35.0, 36.0, 28.0, 17.0, 22.0, 25.0, 11.0, 12.0, 14.0, 8.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0673828125, -1.0327911376953125, -0.998199462890625, -0.9636077880859375, -0.92901611328125, -0.8944244384765625, -0.859832763671875, -0.8252410888671875, -0.7906494140625, -0.7560577392578125, -0.721466064453125, -0.6868743896484375, -0.65228271484375, -0.6176910400390625, -0.583099365234375, -0.5485076904296875, -0.513916015625, -0.4793243408203125, -0.444732666015625, -0.4101409912109375, -0.37554931640625, -0.3409576416015625, -0.306365966796875, -0.2717742919921875, -0.2371826171875, -0.2025909423828125, -0.167999267578125, -0.1334075927734375, -0.09881591796875, -0.0642242431640625, -0.029632568359375, 0.0049591064453125, 0.03955078125, 0.0741424560546875, 0.108734130859375, 0.1433258056640625, 0.17791748046875, 0.2125091552734375, 0.247100830078125, 0.2816925048828125, 0.3162841796875, 0.3508758544921875, 0.385467529296875, 0.4200592041015625, 0.45465087890625, 0.4892425537109375, 0.523834228515625, 0.5584259033203125, 0.593017578125, 0.6276092529296875, 0.662200927734375, 0.6967926025390625, 0.73138427734375, 0.7659759521484375, 0.800567626953125, 0.8351593017578125, 0.8697509765625, 0.9043426513671875, 0.938934326171875, 0.9735260009765625, 1.00811767578125, 1.0427093505859375, 1.077301025390625, 1.1118927001953125, 1.146484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 10.0, 10.0, 19.0, 30.0, 52.0, 67.0, 84.0, 153.0, 217.0, 342.0, 521.0, 806.0, 1256.0, 2036.0, 2970.0, 4833.0, 7401.0, 11749.0, 18184.0, 27838.0, 42350.0, 62038.0, 87171.0, 113428.0, 131661.0, 133223.0, 116542.0, 90171.0, 65845.0, 44564.0, 29276.0, 19355.0, 12174.0, 7930.0, 5130.0, 3251.0, 2056.0, 1373.0, 869.0, 530.0, 364.0, 231.0, 130.0, 87.0, 77.0, 51.0, 30.0, 25.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-0.72705078125, -0.704376220703125, -0.68170166015625, -0.659027099609375, -0.6363525390625, -0.613677978515625, -0.59100341796875, -0.568328857421875, -0.545654296875, -0.522979736328125, -0.50030517578125, -0.477630615234375, -0.4549560546875, -0.432281494140625, -0.40960693359375, -0.386932373046875, -0.3642578125, -0.341583251953125, -0.31890869140625, -0.296234130859375, -0.2735595703125, -0.250885009765625, -0.22821044921875, -0.205535888671875, -0.182861328125, -0.160186767578125, -0.13751220703125, -0.114837646484375, -0.0921630859375, -0.069488525390625, -0.04681396484375, -0.024139404296875, -0.00146484375, 0.021209716796875, 0.04388427734375, 0.066558837890625, 0.0892333984375, 0.111907958984375, 0.13458251953125, 0.157257080078125, 0.179931640625, 0.202606201171875, 0.22528076171875, 0.247955322265625, 0.2706298828125, 0.293304443359375, 0.31597900390625, 0.338653564453125, 0.361328125, 0.384002685546875, 0.40667724609375, 0.429351806640625, 0.4520263671875, 0.474700927734375, 0.49737548828125, 0.520050048828125, 0.542724609375, 0.565399169921875, 0.58807373046875, 0.610748291015625, 0.6334228515625, 0.656097412109375, 0.67877197265625, 0.701446533203125, 0.72412109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 16.0, 10.0, 20.0, 13.0, 16.0, 22.0, 19.0, 45.0, 29.0, 33.0, 34.0, 38.0, 43.0, 37.0, 43.0, 47.0, 1077.0, 50.0, 36.0, 36.0, 53.0, 43.0, 33.0, 34.0, 20.0, 26.0, 25.0, 11.0, 17.0, 14.0, 19.0, 4.0, 12.0, 13.0, 5.0, 3.0, 1.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8901596069335938, -0.8569793701171875, -0.8237991333007812, -0.790618896484375, -0.7574386596679688, -0.7242584228515625, -0.6910781860351562, -0.65789794921875, -0.6247177124023438, -0.5915374755859375, -0.5583572387695312, -0.525177001953125, -0.49199676513671875, -0.4588165283203125, -0.42563629150390625, -0.3924560546875, -0.35927581787109375, -0.3260955810546875, -0.29291534423828125, -0.259735107421875, -0.22655487060546875, -0.1933746337890625, -0.16019439697265625, -0.12701416015625, -0.09383392333984375, -0.0606536865234375, -0.02747344970703125, 0.005706787109375, 0.03888702392578125, 0.0720672607421875, 0.10524749755859375, 0.138427734375, 0.17160797119140625, 0.2047882080078125, 0.23796844482421875, 0.271148681640625, 0.30432891845703125, 0.3375091552734375, 0.37068939208984375, 0.40386962890625, 0.43704986572265625, 0.4702301025390625, 0.5034103393554688, 0.536590576171875, 0.5697708129882812, 0.6029510498046875, 0.6361312866210938, 0.6693115234375, 0.7024917602539062, 0.7356719970703125, 0.7688522338867188, 0.802032470703125, 0.8352127075195312, 0.8683929443359375, 0.9015731811523438, 0.93475341796875, 0.9679336547851562, 1.0011138916015625, 1.0342941284179688, 1.067474365234375, 1.1006546020507812, 1.1338348388671875, 1.1670150756835938, 1.2001953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 16.0, 16.0, 25.0, 34.0, 59.0, 73.0, 103.0, 152.0, 222.0, 305.0, 426.0, 583.0, 841.0, 1228.0, 1766.0, 2641.0, 3779.0, 5594.0, 7973.0, 12322.0, 19533.0, 39667.0, 183794.0, 1562573.0, 160041.0, 37547.0, 18832.0, 11784.0, 7902.0, 5336.0, 3701.0, 2609.0, 1692.0, 1172.0, 840.0, 565.0, 381.0, 289.0, 194.0, 133.0, 103.0, 86.0, 52.0, 28.0, 33.0, 17.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.9970703125, -0.9672775268554688, -0.9374847412109375, -0.9076919555664062, -0.877899169921875, -0.8481063842773438, -0.8183135986328125, -0.7885208129882812, -0.75872802734375, -0.7289352416992188, -0.6991424560546875, -0.6693496704101562, -0.639556884765625, -0.6097640991210938, -0.5799713134765625, -0.5501785278320312, -0.5203857421875, -0.49059295654296875, -0.4608001708984375, -0.43100738525390625, -0.401214599609375, -0.37142181396484375, -0.3416290283203125, -0.31183624267578125, -0.28204345703125, -0.25225067138671875, -0.2224578857421875, -0.19266510009765625, -0.162872314453125, -0.13307952880859375, -0.1032867431640625, -0.07349395751953125, -0.043701171875, -0.01390838623046875, 0.0158843994140625, 0.04567718505859375, 0.075469970703125, 0.10526275634765625, 0.1350555419921875, 0.16484832763671875, 0.19464111328125, 0.22443389892578125, 0.2542266845703125, 0.28401947021484375, 0.313812255859375, 0.34360504150390625, 0.3733978271484375, 0.40319061279296875, 0.4329833984375, 0.46277618408203125, 0.4925689697265625, 0.5223617553710938, 0.552154541015625, 0.5819473266601562, 0.6117401123046875, 0.6415328979492188, 0.67132568359375, 0.7011184692382812, 0.7309112548828125, 0.7607040405273438, 0.790496826171875, 0.8202896118164062, 0.8500823974609375, 0.8798751831054688, 0.90966796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 3.0, 5.0, 7.0, 7.0, 4.0, 7.0, 15.0, 16.0, 18.0, 26.0, 24.0, 25.0, 35.0, 33.0, 35.0, 51.0, 42.0, 64.0, 55.0, 48.0, 44.0, 58.0, 43.0, 42.0, 40.0, 39.0, 37.0, 32.0, 31.0, 22.0, 17.0, 16.0, 8.0, 6.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.056060791015625, -0.0539708137512207, -0.051880836486816406, -0.04979085922241211, -0.04770088195800781, -0.045610904693603516, -0.04352092742919922, -0.04143095016479492, -0.039340972900390625, -0.03725099563598633, -0.03516101837158203, -0.033071041107177734, -0.030981063842773438, -0.02889108657836914, -0.026801109313964844, -0.024711132049560547, -0.02262115478515625, -0.020531177520751953, -0.018441200256347656, -0.01635122299194336, -0.014261245727539062, -0.012171268463134766, -0.010081291198730469, -0.007991313934326172, -0.005901336669921875, -0.003811359405517578, -0.0017213821411132812, 0.0003685951232910156, 0.0024585723876953125, 0.004548549652099609, 0.006638526916503906, 0.008728504180908203, 0.0108184814453125, 0.012908458709716797, 0.014998435974121094, 0.01708841323852539, 0.019178390502929688, 0.021268367767333984, 0.02335834503173828, 0.025448322296142578, 0.027538299560546875, 0.029628276824951172, 0.03171825408935547, 0.033808231353759766, 0.03589820861816406, 0.03798818588256836, 0.040078163146972656, 0.04216814041137695, 0.04425811767578125, 0.04634809494018555, 0.048438072204589844, 0.05052804946899414, 0.05261802673339844, 0.054708003997802734, 0.05679798126220703, 0.05888795852661133, 0.060977935791015625, 0.06306791305541992, 0.06515789031982422, 0.06724786758422852, 0.06933784484863281, 0.07142782211303711, 0.0735177993774414, 0.0756077766418457, 0.07769775390625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 5.0, 5.0, 10.0, 18.0, 27.0, 31.0, 32.0, 58.0, 90.0, 101.0, 137.0, 232.0, 456.0, 1691.0, 21549.0, 682703.0, 328091.0, 11005.0, 1172.0, 410.0, 228.0, 144.0, 102.0, 81.0, 39.0, 27.0, 23.0, 12.0, 18.0, 11.0, 7.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3215713500976562, -1.2847442626953125, -1.2479171752929688, -1.211090087890625, -1.1742630004882812, -1.1374359130859375, -1.1006088256835938, -1.06378173828125, -1.0269546508789062, -0.9901275634765625, -0.9533004760742188, -0.916473388671875, -0.8796463012695312, -0.8428192138671875, -0.8059921264648438, -0.7691650390625, -0.7323379516601562, -0.6955108642578125, -0.6586837768554688, -0.621856689453125, -0.5850296020507812, -0.5482025146484375, -0.5113754272460938, -0.47454833984375, -0.43772125244140625, -0.4008941650390625, -0.36406707763671875, -0.327239990234375, -0.29041290283203125, -0.2535858154296875, -0.21675872802734375, -0.179931640625, -0.14310455322265625, -0.1062774658203125, -0.06945037841796875, -0.032623291015625, 0.00420379638671875, 0.0410308837890625, 0.07785797119140625, 0.11468505859375, 0.15151214599609375, 0.1883392333984375, 0.22516632080078125, 0.261993408203125, 0.29882049560546875, 0.3356475830078125, 0.37247467041015625, 0.4093017578125, 0.44612884521484375, 0.4829559326171875, 0.5197830200195312, 0.556610107421875, 0.5934371948242188, 0.6302642822265625, 0.6670913696289062, 0.70391845703125, 0.7407455444335938, 0.7775726318359375, 0.8143997192382812, 0.851226806640625, 0.8880538940429688, 0.9248809814453125, 0.9617080688476562, 0.99853515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 23.0, 76.0, 229.0, 395.0, 187.0, 63.0, 23.0, 10.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3318135738372803, -2.2814669609069824, -2.2311201095581055, -2.1807734966278076, -2.1304268836975098, -2.080080032348633, -2.029733419418335, -1.979386806488037, -1.9290400743484497, -1.8786933422088623, -1.8283467292785645, -1.777999997138977, -1.7276533842086792, -1.6773066520690918, -1.626960039138794, -1.5766133069992065, -1.5262665748596191, -1.4759198427200317, -1.4255732297897339, -1.3752264976501465, -1.3248798847198486, -1.2745331525802612, -1.2241864204406738, -1.173839807510376, -1.1234931945800781, -1.0731464624404907, -1.0227998495101929, -0.9724531173706055, -0.9221064448356628, -0.8717597723007202, -0.8214130997657776, -0.771066427230835, -0.7207196354866028, -0.6703729629516602, -0.6200262904167175, -0.5696796178817749, -0.5193328857421875, -0.4689862132072449, -0.41863954067230225, -0.36829283833503723, -0.3179461658000946, -0.267599493265152, -0.21725279092788696, -0.16690611839294434, -0.11655943095684052, -0.0662127435207367, -0.015866070985794067, 0.03448063135147095, 0.08482730388641357, 0.1351739913225174, 0.18552067875862122, 0.23586735129356384, 0.28621405363082886, 0.3365607261657715, 0.3869073987007141, 0.4372541010379791, 0.48760077357292175, 0.5379474759101868, 0.5882941484451294, 0.638640820980072, 0.6889874935150146, 0.739334225654602, 0.7896808385848999, 0.8400275707244873, 0.8903742432594299]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 19.0, 11.0, 23.0, 27.0, 30.0, 28.0, 31.0, 35.0, 34.0, 43.0, 56.0, 52.0, 44.0, 50.0, 52.0, 55.0, 38.0, 48.0, 46.0, 37.0, 42.0, 35.0, 20.0, 18.0, 21.0, 15.0, 18.0, 9.0, 15.0, 4.0, 6.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.33830541372299194, -0.32950419187545776, -0.3207029700279236, -0.3119017481803894, -0.3031005263328552, -0.29429927468299866, -0.2854980528354645, -0.2766968309879303, -0.2678956091403961, -0.25909438729286194, -0.25029316544532776, -0.24149192869663239, -0.2326907068490982, -0.22388948500156403, -0.21508824825286865, -0.20628702640533447, -0.1974858045578003, -0.1886845827102661, -0.17988336086273193, -0.17108212411403656, -0.16228090226650238, -0.1534796804189682, -0.14467844367027283, -0.13587722182273865, -0.12707599997520447, -0.11827477812767029, -0.10947354882955551, -0.10067231953144073, -0.09187109768390656, -0.08306987583637238, -0.0742686465382576, -0.06546741724014282, -0.05666619539260864, -0.047864969819784164, -0.039063744246959686, -0.030262518674135208, -0.02146129310131073, -0.012660067528486252, -0.0038588419556617737, 0.0049423836171627045, 0.013743609189987183, 0.02254483476281166, 0.03134606033563614, 0.04014728590846062, 0.048948511481285095, 0.05774973705410957, 0.06655096262693405, 0.07535219192504883, 0.08415341377258301, 0.09295463562011719, 0.10175586491823196, 0.11055709421634674, 0.11935831606388092, 0.1281595379114151, 0.13696077466011047, 0.14576199650764465, 0.15456321835517883, 0.163364440202713, 0.1721656620502472, 0.18096689879894257, 0.18976812064647675, 0.19856934249401093, 0.2073705792427063, 0.21617180109024048, 0.22497302293777466]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 12.0, 13.0, 15.0, 20.0, 21.0, 24.0, 19.0, 33.0, 31.0, 29.0, 35.0, 38.0, 51.0, 56.0, 44.0, 60.0, 59.0, 55.0, 42.0, 44.0, 53.0, 33.0, 40.0, 34.0, 26.0, 21.0, 17.0, 13.0, 13.0, 8.0, 6.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1611328125, -1.123046875, -1.0849609375, -1.046875, -1.0087890625, -0.970703125, -0.9326171875, -0.89453125, -0.8564453125, -0.818359375, -0.7802734375, -0.7421875, -0.7041015625, -0.666015625, -0.6279296875, -0.58984375, -0.5517578125, -0.513671875, -0.4755859375, -0.4375, -0.3994140625, -0.361328125, -0.3232421875, -0.28515625, -0.2470703125, -0.208984375, -0.1708984375, -0.1328125, -0.0947265625, -0.056640625, -0.0185546875, 0.01953125, 0.0576171875, 0.095703125, 0.1337890625, 0.171875, 0.2099609375, 0.248046875, 0.2861328125, 0.32421875, 0.3623046875, 0.400390625, 0.4384765625, 0.4765625, 0.5146484375, 0.552734375, 0.5908203125, 0.62890625, 0.6669921875, 0.705078125, 0.7431640625, 0.78125, 0.8193359375, 0.857421875, 0.8955078125, 0.93359375, 0.9716796875, 1.009765625, 1.0478515625, 1.0859375, 1.1240234375, 1.162109375, 1.2001953125, 1.23828125, 1.2763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 7.0, 15.0, 11.0, 23.0, 36.0, 75.0, 81.0, 149.0, 257.0, 336.0, 533.0, 789.0, 1270.0, 2063.0, 3438.0, 6665.0, 13764.0, 38434.0, 145924.0, 544052.0, 206631.0, 49187.0, 17127.0, 7436.0, 4011.0, 2255.0, 1431.0, 910.0, 557.0, 371.0, 240.0, 199.0, 98.0, 72.0, 37.0, 35.0, 13.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9381103515625, -1.870361328125, -1.8026123046875, -1.73486328125, -1.6671142578125, -1.599365234375, -1.5316162109375, -1.4638671875, -1.3961181640625, -1.328369140625, -1.2606201171875, -1.19287109375, -1.1251220703125, -1.057373046875, -0.9896240234375, -0.921875, -0.8541259765625, -0.786376953125, -0.7186279296875, -0.65087890625, -0.5831298828125, -0.515380859375, -0.4476318359375, -0.3798828125, -0.3121337890625, -0.244384765625, -0.1766357421875, -0.10888671875, -0.0411376953125, 0.026611328125, 0.0943603515625, 0.162109375, 0.2298583984375, 0.297607421875, 0.3653564453125, 0.43310546875, 0.5008544921875, 0.568603515625, 0.6363525390625, 0.7041015625, 0.7718505859375, 0.839599609375, 0.9073486328125, 0.97509765625, 1.0428466796875, 1.110595703125, 1.1783447265625, 1.24609375, 1.3138427734375, 1.381591796875, 1.4493408203125, 1.51708984375, 1.5848388671875, 1.652587890625, 1.7203369140625, 1.7880859375, 1.8558349609375, 1.923583984375, 1.9913330078125, 2.05908203125, 2.1268310546875, 2.194580078125, 2.2623291015625, 2.330078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 14.0, 11.0, 20.0, 17.0, 18.0, 27.0, 31.0, 35.0, 31.0, 34.0, 46.0, 61.0, 85.0, 110.0, 228.0, 1395.0, 254.0, 138.0, 82.0, 63.0, 45.0, 61.0, 36.0, 29.0, 21.0, 28.0, 20.0, 11.0, 5.0, 8.0, 11.0, 8.0, 7.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.968414306640625, -3.84307861328125, -3.717742919921875, -3.5924072265625, -3.467071533203125, -3.34173583984375, -3.216400146484375, -3.091064453125, -2.965728759765625, -2.84039306640625, -2.715057373046875, -2.5897216796875, -2.464385986328125, -2.33905029296875, -2.213714599609375, -2.08837890625, -1.963043212890625, -1.83770751953125, -1.712371826171875, -1.5870361328125, -1.461700439453125, -1.33636474609375, -1.211029052734375, -1.085693359375, -0.960357666015625, -0.83502197265625, -0.709686279296875, -0.5843505859375, -0.459014892578125, -0.33367919921875, -0.208343505859375, -0.0830078125, 0.042327880859375, 0.16766357421875, 0.292999267578125, 0.4183349609375, 0.543670654296875, 0.66900634765625, 0.794342041015625, 0.919677734375, 1.045013427734375, 1.17034912109375, 1.295684814453125, 1.4210205078125, 1.546356201171875, 1.67169189453125, 1.797027587890625, 1.92236328125, 2.047698974609375, 2.17303466796875, 2.298370361328125, 2.4237060546875, 2.549041748046875, 2.67437744140625, 2.799713134765625, 2.925048828125, 3.050384521484375, 3.17572021484375, 3.301055908203125, 3.4263916015625, 3.551727294921875, 3.67706298828125, 3.802398681640625, 3.927734375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 3.0, 6.0, 18.0, 17.0, 29.0, 33.0, 41.0, 62.0, 116.0, 182.0, 315.0, 726.0, 2074.0, 8892.0, 76820.0, 2675627.0, 354657.0, 20077.0, 3756.0, 1084.0, 443.0, 262.0, 145.0, 81.0, 56.0, 40.0, 40.0, 24.0, 15.0, 12.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.02734375, -6.8057861328125, -6.584228515625, -6.3626708984375, -6.14111328125, -5.9195556640625, -5.697998046875, -5.4764404296875, -5.2548828125, -5.0333251953125, -4.811767578125, -4.5902099609375, -4.36865234375, -4.1470947265625, -3.925537109375, -3.7039794921875, -3.482421875, -3.2608642578125, -3.039306640625, -2.8177490234375, -2.59619140625, -2.3746337890625, -2.153076171875, -1.9315185546875, -1.7099609375, -1.4884033203125, -1.266845703125, -1.0452880859375, -0.82373046875, -0.6021728515625, -0.380615234375, -0.1590576171875, 0.0625, 0.2840576171875, 0.505615234375, 0.7271728515625, 0.94873046875, 1.1702880859375, 1.391845703125, 1.6134033203125, 1.8349609375, 2.0565185546875, 2.278076171875, 2.4996337890625, 2.72119140625, 2.9427490234375, 3.164306640625, 3.3858642578125, 3.607421875, 3.8289794921875, 4.050537109375, 4.2720947265625, 4.49365234375, 4.7152099609375, 4.936767578125, 5.1583251953125, 5.3798828125, 5.6014404296875, 5.822998046875, 6.0445556640625, 6.26611328125, 6.4876708984375, 6.709228515625, 6.9307861328125, 7.15234375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 57.0, 938.0, 23.0, 1.0], "bins": [-221.81622314453125, -218.2049560546875, -214.5937042236328, -210.98243713378906, -207.37118530273438, -203.75991821289062, -200.14865112304688, -196.5373992919922, -192.92613220214844, -189.3148651123047, -185.70361328125, -182.09234619140625, -178.48109436035156, -174.8698272705078, -171.25857543945312, -167.64730834960938, -164.03604125976562, -160.42477416992188, -156.8135223388672, -153.20225524902344, -149.59100341796875, -145.979736328125, -142.36846923828125, -138.75721740722656, -135.14596557617188, -131.53469848632812, -127.92344665527344, -124.31217956542969, -120.70092010498047, -117.08966064453125, -113.47840118408203, -109.86714172363281, -106.25587463378906, -102.64461517333984, -99.03335571289062, -95.42208862304688, -91.81082916259766, -88.19956970214844, -84.58831024169922, -80.97705078125, -77.36578369140625, -73.75452423095703, -70.14326477050781, -66.53199768066406, -62.920738220214844, -59.309478759765625, -55.698219299316406, -52.08695983886719, -48.47570037841797, -44.86444091796875, -41.253177642822266, -37.64191818237305, -34.03065490722656, -30.419395446777344, -26.808135986328125, -23.196874618530273, -19.585613250732422, -15.97435188293457, -12.363091468811035, -8.7518310546875, -5.140569686889648, -1.5293083190917969, 2.081951141357422, 5.693212509155273, 9.304474830627441]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 16.0, 17.0, 15.0, 13.0, 15.0, 28.0, 35.0, 31.0, 35.0, 38.0, 34.0, 47.0, 51.0, 44.0, 42.0, 28.0, 56.0, 47.0, 40.0, 34.0, 43.0, 40.0, 39.0, 24.0, 20.0, 29.0, 12.0, 18.0, 19.0, 15.0, 16.0, 13.0, 5.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.436010360717773, -13.035432815551758, -12.634855270385742, -12.234277725219727, -11.833700180053711, -11.433122634887695, -11.032544136047363, -10.631966590881348, -10.231389045715332, -9.830811500549316, -9.4302339553833, -9.029656410217285, -8.629077911376953, -8.228500366210938, -7.827922821044922, -7.427345275878906, -7.026767730712891, -6.626190185546875, -6.225612640380859, -5.8250346183776855, -5.42445707321167, -5.023879528045654, -4.6233015060424805, -4.222723960876465, -3.822146415710449, -3.4215688705444336, -3.020991086959839, -2.620413303375244, -2.2198357582092285, -1.819258213043213, -1.4186804294586182, -1.0181026458740234, -0.6175241470336914, -0.21694648265838623, 0.18363118171691895, 0.5842088460922241, 0.9847865104675293, 1.385364055633545, 1.7859418392181396, 2.1865196228027344, 2.58709716796875, 2.9876747131347656, 3.3882524967193604, 3.788830280303955, 4.189407825469971, 4.589985370635986, 4.99056339263916, 5.391140937805176, 5.791718482971191, 6.192296028137207, 6.592873573303223, 6.9934515953063965, 7.394029140472412, 7.794606685638428, 8.195184707641602, 8.595762252807617, 8.996339797973633, 9.396917343139648, 9.797494888305664, 10.19807243347168, 10.598649978637695, 10.999227523803711, 11.399806022644043, 11.800383567810059, 12.200961112976074]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 8.0, 9.0, 13.0, 12.0, 22.0, 27.0, 23.0, 27.0, 35.0, 31.0, 40.0, 32.0, 44.0, 48.0, 55.0, 47.0, 54.0, 47.0, 50.0, 49.0, 62.0, 49.0, 42.0, 30.0, 22.0, 23.0, 13.0, 21.0, 14.0, 8.0, 7.0, 9.0, 9.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1169586181640625, -1.075714111328125, -1.0344696044921875, -0.99322509765625, -0.9519805908203125, -0.910736083984375, -0.8694915771484375, -0.8282470703125, -0.7870025634765625, -0.745758056640625, -0.7045135498046875, -0.66326904296875, -0.6220245361328125, -0.580780029296875, -0.5395355224609375, -0.498291015625, -0.4570465087890625, -0.415802001953125, -0.3745574951171875, -0.33331298828125, -0.2920684814453125, -0.250823974609375, -0.2095794677734375, -0.1683349609375, -0.1270904541015625, -0.085845947265625, -0.0446014404296875, -0.00335693359375, 0.0378875732421875, 0.079132080078125, 0.1203765869140625, 0.16162109375, 0.2028656005859375, 0.244110107421875, 0.2853546142578125, 0.32659912109375, 0.3678436279296875, 0.409088134765625, 0.4503326416015625, 0.4915771484375, 0.5328216552734375, 0.574066162109375, 0.6153106689453125, 0.65655517578125, 0.6977996826171875, 0.739044189453125, 0.7802886962890625, 0.821533203125, 0.8627777099609375, 0.904022216796875, 0.9452667236328125, 0.98651123046875, 1.0277557373046875, 1.069000244140625, 1.1102447509765625, 1.1514892578125, 1.1927337646484375, 1.233978271484375, 1.2752227783203125, 1.31646728515625, 1.3577117919921875, 1.398956298828125, 1.4402008056640625, 1.4814453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 10.0, 9.0, 17.0, 27.0, 44.0, 80.0, 94.0, 166.0, 263.0, 421.0, 696.0, 1177.0, 2244.0, 4264.0, 8469.0, 19071.0, 53053.0, 249714.0, 2112948.0, 1506478.0, 162759.0, 40793.0, 15765.0, 7329.0, 3719.0, 1986.0, 1048.0, 644.0, 364.0, 229.0, 145.0, 86.0, 45.0, 37.0, 18.0, 17.0, 11.0, 7.0, 7.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.589996337890625, -2.50616455078125, -2.422332763671875, -2.3385009765625, -2.254669189453125, -2.17083740234375, -2.087005615234375, -2.003173828125, -1.919342041015625, -1.83551025390625, -1.751678466796875, -1.6678466796875, -1.584014892578125, -1.50018310546875, -1.416351318359375, -1.33251953125, -1.248687744140625, -1.16485595703125, -1.081024169921875, -0.9971923828125, -0.913360595703125, -0.82952880859375, -0.745697021484375, -0.661865234375, -0.578033447265625, -0.49420166015625, -0.410369873046875, -0.3265380859375, -0.242706298828125, -0.15887451171875, -0.075042724609375, 0.0087890625, 0.092620849609375, 0.17645263671875, 0.260284423828125, 0.3441162109375, 0.427947998046875, 0.51177978515625, 0.595611572265625, 0.679443359375, 0.763275146484375, 0.84710693359375, 0.930938720703125, 1.0147705078125, 1.098602294921875, 1.18243408203125, 1.266265869140625, 1.35009765625, 1.433929443359375, 1.51776123046875, 1.601593017578125, 1.6854248046875, 1.769256591796875, 1.85308837890625, 1.936920166015625, 2.020751953125, 2.104583740234375, 2.18841552734375, 2.272247314453125, 2.3560791015625, 2.439910888671875, 2.52374267578125, 2.607574462890625, 2.69140625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 16.0, 9.0, 20.0, 19.0, 26.0, 48.0, 69.0, 73.0, 100.0, 161.0, 279.0, 399.0, 610.0, 656.0, 539.0, 360.0, 231.0, 140.0, 83.0, 68.0, 51.0, 30.0, 23.0, 12.0, 17.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.174713134765625, -3.07012939453125, -2.965545654296875, -2.8609619140625, -2.756378173828125, -2.65179443359375, -2.547210693359375, -2.442626953125, -2.338043212890625, -2.23345947265625, -2.128875732421875, -2.0242919921875, -1.919708251953125, -1.81512451171875, -1.710540771484375, -1.60595703125, -1.501373291015625, -1.39678955078125, -1.292205810546875, -1.1876220703125, -1.083038330078125, -0.97845458984375, -0.873870849609375, -0.769287109375, -0.664703369140625, -0.56011962890625, -0.455535888671875, -0.3509521484375, -0.246368408203125, -0.14178466796875, -0.037200927734375, 0.0673828125, 0.171966552734375, 0.27655029296875, 0.381134033203125, 0.4857177734375, 0.590301513671875, 0.69488525390625, 0.799468994140625, 0.904052734375, 1.008636474609375, 1.11322021484375, 1.217803955078125, 1.3223876953125, 1.426971435546875, 1.53155517578125, 1.636138916015625, 1.74072265625, 1.845306396484375, 1.94989013671875, 2.054473876953125, 2.1590576171875, 2.263641357421875, 2.36822509765625, 2.472808837890625, 2.577392578125, 2.681976318359375, 2.78656005859375, 2.891143798828125, 2.9957275390625, 3.100311279296875, 3.20489501953125, 3.309478759765625, 3.4140625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 8.0, 10.0, 4.0, 5.0, 10.0, 19.0, 26.0, 38.0, 55.0, 94.0, 143.0, 198.0, 365.0, 615.0, 1099.0, 2136.0, 4358.0, 9587.0, 23335.0, 64683.0, 243754.0, 1746819.0, 1746482.0, 243759.0, 64905.0, 23245.0, 9475.0, 4248.0, 2116.0, 1075.0, 641.0, 337.0, 227.0, 141.0, 90.0, 50.0, 39.0, 21.0, 17.0, 11.0, 11.0, 6.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.751953125, -3.63470458984375, -3.5174560546875, -3.40020751953125, -3.282958984375, -3.16571044921875, -3.0484619140625, -2.93121337890625, -2.81396484375, -2.69671630859375, -2.5794677734375, -2.46221923828125, -2.344970703125, -2.22772216796875, -2.1104736328125, -1.99322509765625, -1.8759765625, -1.75872802734375, -1.6414794921875, -1.52423095703125, -1.406982421875, -1.28973388671875, -1.1724853515625, -1.05523681640625, -0.93798828125, -0.82073974609375, -0.7034912109375, -0.58624267578125, -0.468994140625, -0.35174560546875, -0.2344970703125, -0.11724853515625, 0.0, 0.11724853515625, 0.2344970703125, 0.35174560546875, 0.468994140625, 0.58624267578125, 0.7034912109375, 0.82073974609375, 0.93798828125, 1.05523681640625, 1.1724853515625, 1.28973388671875, 1.406982421875, 1.52423095703125, 1.6414794921875, 1.75872802734375, 1.8759765625, 1.99322509765625, 2.1104736328125, 2.22772216796875, 2.344970703125, 2.46221923828125, 2.5794677734375, 2.69671630859375, 2.81396484375, 2.93121337890625, 3.0484619140625, 3.16571044921875, 3.282958984375, 3.40020751953125, 3.5174560546875, 3.63470458984375, 3.751953125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 27.0, 43.0, 83.0, 123.0, 203.0, 220.0, 157.0, 85.0, 36.0, 14.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3842716217041, -24.446584701538086, -23.508895874023438, -22.571208953857422, -21.633522033691406, -20.69583511352539, -19.758148193359375, -18.820459365844727, -17.88277244567871, -16.945085525512695, -16.007396697998047, -15.069709777832031, -14.132022857666016, -13.1943359375, -12.256648063659668, -11.318960189819336, -10.38127326965332, -9.443586349487305, -8.505898475646973, -7.568211078643799, -6.630523681640625, -5.692836284637451, -4.755148887634277, -3.8174614906311035, -2.8797740936279297, -1.9420866966247559, -1.004399299621582, -0.0667119026184082, 0.8709754943847656, 1.8086628913879395, 2.7463502883911133, 3.684037685394287, 4.621726989746094, 5.559414386749268, 6.497101783752441, 7.434789180755615, 8.372476577758789, 9.310163497924805, 10.247851371765137, 11.185539245605469, 12.123226165771484, 13.0609130859375, 13.998600959777832, 14.936288833618164, 15.87397575378418, 16.811662673950195, 17.749351501464844, 18.68703842163086, 19.624725341796875, 20.56241226196289, 21.500099182128906, 22.437788009643555, 23.37547492980957, 24.313161849975586, 25.250850677490234, 26.18853759765625, 27.126224517822266, 28.06391143798828, 29.001598358154297, 29.939287185668945, 30.87697410583496, 31.814661026000977, 32.752349853515625, 33.69003677368164, 34.627723693847656]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 13.0, 12.0, 7.0, 18.0, 15.0, 27.0, 17.0, 24.0, 21.0, 29.0, 24.0, 33.0, 35.0, 37.0, 38.0, 39.0, 32.0, 43.0, 32.0, 42.0, 31.0, 39.0, 41.0, 30.0, 28.0, 32.0, 34.0, 22.0, 24.0, 26.0, 18.0, 20.0, 12.0, 18.0, 9.0, 16.0, 3.0, 8.0, 7.0, 5.0, 4.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.944015026092529, -7.674643039703369, -7.405271053314209, -7.135899066925049, -6.866527080535889, -6.5971550941467285, -6.327783107757568, -6.058411121368408, -5.789039134979248, -5.519667148590088, -5.250295162200928, -4.980923175811768, -4.711551189422607, -4.442179203033447, -4.172807216644287, -3.903435230255127, -3.634063243865967, -3.3646912574768066, -3.0953192710876465, -2.8259472846984863, -2.556575298309326, -2.287203311920166, -2.017831325531006, -1.7484593391418457, -1.4790873527526855, -1.2097153663635254, -0.9403433799743652, -0.6709713935852051, -0.4015994071960449, -0.13222742080688477, 0.1371445655822754, 0.40651655197143555, 0.6758880615234375, 0.9452600479125977, 1.2146320343017578, 1.484004020690918, 1.7533760070800781, 2.0227479934692383, 2.2921199798583984, 2.5614919662475586, 2.8308639526367188, 3.100235939025879, 3.369607925415039, 3.638979911804199, 3.9083518981933594, 4.1777238845825195, 4.44709587097168, 4.71646785736084, 4.98583984375, 5.25521183013916, 5.52458381652832, 5.7939558029174805, 6.063327789306641, 6.332699775695801, 6.602071762084961, 6.871443748474121, 7.140815734863281, 7.410187721252441, 7.679559707641602, 7.948931694030762, 8.218303680419922, 8.487675666809082, 8.757047653198242, 9.026419639587402, 9.295791625976562]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 4.0, 9.0, 8.0, 7.0, 6.0, 9.0, 17.0, 26.0, 22.0, 22.0, 23.0, 33.0, 39.0, 39.0, 46.0, 42.0, 52.0, 51.0, 68.0, 52.0, 57.0, 48.0, 45.0, 35.0, 35.0, 30.0, 30.0, 27.0, 28.0, 23.0, 17.0, 9.0, 8.0, 7.0, 7.0, 12.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3330078125, -1.2921142578125, -1.251220703125, -1.2103271484375, -1.16943359375, -1.1285400390625, -1.087646484375, -1.0467529296875, -1.005859375, -0.9649658203125, -0.924072265625, -0.8831787109375, -0.84228515625, -0.8013916015625, -0.760498046875, -0.7196044921875, -0.6787109375, -0.6378173828125, -0.596923828125, -0.5560302734375, -0.51513671875, -0.4742431640625, -0.433349609375, -0.3924560546875, -0.3515625, -0.3106689453125, -0.269775390625, -0.2288818359375, -0.18798828125, -0.1470947265625, -0.106201171875, -0.0653076171875, -0.0244140625, 0.0164794921875, 0.057373046875, 0.0982666015625, 0.13916015625, 0.1800537109375, 0.220947265625, 0.2618408203125, 0.302734375, 0.3436279296875, 0.384521484375, 0.4254150390625, 0.46630859375, 0.5072021484375, 0.548095703125, 0.5889892578125, 0.6298828125, 0.6707763671875, 0.711669921875, 0.7525634765625, 0.79345703125, 0.8343505859375, 0.875244140625, 0.9161376953125, 0.95703125, 0.9979248046875, 1.038818359375, 1.0797119140625, 1.12060546875, 1.1614990234375, 1.202392578125, 1.2432861328125, 1.2841796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 9.0, 13.0, 19.0, 24.0, 66.0, 77.0, 100.0, 179.0, 277.0, 405.0, 664.0, 1006.0, 1648.0, 2646.0, 4369.0, 7140.0, 11869.0, 19718.0, 32518.0, 51973.0, 79943.0, 114080.0, 142926.0, 153150.0, 134617.0, 103150.0, 70423.0, 44803.0, 27524.0, 16989.0, 10154.0, 6145.0, 3798.0, 2268.0, 1447.0, 855.0, 526.0, 377.0, 240.0, 153.0, 84.0, 58.0, 46.0, 23.0, 26.0, 8.0, 11.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7539596557617188, -0.7291107177734375, -0.7042617797851562, -0.679412841796875, -0.6545639038085938, -0.6297149658203125, -0.6048660278320312, -0.58001708984375, -0.5551681518554688, -0.5303192138671875, -0.5054702758789062, -0.480621337890625, -0.45577239990234375, -0.4309234619140625, -0.40607452392578125, -0.3812255859375, -0.35637664794921875, -0.3315277099609375, -0.30667877197265625, -0.281829833984375, -0.25698089599609375, -0.2321319580078125, -0.20728302001953125, -0.18243408203125, -0.15758514404296875, -0.1327362060546875, -0.10788726806640625, -0.083038330078125, -0.05818939208984375, -0.0333404541015625, -0.00849151611328125, 0.016357421875, 0.04120635986328125, 0.0660552978515625, 0.09090423583984375, 0.115753173828125, 0.14060211181640625, 0.1654510498046875, 0.19029998779296875, 0.21514892578125, 0.23999786376953125, 0.2648468017578125, 0.28969573974609375, 0.314544677734375, 0.33939361572265625, 0.3642425537109375, 0.38909149169921875, 0.4139404296875, 0.43878936767578125, 0.4636383056640625, 0.48848724365234375, 0.513336181640625, 0.5381851196289062, 0.5630340576171875, 0.5878829956054688, 0.61273193359375, 0.6375808715820312, 0.6624298095703125, 0.6872787475585938, 0.712127685546875, 0.7369766235351562, 0.7618255615234375, 0.7866744995117188, 0.8115234375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 12.0, 3.0, 6.0, 9.0, 9.0, 14.0, 21.0, 17.0, 19.0, 27.0, 31.0, 39.0, 38.0, 38.0, 49.0, 42.0, 41.0, 42.0, 1070.0, 40.0, 48.0, 44.0, 41.0, 43.0, 36.0, 44.0, 31.0, 30.0, 22.0, 19.0, 18.0, 18.0, 14.0, 19.0, 6.0, 13.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2398223876953125, -1.199371337890625, -1.1589202880859375, -1.11846923828125, -1.0780181884765625, -1.037567138671875, -0.9971160888671875, -0.9566650390625, -0.9162139892578125, -0.875762939453125, -0.8353118896484375, -0.79486083984375, -0.7544097900390625, -0.713958740234375, -0.6735076904296875, -0.633056640625, -0.5926055908203125, -0.552154541015625, -0.5117034912109375, -0.47125244140625, -0.4308013916015625, -0.390350341796875, -0.3498992919921875, -0.3094482421875, -0.2689971923828125, -0.228546142578125, -0.1880950927734375, -0.14764404296875, -0.1071929931640625, -0.066741943359375, -0.0262908935546875, 0.01416015625, 0.0546112060546875, 0.095062255859375, 0.1355133056640625, 0.17596435546875, 0.2164154052734375, 0.256866455078125, 0.2973175048828125, 0.3377685546875, 0.3782196044921875, 0.418670654296875, 0.4591217041015625, 0.49957275390625, 0.5400238037109375, 0.580474853515625, 0.6209259033203125, 0.661376953125, 0.7018280029296875, 0.742279052734375, 0.7827301025390625, 0.82318115234375, 0.8636322021484375, 0.904083251953125, 0.9445343017578125, 0.9849853515625, 1.0254364013671875, 1.065887451171875, 1.1063385009765625, 1.14678955078125, 1.1872406005859375, 1.227691650390625, 1.2681427001953125, 1.30859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 14.0, 17.0, 17.0, 39.0, 61.0, 84.0, 114.0, 175.0, 221.0, 361.0, 519.0, 845.0, 1208.0, 1868.0, 2752.0, 4387.0, 6774.0, 10654.0, 17978.0, 34997.0, 133542.0, 1558892.0, 223651.0, 43912.0, 20384.0, 11874.0, 7635.0, 4814.0, 3184.0, 2051.0, 1372.0, 896.0, 620.0, 372.0, 262.0, 162.0, 127.0, 88.0, 58.0, 53.0, 29.0, 23.0, 14.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0363006591796875, -1.001312255859375, -0.9663238525390625, -0.93133544921875, -0.8963470458984375, -0.861358642578125, -0.8263702392578125, -0.7913818359375, -0.7563934326171875, -0.721405029296875, -0.6864166259765625, -0.65142822265625, -0.6164398193359375, -0.581451416015625, -0.5464630126953125, -0.511474609375, -0.4764862060546875, -0.441497802734375, -0.4065093994140625, -0.37152099609375, -0.3365325927734375, -0.301544189453125, -0.2665557861328125, -0.2315673828125, -0.1965789794921875, -0.161590576171875, -0.1266021728515625, -0.09161376953125, -0.0566253662109375, -0.021636962890625, 0.0133514404296875, 0.04833984375, 0.0833282470703125, 0.118316650390625, 0.1533050537109375, 0.18829345703125, 0.2232818603515625, 0.258270263671875, 0.2932586669921875, 0.3282470703125, 0.3632354736328125, 0.398223876953125, 0.4332122802734375, 0.46820068359375, 0.5031890869140625, 0.538177490234375, 0.5731658935546875, 0.608154296875, 0.6431427001953125, 0.678131103515625, 0.7131195068359375, 0.74810791015625, 0.7830963134765625, 0.818084716796875, 0.8530731201171875, 0.8880615234375, 0.9230499267578125, 0.958038330078125, 0.9930267333984375, 1.02801513671875, 1.0630035400390625, 1.097991943359375, 1.1329803466796875, 1.16796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 3.0, 12.0, 13.0, 15.0, 21.0, 14.0, 23.0, 31.0, 26.0, 30.0, 45.0, 58.0, 62.0, 69.0, 52.0, 58.0, 64.0, 61.0, 47.0, 45.0, 48.0, 30.0, 21.0, 32.0, 23.0, 15.0, 11.0, 18.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10654544830322266, -0.10243415832519531, -0.09832286834716797, -0.09421157836914062, -0.09010028839111328, -0.08598899841308594, -0.0818777084350586, -0.07776641845703125, -0.0736551284790039, -0.06954383850097656, -0.06543254852294922, -0.061321258544921875, -0.05720996856689453, -0.05309867858886719, -0.048987388610839844, -0.0448760986328125, -0.040764808654785156, -0.03665351867675781, -0.03254222869873047, -0.028430938720703125, -0.02431964874267578, -0.020208358764648438, -0.016097068786621094, -0.01198577880859375, -0.007874488830566406, -0.0037631988525390625, 0.00034809112548828125, 0.004459381103515625, 0.008570671081542969, 0.012681961059570312, 0.016793251037597656, 0.020904541015625, 0.025015830993652344, 0.029127120971679688, 0.03323841094970703, 0.037349700927734375, 0.04146099090576172, 0.04557228088378906, 0.049683570861816406, 0.05379486083984375, 0.057906150817871094, 0.06201744079589844, 0.06612873077392578, 0.07024002075195312, 0.07435131072998047, 0.07846260070800781, 0.08257389068603516, 0.0866851806640625, 0.09079647064208984, 0.09490776062011719, 0.09901905059814453, 0.10313034057617188, 0.10724163055419922, 0.11135292053222656, 0.1154642105102539, 0.11957550048828125, 0.1236867904663086, 0.12779808044433594, 0.13190937042236328, 0.13602066040039062, 0.14013195037841797, 0.1442432403564453, 0.14835453033447266, 0.1524658203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 9.0, 14.0, 7.0, 21.0, 22.0, 28.0, 43.0, 64.0, 94.0, 163.0, 340.0, 1043.0, 6582.0, 81715.0, 878114.0, 72385.0, 6079.0, 984.0, 333.0, 163.0, 104.0, 56.0, 47.0, 38.0, 26.0, 14.0, 21.0, 5.0, 9.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.42144775390625, -2.3585205078125, -2.29559326171875, -2.232666015625, -2.16973876953125, -2.1068115234375, -2.04388427734375, -1.98095703125, -1.91802978515625, -1.8551025390625, -1.79217529296875, -1.729248046875, -1.66632080078125, -1.6033935546875, -1.54046630859375, -1.4775390625, -1.41461181640625, -1.3516845703125, -1.28875732421875, -1.225830078125, -1.16290283203125, -1.0999755859375, -1.03704833984375, -0.97412109375, -0.91119384765625, -0.8482666015625, -0.78533935546875, -0.722412109375, -0.65948486328125, -0.5965576171875, -0.53363037109375, -0.470703125, -0.40777587890625, -0.3448486328125, -0.28192138671875, -0.218994140625, -0.15606689453125, -0.0931396484375, -0.03021240234375, 0.03271484375, 0.09564208984375, 0.1585693359375, 0.22149658203125, 0.284423828125, 0.34735107421875, 0.4102783203125, 0.47320556640625, 0.5361328125, 0.59906005859375, 0.6619873046875, 0.72491455078125, 0.787841796875, 0.85076904296875, 0.9136962890625, 0.97662353515625, 1.03955078125, 1.10247802734375, 1.1654052734375, 1.22833251953125, 1.291259765625, 1.35418701171875, 1.4171142578125, 1.48004150390625, 1.54296875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 14.0, 33.0, 95.0, 191.0, 301.0, 200.0, 89.0, 40.0, 17.0, 11.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8741536140441895, -2.807976007461548, -2.7417984008789062, -2.6756210327148438, -2.609443426132202, -2.5432658195495605, -2.477088212966919, -2.4109106063842773, -2.344733238220215, -2.2785556316375732, -2.2123780250549316, -2.146200656890869, -2.0800230503082275, -2.013845443725586, -1.9476678371429443, -1.8814902305603027, -1.8153126239776611, -1.7491350173950195, -1.6829575300216675, -1.6167799234390259, -1.5506024360656738, -1.4844248294830322, -1.4182472229003906, -1.352069616317749, -1.285892128944397, -1.2197145223617554, -1.1535370349884033, -1.0873594284057617, -1.0211818218231201, -0.9550043344497681, -0.8888267278671265, -0.8226491808891296, -0.7564716339111328, -0.690294086933136, -0.6241165399551392, -0.5579389333724976, -0.49176138639450073, -0.4255838394165039, -0.3594062626361847, -0.2932286858558655, -0.22705113887786865, -0.16087357699871063, -0.09469601511955261, -0.028518453240394592, 0.03765910863876343, 0.10383665561676025, 0.17001423239707947, 0.23619180917739868, 0.3023693561553955, 0.36854690313339233, 0.43472447991371155, 0.5009020566940308, 0.5670796036720276, 0.6332571506500244, 0.699434757232666, 0.7656123042106628, 0.8317898511886597, 0.8979673981666565, 0.9641449451446533, 1.030322551727295, 1.0965001583099365, 1.1626776456832886, 1.2288552522659302, 1.2950327396392822, 1.3612103462219238]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 12.0, 14.0, 6.0, 10.0, 17.0, 23.0, 37.0, 40.0, 32.0, 28.0, 39.0, 28.0, 51.0, 45.0, 61.0, 45.0, 53.0, 53.0, 50.0, 40.0, 43.0, 40.0, 39.0, 30.0, 25.0, 25.0, 28.0, 21.0, 11.0, 17.0, 7.0, 6.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.500812292098999, -0.4838857054710388, -0.4669591188430786, -0.4500325322151184, -0.4331059455871582, -0.416179358959198, -0.3992527723312378, -0.3823261857032776, -0.3653995990753174, -0.3484730124473572, -0.331546425819397, -0.31461983919143677, -0.29769325256347656, -0.28076666593551636, -0.26384007930755615, -0.24691349267959595, -0.22998690605163574, -0.21306031942367554, -0.19613373279571533, -0.17920714616775513, -0.16228055953979492, -0.14535397291183472, -0.1284273862838745, -0.1115007996559143, -0.0945742130279541, -0.0776476263999939, -0.06072103977203369, -0.043794453144073486, -0.02686786651611328, -0.009941279888153076, 0.006985306739807129, 0.023911893367767334, 0.04083847999572754, 0.057765066623687744, 0.07469165325164795, 0.09161823987960815, 0.10854482650756836, 0.12547141313552856, 0.14239799976348877, 0.15932458639144897, 0.17625117301940918, 0.19317775964736938, 0.2101043462753296, 0.2270309329032898, 0.24395751953125, 0.2608841061592102, 0.2778106927871704, 0.2947372794151306, 0.3116638660430908, 0.328590452671051, 0.34551703929901123, 0.36244362592697144, 0.37937021255493164, 0.39629679918289185, 0.41322338581085205, 0.43014997243881226, 0.44707655906677246, 0.46400314569473267, 0.48092973232269287, 0.4978563189506531, 0.5147829055786133, 0.5317094922065735, 0.5486360788345337, 0.5655626654624939, 0.5824892520904541]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 5.0, 6.0, 13.0, 12.0, 19.0, 29.0, 35.0, 36.0, 34.0, 45.0, 46.0, 40.0, 56.0, 64.0, 64.0, 63.0, 55.0, 54.0, 46.0, 45.0, 41.0, 31.0, 29.0, 27.0, 23.0, 17.0, 23.0, 9.0, 10.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.533203125, -1.4862213134765625, -1.439239501953125, -1.3922576904296875, -1.34527587890625, -1.2982940673828125, -1.251312255859375, -1.2043304443359375, -1.1573486328125, -1.1103668212890625, -1.063385009765625, -1.0164031982421875, -0.96942138671875, -0.9224395751953125, -0.875457763671875, -0.8284759521484375, -0.781494140625, -0.7345123291015625, -0.687530517578125, -0.6405487060546875, -0.59356689453125, -0.5465850830078125, -0.499603271484375, -0.4526214599609375, -0.4056396484375, -0.3586578369140625, -0.311676025390625, -0.2646942138671875, -0.21771240234375, -0.1707305908203125, -0.123748779296875, -0.0767669677734375, -0.02978515625, 0.0171966552734375, 0.064178466796875, 0.1111602783203125, 0.15814208984375, 0.2051239013671875, 0.252105712890625, 0.2990875244140625, 0.3460693359375, 0.3930511474609375, 0.440032958984375, 0.4870147705078125, 0.53399658203125, 0.5809783935546875, 0.627960205078125, 0.6749420166015625, 0.721923828125, 0.7689056396484375, 0.815887451171875, 0.8628692626953125, 0.90985107421875, 0.9568328857421875, 1.003814697265625, 1.0507965087890625, 1.0977783203125, 1.1447601318359375, 1.191741943359375, 1.2387237548828125, 1.28570556640625, 1.3326873779296875, 1.379669189453125, 1.4266510009765625, 1.4736328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 14.0, 27.0, 39.0, 69.0, 99.0, 189.0, 310.0, 505.0, 906.0, 1630.0, 2959.0, 5679.0, 11486.0, 26618.0, 79182.0, 394857.0, 393615.0, 79777.0, 26389.0, 11675.0, 5681.0, 2946.0, 1686.0, 957.0, 522.0, 297.0, 163.0, 99.0, 62.0, 29.0, 22.0, 19.0, 14.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51171875, -2.4332275390625, -2.354736328125, -2.2762451171875, -2.19775390625, -2.1192626953125, -2.040771484375, -1.9622802734375, -1.8837890625, -1.8052978515625, -1.726806640625, -1.6483154296875, -1.56982421875, -1.4913330078125, -1.412841796875, -1.3343505859375, -1.255859375, -1.1773681640625, -1.098876953125, -1.0203857421875, -0.94189453125, -0.8634033203125, -0.784912109375, -0.7064208984375, -0.6279296875, -0.5494384765625, -0.470947265625, -0.3924560546875, -0.31396484375, -0.2354736328125, -0.156982421875, -0.0784912109375, 0.0, 0.0784912109375, 0.156982421875, 0.2354736328125, 0.31396484375, 0.3924560546875, 0.470947265625, 0.5494384765625, 0.6279296875, 0.7064208984375, 0.784912109375, 0.8634033203125, 0.94189453125, 1.0203857421875, 1.098876953125, 1.1773681640625, 1.255859375, 1.3343505859375, 1.412841796875, 1.4913330078125, 1.56982421875, 1.6483154296875, 1.726806640625, 1.8052978515625, 1.8837890625, 1.9622802734375, 2.040771484375, 2.1192626953125, 2.19775390625, 2.2762451171875, 2.354736328125, 2.4332275390625, 2.51171875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 10.0, 3.0, 8.0, 7.0, 9.0, 7.0, 13.0, 25.0, 31.0, 33.0, 26.0, 48.0, 55.0, 50.0, 79.0, 95.0, 169.0, 378.0, 1378.0, 143.0, 100.0, 81.0, 46.0, 54.0, 50.0, 28.0, 22.0, 27.0, 16.0, 16.0, 8.0, 11.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.57293701171875, -4.4036865234375, -4.23443603515625, -4.065185546875, -3.89593505859375, -3.7266845703125, -3.55743408203125, -3.38818359375, -3.21893310546875, -3.0496826171875, -2.88043212890625, -2.711181640625, -2.54193115234375, -2.3726806640625, -2.20343017578125, -2.0341796875, -1.86492919921875, -1.6956787109375, -1.52642822265625, -1.357177734375, -1.18792724609375, -1.0186767578125, -0.84942626953125, -0.68017578125, -0.51092529296875, -0.3416748046875, -0.17242431640625, -0.003173828125, 0.16607666015625, 0.3353271484375, 0.50457763671875, 0.673828125, 0.84307861328125, 1.0123291015625, 1.18157958984375, 1.350830078125, 1.52008056640625, 1.6893310546875, 1.85858154296875, 2.02783203125, 2.19708251953125, 2.3663330078125, 2.53558349609375, 2.704833984375, 2.87408447265625, 3.0433349609375, 3.21258544921875, 3.3818359375, 3.55108642578125, 3.7203369140625, 3.88958740234375, 4.058837890625, 4.22808837890625, 4.3973388671875, 4.56658935546875, 4.73583984375, 4.90509033203125, 5.0743408203125, 5.24359130859375, 5.412841796875, 5.58209228515625, 5.7513427734375, 5.92059326171875, 6.08984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 7.0, 11.0, 12.0, 17.0, 16.0, 32.0, 48.0, 55.0, 90.0, 156.0, 288.0, 553.0, 1544.0, 7326.0, 73949.0, 2789426.0, 252390.0, 15464.0, 2631.0, 761.0, 336.0, 205.0, 123.0, 78.0, 48.0, 36.0, 25.0, 15.0, 11.0, 17.0, 11.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.6273193359375, -9.332763671875, -9.0382080078125, -8.74365234375, -8.4490966796875, -8.154541015625, -7.8599853515625, -7.5654296875, -7.2708740234375, -6.976318359375, -6.6817626953125, -6.38720703125, -6.0926513671875, -5.798095703125, -5.5035400390625, -5.208984375, -4.9144287109375, -4.619873046875, -4.3253173828125, -4.03076171875, -3.7362060546875, -3.441650390625, -3.1470947265625, -2.8525390625, -2.5579833984375, -2.263427734375, -1.9688720703125, -1.67431640625, -1.3797607421875, -1.085205078125, -0.7906494140625, -0.49609375, -0.2015380859375, 0.093017578125, 0.3875732421875, 0.68212890625, 0.9766845703125, 1.271240234375, 1.5657958984375, 1.8603515625, 2.1549072265625, 2.449462890625, 2.7440185546875, 3.03857421875, 3.3331298828125, 3.627685546875, 3.9222412109375, 4.216796875, 4.5113525390625, 4.805908203125, 5.1004638671875, 5.39501953125, 5.6895751953125, 5.984130859375, 6.2786865234375, 6.5732421875, 6.8677978515625, 7.162353515625, 7.4569091796875, 7.75146484375, 8.0460205078125, 8.340576171875, 8.6351318359375, 8.9296875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 40.0, 290.0, 536.0, 130.0, 17.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.43467712402344, -72.67379760742188, -70.91292572021484, -69.15204620361328, -67.39116668701172, -65.63029479980469, -63.869415283203125, -62.10853576660156, -60.347660064697266, -58.58678436279297, -56.825904846191406, -55.06502914428711, -53.30415344238281, -51.54327392578125, -49.78239822387695, -48.021522521972656, -46.260643005371094, -44.4997673034668, -42.738887786865234, -40.97801208496094, -39.21713638305664, -37.45625686645508, -35.69538116455078, -33.93450164794922, -32.17362976074219, -30.412752151489258, -28.65187644958496, -26.89099884033203, -25.1301212310791, -23.369243621826172, -21.608367919921875, -19.847490310668945, -18.086612701416016, -16.325735092163086, -14.564858436584473, -12.80398178100586, -11.04310417175293, -9.282227516174316, -7.521350860595703, -5.760473251342773, -3.99959659576416, -2.2387194633483887, -0.4778425693511963, 1.283034324645996, 3.0439114570617676, 4.804788589477539, 6.565665245056152, 8.326542854309082, 10.087419509887695, 11.848296165466309, 13.609173774719238, 15.370050430297852, 17.13092803955078, 18.891803741455078, 20.652681350708008, 22.413558959960938, 24.174434661865234, 25.935312271118164, 27.69618797302246, 29.45706558227539, 31.21794319152832, 32.97882080078125, 34.73969650268555, 36.500572204589844, 38.261451721191406]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 9.0, 10.0, 12.0, 10.0, 14.0, 17.0, 16.0, 22.0, 31.0, 31.0, 29.0, 28.0, 30.0, 22.0, 36.0, 36.0, 33.0, 46.0, 30.0, 34.0, 46.0, 50.0, 35.0, 42.0, 27.0, 37.0, 26.0, 25.0, 34.0, 23.0, 20.0, 26.0, 17.0, 19.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.29312801361084, -9.966480255126953, -9.639832496643066, -9.31318473815918, -8.98653793334961, -8.659890174865723, -8.333242416381836, -8.00659465789795, -7.6799468994140625, -7.353299140930176, -7.026651382446289, -6.7000041007995605, -6.373356342315674, -6.046708583831787, -5.720061302185059, -5.393413543701172, -5.066765785217285, -4.740118026733398, -4.413470268249512, -4.086822986602783, -3.7601752281188965, -3.4335274696350098, -3.106879949569702, -2.7802324295043945, -2.453584671020508, -2.126936912536621, -1.8002893924713135, -1.4736417531967163, -1.1469941139221191, -0.820346474647522, -0.4936988353729248, -0.1670513153076172, 0.15959548950195312, 0.4862431287765503, 0.8128907680511475, 1.1395384073257446, 1.4661860466003418, 1.792833685874939, 2.119481325149536, 2.4461288452148438, 2.7727766036987305, 3.099424362182617, 3.426071882247925, 3.7527194023132324, 4.079367160797119, 4.406014919281006, 4.732662200927734, 5.059309959411621, 5.385957717895508, 5.7126054763793945, 6.039253234863281, 6.36590051651001, 6.6925482749938965, 7.019196033477783, 7.345843315124512, 7.672491073608398, 7.999138832092285, 8.325786590576172, 8.652434349060059, 8.979082107543945, 9.305728912353516, 9.632376670837402, 9.959024429321289, 10.285672187805176, 10.612319946289062]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 9.0, 8.0, 16.0, 14.0, 27.0, 24.0, 24.0, 30.0, 30.0, 35.0, 50.0, 39.0, 40.0, 60.0, 56.0, 51.0, 56.0, 65.0, 56.0, 40.0, 35.0, 37.0, 27.0, 24.0, 24.0, 20.0, 16.0, 16.0, 13.0, 8.0, 5.0, 5.0, 2.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.392578125, -1.3492279052734375, -1.305877685546875, -1.2625274658203125, -1.21917724609375, -1.1758270263671875, -1.132476806640625, -1.0891265869140625, -1.0457763671875, -1.0024261474609375, -0.959075927734375, -0.9157257080078125, -0.87237548828125, -0.8290252685546875, -0.785675048828125, -0.7423248291015625, -0.698974609375, -0.6556243896484375, -0.612274169921875, -0.5689239501953125, -0.52557373046875, -0.4822235107421875, -0.438873291015625, -0.3955230712890625, -0.3521728515625, -0.3088226318359375, -0.265472412109375, -0.2221221923828125, -0.17877197265625, -0.1354217529296875, -0.092071533203125, -0.0487213134765625, -0.00537109375, 0.0379791259765625, 0.081329345703125, 0.1246795654296875, 0.16802978515625, 0.2113800048828125, 0.254730224609375, 0.2980804443359375, 0.3414306640625, 0.3847808837890625, 0.428131103515625, 0.4714813232421875, 0.51483154296875, 0.5581817626953125, 0.601531982421875, 0.6448822021484375, 0.688232421875, 0.7315826416015625, 0.774932861328125, 0.8182830810546875, 0.86163330078125, 0.9049835205078125, 0.948333740234375, 0.9916839599609375, 1.0350341796875, 1.0783843994140625, 1.121734619140625, 1.1650848388671875, 1.20843505859375, 1.2517852783203125, 1.295135498046875, 1.3384857177734375, 1.3818359375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 10.0, 9.0, 21.0, 26.0, 28.0, 38.0, 53.0, 49.0, 104.0, 170.0, 357.0, 816.0, 2196.0, 6318.0, 23345.0, 150239.0, 2792422.0, 1130931.0, 65058.0, 14454.0, 4576.0, 1607.0, 702.0, 308.0, 151.0, 86.0, 50.0, 38.0, 24.0, 20.0, 15.0, 13.0, 8.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4765625, -4.34417724609375, -4.2117919921875, -4.07940673828125, -3.947021484375, -3.81463623046875, -3.6822509765625, -3.54986572265625, -3.41748046875, -3.28509521484375, -3.1527099609375, -3.02032470703125, -2.887939453125, -2.75555419921875, -2.6231689453125, -2.49078369140625, -2.3583984375, -2.22601318359375, -2.0936279296875, -1.96124267578125, -1.828857421875, -1.69647216796875, -1.5640869140625, -1.43170166015625, -1.29931640625, -1.16693115234375, -1.0345458984375, -0.90216064453125, -0.769775390625, -0.63739013671875, -0.5050048828125, -0.37261962890625, -0.240234375, -0.10784912109375, 0.0245361328125, 0.15692138671875, 0.289306640625, 0.42169189453125, 0.5540771484375, 0.68646240234375, 0.81884765625, 0.95123291015625, 1.0836181640625, 1.21600341796875, 1.348388671875, 1.48077392578125, 1.6131591796875, 1.74554443359375, 1.8779296875, 2.01031494140625, 2.1427001953125, 2.27508544921875, 2.407470703125, 2.53985595703125, 2.6722412109375, 2.80462646484375, 2.93701171875, 3.06939697265625, 3.2017822265625, 3.33416748046875, 3.466552734375, 3.59893798828125, 3.7313232421875, 3.86370849609375, 3.99609375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 4.0, 9.0, 13.0, 14.0, 19.0, 23.0, 35.0, 37.0, 60.0, 79.0, 86.0, 142.0, 170.0, 252.0, 362.0, 497.0, 566.0, 497.0, 370.0, 238.0, 151.0, 112.0, 73.0, 58.0, 50.0, 31.0, 26.0, 22.0, 21.0, 12.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.00390625, -2.916412353515625, -2.82891845703125, -2.741424560546875, -2.6539306640625, -2.566436767578125, -2.47894287109375, -2.391448974609375, -2.303955078125, -2.216461181640625, -2.12896728515625, -2.041473388671875, -1.9539794921875, -1.866485595703125, -1.77899169921875, -1.691497802734375, -1.60400390625, -1.516510009765625, -1.42901611328125, -1.341522216796875, -1.2540283203125, -1.166534423828125, -1.07904052734375, -0.991546630859375, -0.904052734375, -0.816558837890625, -0.72906494140625, -0.641571044921875, -0.5540771484375, -0.466583251953125, -0.37908935546875, -0.291595458984375, -0.2041015625, -0.116607666015625, -0.02911376953125, 0.058380126953125, 0.1458740234375, 0.233367919921875, 0.32086181640625, 0.408355712890625, 0.495849609375, 0.583343505859375, 0.67083740234375, 0.758331298828125, 0.8458251953125, 0.933319091796875, 1.02081298828125, 1.108306884765625, 1.19580078125, 1.283294677734375, 1.37078857421875, 1.458282470703125, 1.5457763671875, 1.633270263671875, 1.72076416015625, 1.808258056640625, 1.895751953125, 1.983245849609375, 2.07073974609375, 2.158233642578125, 2.2457275390625, 2.333221435546875, 2.42071533203125, 2.508209228515625, 2.595703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 10.0, 22.0, 24.0, 37.0, 42.0, 72.0, 125.0, 233.0, 550.0, 1289.0, 3959.0, 16782.0, 107224.0, 2402782.0, 1560249.0, 81754.0, 13508.0, 3408.0, 1134.0, 468.0, 229.0, 122.0, 79.0, 50.0, 29.0, 18.0, 15.0, 12.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.76995849609375, -6.5438232421875, -6.31768798828125, -6.091552734375, -5.86541748046875, -5.6392822265625, -5.41314697265625, -5.18701171875, -4.96087646484375, -4.7347412109375, -4.50860595703125, -4.282470703125, -4.05633544921875, -3.8302001953125, -3.60406494140625, -3.3779296875, -3.15179443359375, -2.9256591796875, -2.69952392578125, -2.473388671875, -2.24725341796875, -2.0211181640625, -1.79498291015625, -1.56884765625, -1.34271240234375, -1.1165771484375, -0.89044189453125, -0.664306640625, -0.43817138671875, -0.2120361328125, 0.01409912109375, 0.240234375, 0.46636962890625, 0.6925048828125, 0.91864013671875, 1.144775390625, 1.37091064453125, 1.5970458984375, 1.82318115234375, 2.04931640625, 2.27545166015625, 2.5015869140625, 2.72772216796875, 2.953857421875, 3.17999267578125, 3.4061279296875, 3.63226318359375, 3.8583984375, 4.08453369140625, 4.3106689453125, 4.53680419921875, 4.762939453125, 4.98907470703125, 5.2152099609375, 5.44134521484375, 5.66748046875, 5.89361572265625, 6.1197509765625, 6.34588623046875, 6.572021484375, 6.79815673828125, 7.0242919921875, 7.25042724609375, 7.4765625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 15.0, 26.0, 54.0, 108.0, 185.0, 208.0, 186.0, 120.0, 60.0, 25.0, 13.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.76798629760742, -31.846311569213867, -30.92463493347168, -30.002960205078125, -29.08128547668457, -28.159608840942383, -27.237934112548828, -26.31625747680664, -25.394582748413086, -24.47290802001953, -23.551231384277344, -22.62955665588379, -21.707881927490234, -20.786205291748047, -19.864530563354492, -18.942855834960938, -18.02117919921875, -17.099504470825195, -16.177827835083008, -15.256153106689453, -14.334477424621582, -13.412801742553711, -12.491127014160156, -11.569451332092285, -10.647777557373047, -9.726101875305176, -8.804427146911621, -7.88275146484375, -6.961075782775879, -6.039400577545166, -5.117725372314453, -4.196049690246582, -3.274374008178711, -2.352698564529419, -1.4310232400894165, -0.5093479156494141, 0.41232752799987793, 1.33400297164917, 2.255678176879883, 3.177353858947754, 4.099029064178467, 5.02070426940918, 5.942379951477051, 6.864055156707764, 7.785730361938477, 8.707406044006348, 9.629081726074219, 10.550756454467773, 11.472432136535645, 12.394107818603516, 13.31578254699707, 14.237458229064941, 15.159133911132812, 16.080808639526367, 17.002483367919922, 17.92416000366211, 18.845834732055664, 19.76750946044922, 20.689186096191406, 21.61086082458496, 22.532535552978516, 23.454212188720703, 24.375886917114258, 25.297561645507812, 26.21923828125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 14.0, 11.0, 12.0, 6.0, 13.0, 15.0, 26.0, 21.0, 26.0, 27.0, 27.0, 32.0, 36.0, 46.0, 40.0, 45.0, 50.0, 26.0, 32.0, 33.0, 46.0, 41.0, 39.0, 39.0, 23.0, 39.0, 26.0, 31.0, 30.0, 28.0, 24.0, 6.0, 19.0, 12.0, 11.0, 8.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.187625885009766, -8.903886795043945, -8.620147705078125, -8.336409568786621, -8.0526704788208, -7.7689313888549805, -7.485192775726318, -7.201454162597656, -6.917715072631836, -6.633975982666016, -6.3502373695373535, -6.066498756408691, -5.782759666442871, -5.499020576477051, -5.215281963348389, -4.931543350219727, -4.647804260253906, -4.364065170288086, -4.080326557159424, -3.7965877056121826, -3.5128488540649414, -3.2291100025177, -2.945371150970459, -2.6616322994232178, -2.3778934478759766, -2.0941545963287354, -1.8104157447814941, -1.526676893234253, -1.2429380416870117, -0.9591991901397705, -0.6754603385925293, -0.3917214870452881, -0.10798168182373047, 0.17575716972351074, 0.45949602127075195, 0.7432348728179932, 1.0269737243652344, 1.3107125759124756, 1.5944514274597168, 1.878190279006958, 2.161929130554199, 2.4456679821014404, 2.7294068336486816, 3.013145685195923, 3.296884536743164, 3.5806233882904053, 3.8643622398376465, 4.148100852966309, 4.431839942932129, 4.715579032897949, 4.999317646026611, 5.283056259155273, 5.566795349121094, 5.850534439086914, 6.134273052215576, 6.418011665344238, 6.701750755310059, 6.985489845275879, 7.269228458404541, 7.552967071533203, 7.836706161499023, 8.120445251464844, 8.404184341430664, 8.687922477722168, 8.971661567687988]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 7.0, 12.0, 14.0, 27.0, 14.0, 38.0, 36.0, 39.0, 48.0, 46.0, 59.0, 57.0, 62.0, 75.0, 74.0, 68.0, 62.0, 42.0, 39.0, 32.0, 31.0, 29.0, 24.0, 22.0, 8.0, 14.0, 7.0, 5.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.08984375, -2.0339508056640625, -1.978057861328125, -1.9221649169921875, -1.86627197265625, -1.8103790283203125, -1.754486083984375, -1.6985931396484375, -1.6427001953125, -1.5868072509765625, -1.530914306640625, -1.4750213623046875, -1.41912841796875, -1.3632354736328125, -1.307342529296875, -1.2514495849609375, -1.195556640625, -1.1396636962890625, -1.083770751953125, -1.0278778076171875, -0.97198486328125, -0.9160919189453125, -0.860198974609375, -0.8043060302734375, -0.7484130859375, -0.6925201416015625, -0.636627197265625, -0.5807342529296875, -0.52484130859375, -0.4689483642578125, -0.413055419921875, -0.3571624755859375, -0.30126953125, -0.2453765869140625, -0.189483642578125, -0.1335906982421875, -0.07769775390625, -0.0218048095703125, 0.034088134765625, 0.0899810791015625, 0.1458740234375, 0.2017669677734375, 0.257659912109375, 0.3135528564453125, 0.36944580078125, 0.4253387451171875, 0.481231689453125, 0.5371246337890625, 0.593017578125, 0.6489105224609375, 0.704803466796875, 0.7606964111328125, 0.81658935546875, 0.8724822998046875, 0.928375244140625, 0.9842681884765625, 1.0401611328125, 1.0960540771484375, 1.151947021484375, 1.2078399658203125, 1.26373291015625, 1.3196258544921875, 1.375518798828125, 1.4314117431640625, 1.4873046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 3.0, 6.0, 11.0, 15.0, 15.0, 36.0, 36.0, 64.0, 87.0, 154.0, 264.0, 438.0, 718.0, 1299.0, 2248.0, 4107.0, 7536.0, 13287.0, 24447.0, 43571.0, 73575.0, 114728.0, 155522.0, 174763.0, 153221.0, 112237.0, 71395.0, 42030.0, 23483.0, 13017.0, 7115.0, 3940.0, 2085.0, 1284.0, 744.0, 413.0, 237.0, 179.0, 76.0, 47.0, 48.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.939453125, -0.9095993041992188, -0.8797454833984375, -0.8498916625976562, -0.820037841796875, -0.7901840209960938, -0.7603302001953125, -0.7304763793945312, -0.70062255859375, -0.6707687377929688, -0.6409149169921875, -0.6110610961914062, -0.581207275390625, -0.5513534545898438, -0.5214996337890625, -0.49164581298828125, -0.4617919921875, -0.43193817138671875, -0.4020843505859375, -0.37223052978515625, -0.342376708984375, -0.31252288818359375, -0.2826690673828125, -0.25281524658203125, -0.22296142578125, -0.19310760498046875, -0.1632537841796875, -0.13339996337890625, -0.103546142578125, -0.07369232177734375, -0.0438385009765625, -0.01398468017578125, 0.015869140625, 0.04572296142578125, 0.0755767822265625, 0.10543060302734375, 0.135284423828125, 0.16513824462890625, 0.1949920654296875, 0.22484588623046875, 0.25469970703125, 0.28455352783203125, 0.3144073486328125, 0.34426116943359375, 0.374114990234375, 0.40396881103515625, 0.4338226318359375, 0.46367645263671875, 0.4935302734375, 0.5233840942382812, 0.5532379150390625, 0.5830917358398438, 0.612945556640625, 0.6427993774414062, 0.6726531982421875, 0.7025070190429688, 0.73236083984375, 0.7622146606445312, 0.7920684814453125, 0.8219223022460938, 0.851776123046875, 0.8816299438476562, 0.9114837646484375, 0.9413375854492188, 0.97119140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 8.0, 11.0, 8.0, 11.0, 18.0, 28.0, 25.0, 44.0, 28.0, 39.0, 43.0, 35.0, 43.0, 44.0, 46.0, 1065.0, 53.0, 39.0, 58.0, 41.0, 40.0, 35.0, 41.0, 25.0, 25.0, 30.0, 22.0, 14.0, 23.0, 13.0, 11.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4771270751953125, -1.435699462890625, -1.3942718505859375, -1.35284423828125, -1.3114166259765625, -1.269989013671875, -1.2285614013671875, -1.1871337890625, -1.1457061767578125, -1.104278564453125, -1.0628509521484375, -1.02142333984375, -0.9799957275390625, -0.938568115234375, -0.8971405029296875, -0.855712890625, -0.8142852783203125, -0.772857666015625, -0.7314300537109375, -0.69000244140625, -0.6485748291015625, -0.607147216796875, -0.5657196044921875, -0.5242919921875, -0.4828643798828125, -0.441436767578125, -0.4000091552734375, -0.35858154296875, -0.3171539306640625, -0.275726318359375, -0.2342987060546875, -0.19287109375, -0.1514434814453125, -0.110015869140625, -0.0685882568359375, -0.02716064453125, 0.0142669677734375, 0.055694580078125, 0.0971221923828125, 0.1385498046875, 0.1799774169921875, 0.221405029296875, 0.2628326416015625, 0.30426025390625, 0.3456878662109375, 0.387115478515625, 0.4285430908203125, 0.469970703125, 0.5113983154296875, 0.552825927734375, 0.5942535400390625, 0.63568115234375, 0.6771087646484375, 0.718536376953125, 0.7599639892578125, 0.8013916015625, 0.8428192138671875, 0.884246826171875, 0.9256744384765625, 0.96710205078125, 1.0085296630859375, 1.049957275390625, 1.0913848876953125, 1.1328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 13.0, 11.0, 20.0, 29.0, 40.0, 49.0, 64.0, 120.0, 154.0, 251.0, 310.0, 431.0, 666.0, 887.0, 1275.0, 1878.0, 2652.0, 3862.0, 5764.0, 8390.0, 12789.0, 20996.0, 42141.0, 159470.0, 1458562.0, 255442.0, 53562.0, 23845.0, 14327.0, 9197.0, 6277.0, 4165.0, 2828.0, 1961.0, 1450.0, 932.0, 647.0, 497.0, 338.0, 245.0, 180.0, 116.0, 87.0, 64.0, 32.0, 36.0, 21.0, 11.0, 13.0, 17.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.93408203125, -0.904541015625, -0.875, -0.845458984375, -0.81591796875, -0.786376953125, -0.7568359375, -0.727294921875, -0.69775390625, -0.668212890625, -0.638671875, -0.609130859375, -0.57958984375, -0.550048828125, -0.5205078125, -0.490966796875, -0.46142578125, -0.431884765625, -0.40234375, -0.372802734375, -0.34326171875, -0.313720703125, -0.2841796875, -0.254638671875, -0.22509765625, -0.195556640625, -0.166015625, -0.136474609375, -0.10693359375, -0.077392578125, -0.0478515625, -0.018310546875, 0.01123046875, 0.040771484375, 0.0703125, 0.099853515625, 0.12939453125, 0.158935546875, 0.1884765625, 0.218017578125, 0.24755859375, 0.277099609375, 0.306640625, 0.336181640625, 0.36572265625, 0.395263671875, 0.4248046875, 0.454345703125, 0.48388671875, 0.513427734375, 0.54296875, 0.572509765625, 0.60205078125, 0.631591796875, 0.6611328125, 0.690673828125, 0.72021484375, 0.749755859375, 0.779296875, 0.808837890625, 0.83837890625, 0.867919921875, 0.8974609375, 0.927001953125, 0.95654296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 9.0, 5.0, 3.0, 10.0, 20.0, 24.0, 35.0, 39.0, 61.0, 79.0, 82.0, 115.0, 118.0, 111.0, 72.0, 48.0, 45.0, 32.0, 20.0, 19.0, 9.0, 7.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2119140625, -0.20529937744140625, -0.1986846923828125, -0.19207000732421875, -0.185455322265625, -0.17884063720703125, -0.1722259521484375, -0.16561126708984375, -0.15899658203125, -0.15238189697265625, -0.1457672119140625, -0.13915252685546875, -0.132537841796875, -0.12592315673828125, -0.1193084716796875, -0.11269378662109375, -0.1060791015625, -0.09946441650390625, -0.0928497314453125, -0.08623504638671875, -0.079620361328125, -0.07300567626953125, -0.0663909912109375, -0.05977630615234375, -0.05316162109375, -0.04654693603515625, -0.0399322509765625, -0.03331756591796875, -0.026702880859375, -0.02008819580078125, -0.0134735107421875, -0.00685882568359375, -0.000244140625, 0.00637054443359375, 0.0129852294921875, 0.01959991455078125, 0.026214599609375, 0.03282928466796875, 0.0394439697265625, 0.04605865478515625, 0.05267333984375, 0.05928802490234375, 0.0659027099609375, 0.07251739501953125, 0.079132080078125, 0.08574676513671875, 0.0923614501953125, 0.09897613525390625, 0.1055908203125, 0.11220550537109375, 0.1188201904296875, 0.12543487548828125, 0.132049560546875, 0.13866424560546875, 0.1452789306640625, 0.15189361572265625, 0.15850830078125, 0.16512298583984375, 0.1717376708984375, 0.17835235595703125, 0.184967041015625, 0.19158172607421875, 0.1981964111328125, 0.20481109619140625, 0.21142578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 6.0, 7.0, 8.0, 8.0, 15.0, 17.0, 24.0, 42.0, 96.0, 192.0, 572.0, 2126.0, 11882.0, 822747.0, 201999.0, 6593.0, 1438.0, 430.0, 137.0, 76.0, 44.0, 22.0, 21.0, 14.0, 8.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.021240234375, -2.92333984375, -2.825439453125, -2.7275390625, -2.629638671875, -2.53173828125, -2.433837890625, -2.3359375, -2.238037109375, -2.14013671875, -2.042236328125, -1.9443359375, -1.846435546875, -1.74853515625, -1.650634765625, -1.552734375, -1.454833984375, -1.35693359375, -1.259033203125, -1.1611328125, -1.063232421875, -0.96533203125, -0.867431640625, -0.76953125, -0.671630859375, -0.57373046875, -0.475830078125, -0.3779296875, -0.280029296875, -0.18212890625, -0.084228515625, 0.013671875, 0.111572265625, 0.20947265625, 0.307373046875, 0.4052734375, 0.503173828125, 0.60107421875, 0.698974609375, 0.796875, 0.894775390625, 0.99267578125, 1.090576171875, 1.1884765625, 1.286376953125, 1.38427734375, 1.482177734375, 1.580078125, 1.677978515625, 1.77587890625, 1.873779296875, 1.9716796875, 2.069580078125, 2.16748046875, 2.265380859375, 2.36328125, 2.461181640625, 2.55908203125, 2.656982421875, 2.7548828125, 2.852783203125, 2.95068359375, 3.048583984375, 3.146484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 28.0, 58.0, 100.0, 192.0, 269.0, 164.0, 87.0, 46.0, 20.0, 9.0, 6.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.608473539352417, -2.5345613956451416, -2.4606494903564453, -2.38673734664917, -2.3128254413604736, -2.2389132976531982, -2.165001392364502, -2.0910892486572266, -2.017177104949951, -1.9432650804519653, -1.8693530559539795, -1.7954410314559937, -1.7215290069580078, -1.6476168632507324, -1.5737048387527466, -1.4997928142547607, -1.4258809089660645, -1.3519688844680786, -1.2780568599700928, -1.204144835472107, -1.130232810974121, -1.0563206672668457, -0.9824086427688599, -0.908496618270874, -0.8345845937728882, -0.7606725692749023, -0.6867605447769165, -0.6128484606742859, -0.5389364361763, -0.4650244116783142, -0.391112357378006, -0.31720030307769775, -0.24328827857971191, -0.16937623918056488, -0.09546419978141785, -0.021552160382270813, 0.05235987901687622, 0.12627190351486206, 0.2001839578151703, 0.2740960121154785, 0.34800803661346436, 0.4219200611114502, 0.4958321154117584, 0.5697441697120667, 0.6436561942100525, 0.7175682187080383, 0.791480302810669, 0.8653923273086548, 0.9393043518066406, 1.0132163763046265, 1.0871284008026123, 1.1610404253005981, 1.234952449798584, 1.3088645935058594, 1.3827766180038452, 1.456688642501831, 1.530600666999817, 1.6045126914978027, 1.6784247159957886, 1.7523367404937744, 1.8262488842010498, 1.900160789489746, 1.9740729331970215, 2.047985076904297, 2.121896982192993]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 14.0, 9.0, 17.0, 25.0, 34.0, 41.0, 54.0, 43.0, 37.0, 50.0, 53.0, 50.0, 65.0, 53.0, 65.0, 56.0, 48.0, 45.0, 31.0, 32.0, 32.0, 21.0, 23.0, 22.0, 11.0, 15.0, 3.0, 13.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8811373114585876, -0.8552358150482178, -0.8293343186378479, -0.803432822227478, -0.7775313854217529, -0.7516298890113831, -0.7257283926010132, -0.6998268961906433, -0.6739253997802734, -0.6480239033699036, -0.6221224069595337, -0.5962209701538086, -0.5703194737434387, -0.5444179773330688, -0.518516480922699, -0.4926149845123291, -0.466713547706604, -0.44081205129623413, -0.41491058468818665, -0.3890090882778168, -0.3631076216697693, -0.3372061252593994, -0.31130462884902954, -0.28540313243865967, -0.2595016658306122, -0.2336001843214035, -0.20769870281219482, -0.18179720640182495, -0.15589572489261627, -0.1299942433834076, -0.10409274697303772, -0.07819126546382904, -0.05228978395462036, -0.026388298720121384, -0.000486813485622406, 0.02541467547416687, 0.05131615698337555, 0.07721763849258423, 0.1031191349029541, 0.12902061641216278, 0.15492209792137146, 0.18082357943058014, 0.20672506093978882, 0.2326265573501587, 0.25852805376052856, 0.28442952036857605, 0.3103310167789459, 0.3362324833869934, 0.3621339797973633, 0.38803547620773315, 0.41393694281578064, 0.4398384392261505, 0.465739905834198, 0.49164140224456787, 0.5175428986549377, 0.5434443950653076, 0.5693458318710327, 0.5952473282814026, 0.6211488246917725, 0.6470502614974976, 0.6729517579078674, 0.6988532543182373, 0.7247547507286072, 0.750656247138977, 0.7765577435493469]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 13.0, 13.0, 20.0, 28.0, 36.0, 37.0, 49.0, 46.0, 43.0, 45.0, 66.0, 56.0, 74.0, 76.0, 62.0, 51.0, 56.0, 35.0, 34.0, 24.0, 35.0, 18.0, 18.0, 17.0, 16.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.06640625, -2.012451171875, -1.95849609375, -1.904541015625, -1.8505859375, -1.796630859375, -1.74267578125, -1.688720703125, -1.634765625, -1.580810546875, -1.52685546875, -1.472900390625, -1.4189453125, -1.364990234375, -1.31103515625, -1.257080078125, -1.203125, -1.149169921875, -1.09521484375, -1.041259765625, -0.9873046875, -0.933349609375, -0.87939453125, -0.825439453125, -0.771484375, -0.717529296875, -0.66357421875, -0.609619140625, -0.5556640625, -0.501708984375, -0.44775390625, -0.393798828125, -0.33984375, -0.285888671875, -0.23193359375, -0.177978515625, -0.1240234375, -0.070068359375, -0.01611328125, 0.037841796875, 0.091796875, 0.145751953125, 0.19970703125, 0.253662109375, 0.3076171875, 0.361572265625, 0.41552734375, 0.469482421875, 0.5234375, 0.577392578125, 0.63134765625, 0.685302734375, 0.7392578125, 0.793212890625, 0.84716796875, 0.901123046875, 0.955078125, 1.009033203125, 1.06298828125, 1.116943359375, 1.1708984375, 1.224853515625, 1.27880859375, 1.332763671875, 1.38671875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 12.0, 14.0, 26.0, 29.0, 59.0, 100.0, 170.0, 297.0, 531.0, 1092.0, 2199.0, 5277.0, 13608.0, 40056.0, 142718.0, 498398.0, 246286.0, 64039.0, 20199.0, 7354.0, 3096.0, 1410.0, 697.0, 360.0, 222.0, 126.0, 70.0, 41.0, 21.0, 16.0, 11.0, 7.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.052276611328125, -1.98541259765625, -1.918548583984375, -1.8516845703125, -1.784820556640625, -1.71795654296875, -1.651092529296875, -1.584228515625, -1.517364501953125, -1.45050048828125, -1.383636474609375, -1.3167724609375, -1.249908447265625, -1.18304443359375, -1.116180419921875, -1.04931640625, -0.982452392578125, -0.91558837890625, -0.848724365234375, -0.7818603515625, -0.714996337890625, -0.64813232421875, -0.581268310546875, -0.514404296875, -0.447540283203125, -0.38067626953125, -0.313812255859375, -0.2469482421875, -0.180084228515625, -0.11322021484375, -0.046356201171875, 0.0205078125, 0.087371826171875, 0.15423583984375, 0.221099853515625, 0.2879638671875, 0.354827880859375, 0.42169189453125, 0.488555908203125, 0.555419921875, 0.622283935546875, 0.68914794921875, 0.756011962890625, 0.8228759765625, 0.889739990234375, 0.95660400390625, 1.023468017578125, 1.09033203125, 1.157196044921875, 1.22406005859375, 1.290924072265625, 1.3577880859375, 1.424652099609375, 1.49151611328125, 1.558380126953125, 1.625244140625, 1.692108154296875, 1.75897216796875, 1.825836181640625, 1.8927001953125, 1.959564208984375, 2.02642822265625, 2.093292236328125, 2.16015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 12.0, 10.0, 11.0, 13.0, 13.0, 22.0, 23.0, 31.0, 36.0, 35.0, 38.0, 39.0, 51.0, 60.0, 85.0, 111.0, 204.0, 1449.0, 216.0, 110.0, 70.0, 87.0, 56.0, 27.0, 39.0, 30.0, 26.0, 26.0, 28.0, 18.0, 17.0, 12.0, 7.0, 2.0, 3.0, 4.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.310791015625, -4.16455078125, -4.018310546875, -3.8720703125, -3.725830078125, -3.57958984375, -3.433349609375, -3.287109375, -3.140869140625, -2.99462890625, -2.848388671875, -2.7021484375, -2.555908203125, -2.40966796875, -2.263427734375, -2.1171875, -1.970947265625, -1.82470703125, -1.678466796875, -1.5322265625, -1.385986328125, -1.23974609375, -1.093505859375, -0.947265625, -0.801025390625, -0.65478515625, -0.508544921875, -0.3623046875, -0.216064453125, -0.06982421875, 0.076416015625, 0.22265625, 0.368896484375, 0.51513671875, 0.661376953125, 0.8076171875, 0.953857421875, 1.10009765625, 1.246337890625, 1.392578125, 1.538818359375, 1.68505859375, 1.831298828125, 1.9775390625, 2.123779296875, 2.27001953125, 2.416259765625, 2.5625, 2.708740234375, 2.85498046875, 3.001220703125, 3.1474609375, 3.293701171875, 3.43994140625, 3.586181640625, 3.732421875, 3.878662109375, 4.02490234375, 4.171142578125, 4.3173828125, 4.463623046875, 4.60986328125, 4.756103515625, 4.90234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 19.0, 24.0, 27.0, 42.0, 100.0, 120.0, 199.0, 354.0, 865.0, 2773.0, 26514.0, 2829568.0, 275007.0, 7227.0, 1539.0, 524.0, 280.0, 190.0, 109.0, 62.0, 36.0, 36.0, 23.0, 13.0, 10.0, 13.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.318603515625, -10.97314453125, -10.627685546875, -10.2822265625, -9.936767578125, -9.59130859375, -9.245849609375, -8.900390625, -8.554931640625, -8.20947265625, -7.864013671875, -7.5185546875, -7.173095703125, -6.82763671875, -6.482177734375, -6.13671875, -5.791259765625, -5.44580078125, -5.100341796875, -4.7548828125, -4.409423828125, -4.06396484375, -3.718505859375, -3.373046875, -3.027587890625, -2.68212890625, -2.336669921875, -1.9912109375, -1.645751953125, -1.30029296875, -0.954833984375, -0.609375, -0.263916015625, 0.08154296875, 0.427001953125, 0.7724609375, 1.117919921875, 1.46337890625, 1.808837890625, 2.154296875, 2.499755859375, 2.84521484375, 3.190673828125, 3.5361328125, 3.881591796875, 4.22705078125, 4.572509765625, 4.91796875, 5.263427734375, 5.60888671875, 5.954345703125, 6.2998046875, 6.645263671875, 6.99072265625, 7.336181640625, 7.681640625, 8.027099609375, 8.37255859375, 8.718017578125, 9.0634765625, 9.408935546875, 9.75439453125, 10.099853515625, 10.4453125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 147.0, 748.0, 112.0, 5.0, 2.0, 0.0, 2.0], "bins": [-133.59580993652344, -131.31063842773438, -129.02548217773438, -126.74031066894531, -124.45513916015625, -122.16997528076172, -119.88480377197266, -117.59963989257812, -115.31446838378906, -113.02930450439453, -110.74413299560547, -108.45896911621094, -106.17379760742188, -103.88863372802734, -101.60346221923828, -99.31829833984375, -97.03312683105469, -94.74796295166016, -92.4627914428711, -90.17762756347656, -87.8924560546875, -85.60729217529297, -83.3221206665039, -81.03695678710938, -78.75179290771484, -76.46662902832031, -74.18145751953125, -71.89629364013672, -69.61112213134766, -67.32595825195312, -65.04078674316406, -62.75562286376953, -60.4704475402832, -58.185279846191406, -55.90011215209961, -53.61494445800781, -51.329776763916016, -49.04460906982422, -46.75944519042969, -44.474273681640625, -42.189109802246094, -39.9039421081543, -37.6187744140625, -35.3336067199707, -33.048439025878906, -30.76327133178711, -28.478105545043945, -26.19293785095215, -23.90776824951172, -21.622600555419922, -19.337432861328125, -17.052265167236328, -14.767098426818848, -12.48193073272705, -10.19676399230957, -7.911596298217773, -5.626428604125977, -3.341261148452759, -1.056093692779541, 1.2290735244750977, 3.5142412185668945, 5.799408912658691, 8.084575653076172, 10.369743347167969, 12.654911041259766]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 9.0, 2.0, 11.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 21.0, 20.0, 20.0, 28.0, 39.0, 27.0, 31.0, 33.0, 23.0, 47.0, 28.0, 36.0, 36.0, 30.0, 39.0, 32.0, 41.0, 29.0, 29.0, 56.0, 33.0, 21.0, 27.0, 26.0, 18.0, 19.0, 17.0, 14.0, 23.0, 13.0, 9.0, 4.0, 10.0, 8.0, 6.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21320915222168, -9.859966278076172, -9.50672435760498, -9.153481483459473, -8.800239562988281, -8.446996688842773, -8.093753814697266, -7.740511894226074, -7.387269020080566, -7.034026622772217, -6.680784225463867, -6.327541351318359, -5.97429895401001, -5.62105655670166, -5.2678141593933105, -4.914571762084961, -4.561329364776611, -4.208086967468262, -3.854844331741333, -3.5016019344329834, -3.1483592987060547, -2.795116901397705, -2.4418745040893555, -2.0886318683624268, -1.7353894710540771, -1.382146954536438, -1.0289044380187988, -0.6756620407104492, -0.32241952419281006, 0.0308229923248291, 0.3840653896331787, 0.7373080253601074, 1.090550422668457, 1.4437929391860962, 1.7970354557037354, 2.150277853012085, 2.5035204887390137, 2.8567628860473633, 3.210005283355713, 3.5632479190826416, 3.916490316390991, 4.26973295211792, 4.6229753494262695, 4.976217746734619, 5.329460144042969, 5.682703018188477, 6.035944938659668, 6.389187812805176, 6.742430210113525, 7.095672607421875, 7.448915004730225, 7.802157402038574, 8.155400276184082, 8.508642196655273, 8.861885070800781, 9.215127944946289, 9.56836986541748, 9.921612739562988, 10.27485466003418, 10.628097534179688, 10.981339454650879, 11.334582328796387, 11.687824249267578, 12.041067123413086, 12.394309997558594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 6.0, 6.0, 15.0, 17.0, 18.0, 25.0, 38.0, 36.0, 36.0, 39.0, 62.0, 57.0, 71.0, 70.0, 57.0, 67.0, 64.0, 53.0, 51.0, 47.0, 39.0, 23.0, 30.0, 21.0, 15.0, 11.0, 7.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0407257080078125, -1.983795166015625, -1.9268646240234375, -1.86993408203125, -1.8130035400390625, -1.756072998046875, -1.6991424560546875, -1.6422119140625, -1.5852813720703125, -1.528350830078125, -1.4714202880859375, -1.41448974609375, -1.3575592041015625, -1.300628662109375, -1.2436981201171875, -1.186767578125, -1.1298370361328125, -1.072906494140625, -1.0159759521484375, -0.95904541015625, -0.9021148681640625, -0.845184326171875, -0.7882537841796875, -0.7313232421875, -0.6743927001953125, -0.617462158203125, -0.5605316162109375, -0.50360107421875, -0.4466705322265625, -0.389739990234375, -0.3328094482421875, -0.27587890625, -0.2189483642578125, -0.162017822265625, -0.1050872802734375, -0.04815673828125, 0.0087738037109375, 0.065704345703125, 0.1226348876953125, 0.1795654296875, 0.2364959716796875, 0.293426513671875, 0.3503570556640625, 0.40728759765625, 0.4642181396484375, 0.521148681640625, 0.5780792236328125, 0.635009765625, 0.6919403076171875, 0.748870849609375, 0.8058013916015625, 0.86273193359375, 0.9196624755859375, 0.976593017578125, 1.0335235595703125, 1.0904541015625, 1.1473846435546875, 1.204315185546875, 1.2612457275390625, 1.31817626953125, 1.3751068115234375, 1.432037353515625, 1.4889678955078125, 1.5458984375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 12.0, 13.0, 24.0, 27.0, 31.0, 45.0, 77.0, 124.0, 185.0, 323.0, 544.0, 970.0, 1852.0, 3608.0, 7954.0, 19946.0, 66148.0, 439576.0, 2722782.0, 788509.0, 95233.0, 27063.0, 10002.0, 4473.0, 2143.0, 1136.0, 640.0, 314.0, 196.0, 112.0, 76.0, 45.0, 30.0, 21.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.18359375, -4.08306884765625, -3.9825439453125, -3.88201904296875, -3.781494140625, -3.68096923828125, -3.5804443359375, -3.47991943359375, -3.37939453125, -3.27886962890625, -3.1783447265625, -3.07781982421875, -2.977294921875, -2.87677001953125, -2.7762451171875, -2.67572021484375, -2.5751953125, -2.47467041015625, -2.3741455078125, -2.27362060546875, -2.173095703125, -2.07257080078125, -1.9720458984375, -1.87152099609375, -1.77099609375, -1.67047119140625, -1.5699462890625, -1.46942138671875, -1.368896484375, -1.26837158203125, -1.1678466796875, -1.06732177734375, -0.966796875, -0.86627197265625, -0.7657470703125, -0.66522216796875, -0.564697265625, -0.46417236328125, -0.3636474609375, -0.26312255859375, -0.16259765625, -0.06207275390625, 0.0384521484375, 0.13897705078125, 0.239501953125, 0.34002685546875, 0.4405517578125, 0.54107666015625, 0.6416015625, 0.74212646484375, 0.8426513671875, 0.94317626953125, 1.043701171875, 1.14422607421875, 1.2447509765625, 1.34527587890625, 1.44580078125, 1.54632568359375, 1.6468505859375, 1.74737548828125, 1.847900390625, 1.94842529296875, 2.0489501953125, 2.14947509765625, 2.25]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 11.0, 14.0, 16.0, 18.0, 28.0, 40.0, 54.0, 80.0, 94.0, 176.0, 208.0, 309.0, 459.0, 555.0, 584.0, 428.0, 253.0, 209.0, 140.0, 102.0, 68.0, 53.0, 42.0, 34.0, 16.0, 12.0, 12.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.595001220703125, -2.49859619140625, -2.402191162109375, -2.3057861328125, -2.209381103515625, -2.11297607421875, -2.016571044921875, -1.920166015625, -1.823760986328125, -1.72735595703125, -1.630950927734375, -1.5345458984375, -1.438140869140625, -1.34173583984375, -1.245330810546875, -1.14892578125, -1.052520751953125, -0.95611572265625, -0.859710693359375, -0.7633056640625, -0.666900634765625, -0.57049560546875, -0.474090576171875, -0.377685546875, -0.281280517578125, -0.18487548828125, -0.088470458984375, 0.0079345703125, 0.104339599609375, 0.20074462890625, 0.297149658203125, 0.3935546875, 0.489959716796875, 0.58636474609375, 0.682769775390625, 0.7791748046875, 0.875579833984375, 0.97198486328125, 1.068389892578125, 1.164794921875, 1.261199951171875, 1.35760498046875, 1.454010009765625, 1.5504150390625, 1.646820068359375, 1.74322509765625, 1.839630126953125, 1.93603515625, 2.032440185546875, 2.12884521484375, 2.225250244140625, 2.3216552734375, 2.418060302734375, 2.51446533203125, 2.610870361328125, 2.707275390625, 2.803680419921875, 2.90008544921875, 2.996490478515625, 3.0928955078125, 3.189300537109375, 3.28570556640625, 3.382110595703125, 3.478515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 4.0, 12.0, 20.0, 31.0, 57.0, 74.0, 118.0, 236.0, 452.0, 985.0, 2209.0, 5658.0, 16059.0, 53341.0, 270262.0, 2631415.0, 1041641.0, 123812.0, 30978.0, 10156.0, 3672.0, 1549.0, 754.0, 330.0, 187.0, 96.0, 48.0, 35.0, 22.0, 13.0, 12.0, 3.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.67578125, -5.521484375, -5.3671875, -5.212890625, -5.05859375, -4.904296875, -4.75, -4.595703125, -4.44140625, -4.287109375, -4.1328125, -3.978515625, -3.82421875, -3.669921875, -3.515625, -3.361328125, -3.20703125, -3.052734375, -2.8984375, -2.744140625, -2.58984375, -2.435546875, -2.28125, -2.126953125, -1.97265625, -1.818359375, -1.6640625, -1.509765625, -1.35546875, -1.201171875, -1.046875, -0.892578125, -0.73828125, -0.583984375, -0.4296875, -0.275390625, -0.12109375, 0.033203125, 0.1875, 0.341796875, 0.49609375, 0.650390625, 0.8046875, 0.958984375, 1.11328125, 1.267578125, 1.421875, 1.576171875, 1.73046875, 1.884765625, 2.0390625, 2.193359375, 2.34765625, 2.501953125, 2.65625, 2.810546875, 2.96484375, 3.119140625, 3.2734375, 3.427734375, 3.58203125, 3.736328125, 3.890625, 4.044921875, 4.19921875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 7.0, 3.0, 7.0, 19.0, 19.0, 21.0, 37.0, 44.0, 46.0, 62.0, 83.0, 83.0, 89.0, 92.0, 55.0, 76.0, 60.0, 56.0, 32.0, 30.0, 21.0, 14.0, 16.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.79543685913086, -9.430390357971191, -9.065343856811523, -8.700298309326172, -8.335251808166504, -7.970205307006836, -7.605158805847168, -7.2401123046875, -6.87506628036499, -6.510019779205322, -6.1449737548828125, -5.7799272537231445, -5.414880752563477, -5.049834728240967, -4.684788227081299, -4.319742202758789, -3.954695701599121, -3.5896494388580322, -3.2246031761169434, -2.8595566749572754, -2.4945104122161865, -2.1294641494750977, -1.7644176483154297, -1.3993713855743408, -1.034325122833252, -0.6692788004875183, -0.30423247814178467, 0.06081390380859375, 0.4258601665496826, 0.7909064292907715, 1.1559529304504395, 1.5209991931915283, 1.8860445022583008, 2.2510907649993896, 2.6161370277404785, 2.9811835289001465, 3.3462297916412354, 3.711276054382324, 4.076322555541992, 4.44136905670166, 4.80641508102417, 5.171461582183838, 5.536507606506348, 5.901554107666016, 6.266600608825684, 6.631646633148193, 6.996693134307861, 7.361739158630371, 7.726785659790039, 8.091832160949707, 8.456878662109375, 8.821924209594727, 9.186970710754395, 9.552017211914062, 9.91706371307373, 10.282110214233398, 10.64715576171875, 11.012202262878418, 11.377248764038086, 11.742294311523438, 12.107340812683105, 12.472387313842773, 12.837433815002441, 13.20248031616211, 13.567526817321777]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 5.0, 12.0, 14.0, 24.0, 19.0, 21.0, 24.0, 25.0, 24.0, 27.0, 33.0, 31.0, 38.0, 22.0, 47.0, 42.0, 43.0, 33.0, 37.0, 39.0, 40.0, 34.0, 45.0, 28.0, 35.0, 38.0, 34.0, 29.0, 15.0, 19.0, 18.0, 12.0, 18.0, 18.0, 6.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.779570579528809, -8.490565299987793, -8.201559066772461, -7.912553787231445, -7.62354850769043, -7.334542751312256, -7.045536994934082, -6.756531715393066, -6.467525959014893, -6.178520202636719, -5.889514923095703, -5.600509166717529, -5.3115034103393555, -5.02249813079834, -4.733492374420166, -4.444486618041992, -4.155481338500977, -3.866475820541382, -3.577470302581787, -3.2884645462036133, -2.9994590282440186, -2.710453510284424, -2.42144775390625, -2.1324422359466553, -1.8434367179870605, -1.5544312000274658, -1.2654255628585815, -0.976419985294342, -0.6874144077301025, -0.3984088897705078, -0.10940325260162354, 0.17960238456726074, 0.46860694885253906, 0.7576125264167786, 1.046618103981018, 1.3356237411499023, 1.624629259109497, 1.9136347770690918, 2.2026405334472656, 2.4916460514068604, 2.780651569366455, 3.06965708732605, 3.3586626052856445, 3.6476683616638184, 3.936673879623413, 4.225679397583008, 4.514685153961182, 4.8036909103393555, 5.092696189880371, 5.381701946258545, 5.6707072257995605, 5.959712982177734, 6.24871826171875, 6.537724018096924, 6.826729774475098, 7.115735054016113, 7.404740810394287, 7.693746566772461, 7.982751846313477, 8.271757125854492, 8.560763359069824, 8.84976863861084, 9.138773918151855, 9.427780151367188, 9.716785430908203]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 16.0, 14.0, 19.0, 27.0, 28.0, 46.0, 47.0, 49.0, 59.0, 68.0, 58.0, 71.0, 66.0, 66.0, 61.0, 52.0, 52.0, 40.0, 31.0, 31.0, 32.0, 16.0, 11.0, 7.0, 11.0, 8.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.6070556640625, -2.546142578125, -2.4852294921875, -2.42431640625, -2.3634033203125, -2.302490234375, -2.2415771484375, -2.1806640625, -2.1197509765625, -2.058837890625, -1.9979248046875, -1.93701171875, -1.8760986328125, -1.815185546875, -1.7542724609375, -1.693359375, -1.6324462890625, -1.571533203125, -1.5106201171875, -1.44970703125, -1.3887939453125, -1.327880859375, -1.2669677734375, -1.2060546875, -1.1451416015625, -1.084228515625, -1.0233154296875, -0.96240234375, -0.9014892578125, -0.840576171875, -0.7796630859375, -0.71875, -0.6578369140625, -0.596923828125, -0.5360107421875, -0.47509765625, -0.4141845703125, -0.353271484375, -0.2923583984375, -0.2314453125, -0.1705322265625, -0.109619140625, -0.0487060546875, 0.01220703125, 0.0731201171875, 0.134033203125, 0.1949462890625, 0.255859375, 0.3167724609375, 0.377685546875, 0.4385986328125, 0.49951171875, 0.5604248046875, 0.621337890625, 0.6822509765625, 0.7431640625, 0.8040771484375, 0.864990234375, 0.9259033203125, 0.98681640625, 1.0477294921875, 1.108642578125, 1.1695556640625, 1.23046875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 3.0, 3.0, 9.0, 10.0, 31.0, 19.0, 26.0, 52.0, 90.0, 149.0, 293.0, 500.0, 917.0, 1769.0, 3591.0, 7182.0, 14368.0, 28092.0, 53690.0, 98080.0, 156681.0, 202403.0, 188521.0, 131079.0, 77468.0, 40825.0, 21101.0, 10578.0, 5326.0, 2665.0, 1393.0, 719.0, 392.0, 184.0, 126.0, 77.0, 44.0, 20.0, 26.0, 15.0, 9.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.1015625, -1.0669097900390625, -1.032257080078125, -0.9976043701171875, -0.96295166015625, -0.9282989501953125, -0.893646240234375, -0.8589935302734375, -0.8243408203125, -0.7896881103515625, -0.755035400390625, -0.7203826904296875, -0.68572998046875, -0.6510772705078125, -0.616424560546875, -0.5817718505859375, -0.547119140625, -0.5124664306640625, -0.477813720703125, -0.4431610107421875, -0.40850830078125, -0.3738555908203125, -0.339202880859375, -0.3045501708984375, -0.2698974609375, -0.2352447509765625, -0.200592041015625, -0.1659393310546875, -0.13128662109375, -0.0966339111328125, -0.061981201171875, -0.0273284912109375, 0.00732421875, 0.0419769287109375, 0.076629638671875, 0.1112823486328125, 0.14593505859375, 0.1805877685546875, 0.215240478515625, 0.2498931884765625, 0.2845458984375, 0.3191986083984375, 0.353851318359375, 0.3885040283203125, 0.42315673828125, 0.4578094482421875, 0.492462158203125, 0.5271148681640625, 0.561767578125, 0.5964202880859375, 0.631072998046875, 0.6657257080078125, 0.70037841796875, 0.7350311279296875, 0.769683837890625, 0.8043365478515625, 0.8389892578125, 0.8736419677734375, 0.908294677734375, 0.9429473876953125, 0.97760009765625, 1.0122528076171875, 1.046905517578125, 1.0815582275390625, 1.1162109375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 5.0, 11.0, 3.0, 6.0, 12.0, 12.0, 11.0, 12.0, 21.0, 21.0, 16.0, 19.0, 34.0, 23.0, 23.0, 28.0, 31.0, 28.0, 29.0, 32.0, 39.0, 38.0, 31.0, 1057.0, 25.0, 38.0, 42.0, 32.0, 38.0, 35.0, 27.0, 22.0, 31.0, 26.0, 24.0, 12.0, 19.0, 12.0, 22.0, 6.0, 14.0, 16.0, 5.0, 8.0, 15.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93310546875, -0.9011154174804688, -0.8691253662109375, -0.8371353149414062, -0.805145263671875, -0.7731552124023438, -0.7411651611328125, -0.7091751098632812, -0.67718505859375, -0.6451950073242188, -0.6132049560546875, -0.5812149047851562, -0.549224853515625, -0.5172348022460938, -0.4852447509765625, -0.45325469970703125, -0.4212646484375, -0.38927459716796875, -0.3572845458984375, -0.32529449462890625, -0.293304443359375, -0.26131439208984375, -0.2293243408203125, -0.19733428955078125, -0.16534423828125, -0.13335418701171875, -0.1013641357421875, -0.06937408447265625, -0.037384033203125, -0.00539398193359375, 0.0265960693359375, 0.05858612060546875, 0.090576171875, 0.12256622314453125, 0.1545562744140625, 0.18654632568359375, 0.218536376953125, 0.25052642822265625, 0.2825164794921875, 0.31450653076171875, 0.34649658203125, 0.37848663330078125, 0.4104766845703125, 0.44246673583984375, 0.474456787109375, 0.5064468383789062, 0.5384368896484375, 0.5704269409179688, 0.6024169921875, 0.6344070434570312, 0.6663970947265625, 0.6983871459960938, 0.730377197265625, 0.7623672485351562, 0.7943572998046875, 0.8263473510742188, 0.85833740234375, 0.8903274536132812, 0.9223175048828125, 0.9543075561523438, 0.986297607421875, 1.0182876586914062, 1.0502777099609375, 1.0822677612304688, 1.1142578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 11.0, 6.0, 25.0, 23.0, 55.0, 68.0, 106.0, 166.0, 271.0, 403.0, 576.0, 838.0, 1332.0, 1825.0, 2898.0, 4384.0, 6490.0, 10504.0, 16617.0, 30937.0, 86697.0, 958819.0, 814710.0, 83083.0, 30116.0, 16661.0, 10082.0, 6632.0, 4292.0, 2895.0, 1859.0, 1265.0, 855.0, 578.0, 362.0, 224.0, 149.0, 101.0, 72.0, 46.0, 29.0, 25.0, 20.0, 14.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.0018463134765625, -0.969512939453125, -0.9371795654296875, -0.90484619140625, -0.8725128173828125, -0.840179443359375, -0.8078460693359375, -0.7755126953125, -0.7431793212890625, -0.710845947265625, -0.6785125732421875, -0.64617919921875, -0.6138458251953125, -0.581512451171875, -0.5491790771484375, -0.516845703125, -0.4845123291015625, -0.452178955078125, -0.4198455810546875, -0.38751220703125, -0.3551788330078125, -0.322845458984375, -0.2905120849609375, -0.2581787109375, -0.2258453369140625, -0.193511962890625, -0.1611785888671875, -0.12884521484375, -0.0965118408203125, -0.064178466796875, -0.0318450927734375, 0.00048828125, 0.0328216552734375, 0.065155029296875, 0.0974884033203125, 0.12982177734375, 0.1621551513671875, 0.194488525390625, 0.2268218994140625, 0.2591552734375, 0.2914886474609375, 0.323822021484375, 0.3561553955078125, 0.38848876953125, 0.4208221435546875, 0.453155517578125, 0.4854888916015625, 0.517822265625, 0.5501556396484375, 0.582489013671875, 0.6148223876953125, 0.64715576171875, 0.6794891357421875, 0.711822509765625, 0.7441558837890625, 0.7764892578125, 0.8088226318359375, 0.841156005859375, 0.8734893798828125, 0.90582275390625, 0.9381561279296875, 0.970489501953125, 1.0028228759765625, 1.03515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 11.0, 10.0, 15.0, 16.0, 26.0, 29.0, 40.0, 42.0, 58.0, 79.0, 68.0, 93.0, 76.0, 100.0, 59.0, 46.0, 35.0, 24.0, 23.0, 17.0, 14.0, 18.0, 10.0, 8.0, 12.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1748046875, -0.16961288452148438, -0.16442108154296875, -0.15922927856445312, -0.1540374755859375, -0.14884567260742188, -0.14365386962890625, -0.13846206665039062, -0.133270263671875, -0.12807846069335938, -0.12288665771484375, -0.11769485473632812, -0.1125030517578125, -0.10731124877929688, -0.10211944580078125, -0.09692764282226562, -0.09173583984375, -0.08654403686523438, -0.08135223388671875, -0.07616043090820312, -0.0709686279296875, -0.06577682495117188, -0.06058502197265625, -0.055393218994140625, -0.050201416015625, -0.045009613037109375, -0.03981781005859375, -0.034626007080078125, -0.0294342041015625, -0.024242401123046875, -0.01905059814453125, -0.013858795166015625, -0.0086669921875, -0.003475189208984375, 0.00171661376953125, 0.006908416748046875, 0.0121002197265625, 0.017292022705078125, 0.02248382568359375, 0.027675628662109375, 0.032867431640625, 0.038059234619140625, 0.04325103759765625, 0.048442840576171875, 0.0536346435546875, 0.058826446533203125, 0.06401824951171875, 0.06921005249023438, 0.07440185546875, 0.07959365844726562, 0.08478546142578125, 0.08997726440429688, 0.0951690673828125, 0.10036087036132812, 0.10555267333984375, 0.11074447631835938, 0.115936279296875, 0.12112808227539062, 0.12631988525390625, 0.13151168823242188, 0.1367034912109375, 0.14189529418945312, 0.14708709716796875, 0.15227890014648438, 0.157470703125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 0.0, 8.0, 13.0, 14.0, 11.0, 25.0, 35.0, 33.0, 40.0, 88.0, 180.0, 448.0, 1640.0, 7888.0, 71737.0, 902857.0, 54519.0, 6687.0, 1460.0, 410.0, 159.0, 81.0, 56.0, 30.0, 33.0, 15.0, 16.0, 12.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.40234375, -2.323455810546875, -2.24456787109375, -2.165679931640625, -2.0867919921875, -2.007904052734375, -1.92901611328125, -1.850128173828125, -1.771240234375, -1.692352294921875, -1.61346435546875, -1.534576416015625, -1.4556884765625, -1.376800537109375, -1.29791259765625, -1.219024658203125, -1.14013671875, -1.061248779296875, -0.98236083984375, -0.903472900390625, -0.8245849609375, -0.745697021484375, -0.66680908203125, -0.587921142578125, -0.509033203125, -0.430145263671875, -0.35125732421875, -0.272369384765625, -0.1934814453125, -0.114593505859375, -0.03570556640625, 0.043182373046875, 0.1220703125, 0.200958251953125, 0.27984619140625, 0.358734130859375, 0.4376220703125, 0.516510009765625, 0.59539794921875, 0.674285888671875, 0.753173828125, 0.832061767578125, 0.91094970703125, 0.989837646484375, 1.0687255859375, 1.147613525390625, 1.22650146484375, 1.305389404296875, 1.38427734375, 1.463165283203125, 1.54205322265625, 1.620941162109375, 1.6998291015625, 1.778717041015625, 1.85760498046875, 1.936492919921875, 2.015380859375, 2.094268798828125, 2.17315673828125, 2.252044677734375, 2.3309326171875, 2.409820556640625, 2.48870849609375, 2.567596435546875, 2.646484375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 14.0, 12.0, 19.0, 31.0, 33.0, 45.0, 49.0, 77.0, 139.0, 164.0, 113.0, 84.0, 59.0, 39.0, 23.0, 24.0, 13.0, 12.0, 9.0, 4.0, 5.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3291393518447876, -1.2866466045379639, -1.2441538572311401, -1.2016611099243164, -1.1591684818267822, -1.1166757345199585, -1.0741829872131348, -1.031690239906311, -0.9891974925994873, -0.9467047452926636, -0.9042119979858398, -0.8617193102836609, -0.8192265629768372, -0.7767338156700134, -0.7342411279678345, -0.6917483806610107, -0.649255633354187, -0.6067628860473633, -0.5642701387405396, -0.5217774510383606, -0.47928470373153687, -0.43679195642471313, -0.3942992389202118, -0.35180652141571045, -0.3093137741088867, -0.266821026802063, -0.22432830929756165, -0.1818355768918991, -0.13934284448623657, -0.09685011208057404, -0.0543573796749115, -0.011864662170410156, 0.030628204345703125, 0.07312093675136566, 0.1156136691570282, 0.15810640156269073, 0.20059913396835327, 0.2430918663740158, 0.28558459877967834, 0.3280773162841797, 0.3705700635910034, 0.41306281089782715, 0.4555555284023285, 0.49804824590682983, 0.5405409932136536, 0.5830337405204773, 0.6255264282226562, 0.66801917552948, 0.7105119228363037, 0.7530046701431274, 0.7954974174499512, 0.8379901051521301, 0.8804828524589539, 0.9229755997657776, 0.9654682874679565, 1.0079610347747803, 1.050453782081604, 1.0929465293884277, 1.1354392766952515, 1.1779320240020752, 1.2204246520996094, 1.262917399406433, 1.3054101467132568, 1.3479028940200806, 1.3903956413269043]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 13.0, 13.0, 17.0, 21.0, 14.0, 34.0, 33.0, 44.0, 52.0, 41.0, 49.0, 55.0, 54.0, 48.0, 54.0, 48.0, 63.0, 66.0, 47.0, 33.0, 29.0, 34.0, 33.0, 22.0, 14.0, 13.0, 15.0, 11.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.3303589820861816, -1.2977761030197144, -1.265193223953247, -1.2326103448867798, -1.2000274658203125, -1.1674445867538452, -1.134861707687378, -1.102278709411621, -1.0696959495544434, -1.037113070487976, -1.0045301914215088, -0.9719473123550415, -0.9393644332885742, -0.9067815542221069, -0.8741986155509949, -0.8416157364845276, -0.8090327978134155, -0.7764499187469482, -0.743867039680481, -0.7112841606140137, -0.6787012815475464, -0.6461184024810791, -0.613535463809967, -0.5809525847434998, -0.5483697056770325, -0.5157868266105652, -0.4832039475440979, -0.4506210386753082, -0.41803815960884094, -0.38545528054237366, -0.352872371673584, -0.3202894926071167, -0.28770655393600464, -0.25512367486953735, -0.22254078090190887, -0.1899578869342804, -0.1573750078678131, -0.12479212880134583, -0.09220923483371735, -0.05962634086608887, -0.027043461799621582, 0.0055394247174263, 0.03812231123447418, 0.07070519775152206, 0.10328808426856995, 0.13587096333503723, 0.1684538573026657, 0.2010367512702942, 0.23361963033676147, 0.26620250940322876, 0.29878538846969604, 0.3313682973384857, 0.363951176404953, 0.3965340554714203, 0.42911696434020996, 0.46169984340667725, 0.49428272247314453, 0.5268656015396118, 0.5594484806060791, 0.5920313596725464, 0.6246142387390137, 0.657197117805481, 0.689780056476593, 0.7223629355430603, 0.7549458146095276]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 10.0, 11.0, 16.0, 15.0, 24.0, 35.0, 39.0, 38.0, 52.0, 63.0, 64.0, 83.0, 79.0, 59.0, 74.0, 57.0, 60.0, 46.0, 34.0, 41.0, 24.0, 26.0, 19.0, 8.0, 8.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.557098388671875, -2.49114990234375, -2.425201416015625, -2.3592529296875, -2.293304443359375, -2.22735595703125, -2.161407470703125, -2.095458984375, -2.029510498046875, -1.96356201171875, -1.897613525390625, -1.8316650390625, -1.765716552734375, -1.69976806640625, -1.633819580078125, -1.56787109375, -1.501922607421875, -1.43597412109375, -1.370025634765625, -1.3040771484375, -1.238128662109375, -1.17218017578125, -1.106231689453125, -1.040283203125, -0.974334716796875, -0.90838623046875, -0.842437744140625, -0.7764892578125, -0.710540771484375, -0.64459228515625, -0.578643798828125, -0.5126953125, -0.446746826171875, -0.38079833984375, -0.314849853515625, -0.2489013671875, -0.182952880859375, -0.11700439453125, -0.051055908203125, 0.014892578125, 0.080841064453125, 0.14678955078125, 0.212738037109375, 0.2786865234375, 0.344635009765625, 0.41058349609375, 0.476531982421875, 0.54248046875, 0.608428955078125, 0.67437744140625, 0.740325927734375, 0.8062744140625, 0.872222900390625, 0.93817138671875, 1.004119873046875, 1.070068359375, 1.136016845703125, 1.20196533203125, 1.267913818359375, 1.3338623046875, 1.399810791015625, 1.46575927734375, 1.531707763671875, 1.59765625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 24.0, 44.0, 83.0, 153.0, 302.0, 586.0, 1324.0, 2991.0, 7953.0, 25307.0, 93628.0, 430188.0, 370591.0, 80893.0, 22081.0, 7154.0, 2769.0, 1295.0, 565.0, 290.0, 142.0, 69.0, 36.0, 23.0, 9.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.424652099609375, -3.29266357421875, -3.160675048828125, -3.0286865234375, -2.896697998046875, -2.76470947265625, -2.632720947265625, -2.500732421875, -2.368743896484375, -2.23675537109375, -2.104766845703125, -1.9727783203125, -1.840789794921875, -1.70880126953125, -1.576812744140625, -1.44482421875, -1.312835693359375, -1.18084716796875, -1.048858642578125, -0.9168701171875, -0.784881591796875, -0.65289306640625, -0.520904541015625, -0.388916015625, -0.256927490234375, -0.12493896484375, 0.007049560546875, 0.1390380859375, 0.271026611328125, 0.40301513671875, 0.535003662109375, 0.6669921875, 0.798980712890625, 0.93096923828125, 1.062957763671875, 1.1949462890625, 1.326934814453125, 1.45892333984375, 1.590911865234375, 1.722900390625, 1.854888916015625, 1.98687744140625, 2.118865966796875, 2.2508544921875, 2.382843017578125, 2.51483154296875, 2.646820068359375, 2.77880859375, 2.910797119140625, 3.04278564453125, 3.174774169921875, 3.3067626953125, 3.438751220703125, 3.57073974609375, 3.702728271484375, 3.834716796875, 3.966705322265625, 4.09869384765625, 4.230682373046875, 4.3626708984375, 4.494659423828125, 4.62664794921875, 4.758636474609375, 4.890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 7.0, 14.0, 17.0, 17.0, 23.0, 26.0, 31.0, 39.0, 40.0, 59.0, 52.0, 96.0, 134.0, 199.0, 1308.0, 256.0, 166.0, 111.0, 78.0, 64.0, 48.0, 43.0, 34.0, 33.0, 22.0, 17.0, 19.0, 21.0, 16.0, 4.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.58837890625, -4.4345703125, -4.28076171875, -4.126953125, -3.97314453125, -3.8193359375, -3.66552734375, -3.51171875, -3.35791015625, -3.2041015625, -3.05029296875, -2.896484375, -2.74267578125, -2.5888671875, -2.43505859375, -2.28125, -2.12744140625, -1.9736328125, -1.81982421875, -1.666015625, -1.51220703125, -1.3583984375, -1.20458984375, -1.05078125, -0.89697265625, -0.7431640625, -0.58935546875, -0.435546875, -0.28173828125, -0.1279296875, 0.02587890625, 0.1796875, 0.33349609375, 0.4873046875, 0.64111328125, 0.794921875, 0.94873046875, 1.1025390625, 1.25634765625, 1.41015625, 1.56396484375, 1.7177734375, 1.87158203125, 2.025390625, 2.17919921875, 2.3330078125, 2.48681640625, 2.640625, 2.79443359375, 2.9482421875, 3.10205078125, 3.255859375, 3.40966796875, 3.5634765625, 3.71728515625, 3.87109375, 4.02490234375, 4.1787109375, 4.33251953125, 4.486328125, 4.64013671875, 4.7939453125, 4.94775390625, 5.1015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 4.0, 14.0, 18.0, 12.0, 16.0, 24.0, 35.0, 34.0, 54.0, 74.0, 99.0, 127.0, 230.0, 360.0, 670.0, 1558.0, 4066.0, 16232.0, 114621.0, 2133656.0, 803997.0, 54300.0, 9905.0, 2945.0, 1176.0, 540.0, 282.0, 162.0, 126.0, 73.0, 74.0, 44.0, 31.0, 26.0, 26.0, 23.0, 12.0, 12.0, 4.0, 7.0, 5.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.48046875, -7.2454833984375, -7.010498046875, -6.7755126953125, -6.54052734375, -6.3055419921875, -6.070556640625, -5.8355712890625, -5.6005859375, -5.3656005859375, -5.130615234375, -4.8956298828125, -4.66064453125, -4.4256591796875, -4.190673828125, -3.9556884765625, -3.720703125, -3.4857177734375, -3.250732421875, -3.0157470703125, -2.78076171875, -2.5457763671875, -2.310791015625, -2.0758056640625, -1.8408203125, -1.6058349609375, -1.370849609375, -1.1358642578125, -0.90087890625, -0.6658935546875, -0.430908203125, -0.1959228515625, 0.0390625, 0.2740478515625, 0.509033203125, 0.7440185546875, 0.97900390625, 1.2139892578125, 1.448974609375, 1.6839599609375, 1.9189453125, 2.1539306640625, 2.388916015625, 2.6239013671875, 2.85888671875, 3.0938720703125, 3.328857421875, 3.5638427734375, 3.798828125, 4.0338134765625, 4.268798828125, 4.5037841796875, 4.73876953125, 4.9737548828125, 5.208740234375, 5.4437255859375, 5.6787109375, 5.9136962890625, 6.148681640625, 6.3836669921875, 6.61865234375, 6.8536376953125, 7.088623046875, 7.3236083984375, 7.55859375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 9.0, 44.0, 201.0, 371.0, 297.0, 80.0, 12.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.52214813232422, -59.07243347167969, -57.622718811035156, -56.173004150390625, -54.723289489746094, -53.27357482910156, -51.82386016845703, -50.3741455078125, -48.92443084716797, -47.47471618652344, -46.025001525878906, -44.575286865234375, -43.125572204589844, -41.67585754394531, -40.22614288330078, -38.77642822265625, -37.326717376708984, -35.87700271606445, -34.42728805541992, -32.97757339477539, -31.52785873413086, -30.078144073486328, -28.62843132019043, -27.1787166595459, -25.729001998901367, -24.279287338256836, -22.829572677612305, -21.379859924316406, -19.930145263671875, -18.480430603027344, -17.030715942382812, -15.581001281738281, -14.13128662109375, -12.681571960449219, -11.231857299804688, -9.782143592834473, -8.332428932189941, -6.88271427154541, -5.433000564575195, -3.983285903930664, -2.533571243286133, -1.0838568210601807, 0.3658576011657715, 1.8155717849731445, 3.265286445617676, 4.715001106262207, 6.164714813232422, 7.614429473876953, 9.064144134521484, 10.513858795166016, 11.963573455810547, 13.413287162780762, 14.863001823425293, 16.31271743774414, 17.76243019104004, 19.21214485168457, 20.6618595123291, 22.111574172973633, 23.561288833618164, 25.011001586914062, 26.460716247558594, 27.910430908203125, 29.360145568847656, 30.809860229492188, 32.25957489013672]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 1.0, 12.0, 11.0, 10.0, 12.0, 16.0, 27.0, 27.0, 24.0, 18.0, 25.0, 31.0, 28.0, 29.0, 42.0, 42.0, 52.0, 45.0, 44.0, 44.0, 35.0, 41.0, 48.0, 34.0, 32.0, 33.0, 28.0, 19.0, 24.0, 28.0, 20.0, 19.0, 13.0, 21.0, 5.0, 16.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-13.023686408996582, -12.636239051818848, -12.248790740966797, -11.861343383789062, -11.473895072937012, -11.086447715759277, -10.698999404907227, -10.311552047729492, -9.924104690551758, -9.536657333374023, -9.149209022521973, -8.761761665344238, -8.374313354492188, -7.986865997314453, -7.5994181632995605, -7.211970329284668, -6.824522018432617, -6.437074184417725, -6.049626350402832, -5.662178993225098, -5.274730682373047, -4.8872833251953125, -4.49983549118042, -4.112387657165527, -3.7249398231506348, -3.337491989135742, -2.9500441551208496, -2.562596559524536, -2.1751487255096436, -1.787700891494751, -1.4002532958984375, -1.012805461883545, -0.6253576278686523, -0.23790985345840454, 0.14953792095184326, 0.5369856357574463, 0.9244334697723389, 1.3118813037872314, 1.699328899383545, 2.0867767333984375, 2.47422456741333, 2.8616724014282227, 3.2491202354431152, 3.6365678310394287, 4.024015426635742, 4.411463737487793, 4.798911094665527, 5.18635892868042, 5.5738067626953125, 5.961254596710205, 6.348702430725098, 6.736149787902832, 7.123598098754883, 7.511045455932617, 7.89849328994751, 8.285941123962402, 8.673389434814453, 9.060836791992188, 9.448285102844238, 9.835732460021973, 10.223180770874023, 10.610628128051758, 10.998075485229492, 11.385523796081543, 11.772971153259277]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 7.0, 8.0, 10.0, 18.0, 13.0, 14.0, 17.0, 27.0, 33.0, 35.0, 20.0, 37.0, 39.0, 48.0, 36.0, 51.0, 61.0, 39.0, 48.0, 40.0, 40.0, 49.0, 36.0, 40.0, 30.0, 24.0, 24.0, 20.0, 16.0, 17.0, 14.0, 20.0, 7.0, 12.0, 3.0, 6.0, 8.0, 8.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4677734375, -1.4225311279296875, -1.377288818359375, -1.3320465087890625, -1.28680419921875, -1.2415618896484375, -1.196319580078125, -1.1510772705078125, -1.1058349609375, -1.0605926513671875, -1.015350341796875, -0.9701080322265625, -0.92486572265625, -0.8796234130859375, -0.834381103515625, -0.7891387939453125, -0.743896484375, -0.6986541748046875, -0.653411865234375, -0.6081695556640625, -0.56292724609375, -0.5176849365234375, -0.472442626953125, -0.4272003173828125, -0.3819580078125, -0.3367156982421875, -0.291473388671875, -0.2462310791015625, -0.20098876953125, -0.1557464599609375, -0.110504150390625, -0.0652618408203125, -0.02001953125, 0.0252227783203125, 0.070465087890625, 0.1157073974609375, 0.16094970703125, 0.2061920166015625, 0.251434326171875, 0.2966766357421875, 0.3419189453125, 0.3871612548828125, 0.432403564453125, 0.4776458740234375, 0.52288818359375, 0.5681304931640625, 0.613372802734375, 0.6586151123046875, 0.703857421875, 0.7490997314453125, 0.794342041015625, 0.8395843505859375, 0.88482666015625, 0.9300689697265625, 0.975311279296875, 1.0205535888671875, 1.0657958984375, 1.1110382080078125, 1.156280517578125, 1.2015228271484375, 1.24676513671875, 1.2920074462890625, 1.337249755859375, 1.3824920654296875, 1.427734375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 10.0, 9.0, 13.0, 7.0, 9.0, 30.0, 40.0, 66.0, 91.0, 98.0, 165.0, 267.0, 507.0, 1008.0, 1998.0, 4322.0, 11191.0, 37678.0, 281296.0, 2876667.0, 876481.0, 71756.0, 17831.0, 6505.0, 2851.0, 1502.0, 762.0, 414.0, 244.0, 125.0, 95.0, 73.0, 47.0, 31.0, 21.0, 18.0, 8.0, 9.0, 5.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.65325927734375, -3.5213623046875, -3.38946533203125, -3.257568359375, -3.12567138671875, -2.9937744140625, -2.86187744140625, -2.72998046875, -2.59808349609375, -2.4661865234375, -2.33428955078125, -2.202392578125, -2.07049560546875, -1.9385986328125, -1.80670166015625, -1.6748046875, -1.54290771484375, -1.4110107421875, -1.27911376953125, -1.147216796875, -1.01531982421875, -0.8834228515625, -0.75152587890625, -0.61962890625, -0.48773193359375, -0.3558349609375, -0.22393798828125, -0.092041015625, 0.03985595703125, 0.1717529296875, 0.30364990234375, 0.435546875, 0.56744384765625, 0.6993408203125, 0.83123779296875, 0.963134765625, 1.09503173828125, 1.2269287109375, 1.35882568359375, 1.49072265625, 1.62261962890625, 1.7545166015625, 1.88641357421875, 2.018310546875, 2.15020751953125, 2.2821044921875, 2.41400146484375, 2.5458984375, 2.67779541015625, 2.8096923828125, 2.94158935546875, 3.073486328125, 3.20538330078125, 3.3372802734375, 3.46917724609375, 3.60107421875, 3.73297119140625, 3.8648681640625, 3.99676513671875, 4.128662109375, 4.26055908203125, 4.3924560546875, 4.52435302734375, 4.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 9.0, 8.0, 9.0, 13.0, 17.0, 29.0, 37.0, 48.0, 70.0, 105.0, 165.0, 196.0, 325.0, 442.0, 554.0, 556.0, 450.0, 325.0, 207.0, 111.0, 90.0, 84.0, 67.0, 29.0, 26.0, 20.0, 20.0, 14.0, 7.0, 8.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.611328125, -3.51104736328125, -3.4107666015625, -3.31048583984375, -3.210205078125, -3.10992431640625, -3.0096435546875, -2.90936279296875, -2.80908203125, -2.70880126953125, -2.6085205078125, -2.50823974609375, -2.407958984375, -2.30767822265625, -2.2073974609375, -2.10711669921875, -2.0068359375, -1.90655517578125, -1.8062744140625, -1.70599365234375, -1.605712890625, -1.50543212890625, -1.4051513671875, -1.30487060546875, -1.20458984375, -1.10430908203125, -1.0040283203125, -0.90374755859375, -0.803466796875, -0.70318603515625, -0.6029052734375, -0.50262451171875, -0.40234375, -0.30206298828125, -0.2017822265625, -0.10150146484375, -0.001220703125, 0.09906005859375, 0.1993408203125, 0.29962158203125, 0.39990234375, 0.50018310546875, 0.6004638671875, 0.70074462890625, 0.801025390625, 0.90130615234375, 1.0015869140625, 1.10186767578125, 1.2021484375, 1.30242919921875, 1.4027099609375, 1.50299072265625, 1.603271484375, 1.70355224609375, 1.8038330078125, 1.90411376953125, 2.00439453125, 2.10467529296875, 2.2049560546875, 2.30523681640625, 2.405517578125, 2.50579833984375, 2.6060791015625, 2.70635986328125, 2.806640625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 17.0, 19.0, 31.0, 35.0, 48.0, 89.0, 159.0, 278.0, 543.0, 1112.0, 2426.0, 6668.0, 21830.0, 103640.0, 1238227.0, 2588820.0, 182906.0, 32347.0, 9172.0, 3132.0, 1332.0, 631.0, 321.0, 205.0, 87.0, 62.0, 29.0, 28.0, 20.0, 19.0, 10.0, 7.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.1124267578125, -4.924072265625, -4.7357177734375, -4.54736328125, -4.3590087890625, -4.170654296875, -3.9822998046875, -3.7939453125, -3.6055908203125, -3.417236328125, -3.2288818359375, -3.04052734375, -2.8521728515625, -2.663818359375, -2.4754638671875, -2.287109375, -2.0987548828125, -1.910400390625, -1.7220458984375, -1.53369140625, -1.3453369140625, -1.156982421875, -0.9686279296875, -0.7802734375, -0.5919189453125, -0.403564453125, -0.2152099609375, -0.02685546875, 0.1614990234375, 0.349853515625, 0.5382080078125, 0.7265625, 0.9149169921875, 1.103271484375, 1.2916259765625, 1.47998046875, 1.6683349609375, 1.856689453125, 2.0450439453125, 2.2333984375, 2.4217529296875, 2.610107421875, 2.7984619140625, 2.98681640625, 3.1751708984375, 3.363525390625, 3.5518798828125, 3.740234375, 3.9285888671875, 4.116943359375, 4.3052978515625, 4.49365234375, 4.6820068359375, 4.870361328125, 5.0587158203125, 5.2470703125, 5.4354248046875, 5.623779296875, 5.8121337890625, 6.00048828125, 6.1888427734375, 6.377197265625, 6.5655517578125, 6.75390625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 10.0, 4.0, 7.0, 19.0, 18.0, 18.0, 34.0, 38.0, 54.0, 60.0, 64.0, 99.0, 87.0, 94.0, 86.0, 86.0, 65.0, 43.0, 33.0, 27.0, 18.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.854825019836426, -12.424972534179688, -11.99512004852295, -11.565267562866211, -11.135414123535156, -10.705561637878418, -10.27570915222168, -9.845856666564941, -9.416004180908203, -8.986151695251465, -8.556299209594727, -8.126445770263672, -7.696593761444092, -7.266740798950195, -6.836888313293457, -6.407035827636719, -5.977182865142822, -5.547330379486084, -5.1174774169921875, -4.687624931335449, -4.257772445678711, -3.8279197216033936, -3.398066997528076, -2.968214511871338, -2.5383617877960205, -2.108509063720703, -1.6786565780639648, -1.2488038539886475, -0.8189512491226196, -0.3890986442565918, 0.040754079818725586, 0.47060656547546387, 0.9004592895507812, 1.330311894416809, 1.760164499282837, 2.1900172233581543, 2.6198697090148926, 3.04972243309021, 3.4795751571655273, 3.9094276428222656, 4.339280128479004, 4.769132614135742, 5.198985576629639, 5.628838062286377, 6.058690547943115, 6.488543510437012, 6.91839599609375, 7.348248481750488, 7.778101444244385, 8.207954406738281, 8.63780689239502, 9.067659378051758, 9.497511863708496, 9.927364349365234, 10.357217788696289, 10.787069320678711, 11.216922760009766, 11.646775245666504, 12.076627731323242, 12.506481170654297, 12.936333656311035, 13.366186141967773, 13.796038627624512, 14.22589111328125, 14.655743598937988]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 9.0, 8.0, 14.0, 18.0, 12.0, 11.0, 18.0, 13.0, 21.0, 30.0, 26.0, 34.0, 26.0, 37.0, 43.0, 38.0, 38.0, 30.0, 38.0, 40.0, 29.0, 40.0, 36.0, 38.0, 39.0, 38.0, 36.0, 21.0, 27.0, 21.0, 19.0, 15.0, 23.0, 19.0, 17.0, 21.0, 11.0, 9.0, 8.0, 10.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0], "bins": [-10.632645606994629, -10.340533256530762, -10.048420906066895, -9.756307601928711, -9.464195251464844, -9.172082901000977, -8.87997055053711, -8.587858200073242, -8.295744895935059, -8.003632545471191, -7.711519718170166, -7.419407367706299, -7.127294540405273, -6.835182189941406, -6.543069839477539, -6.250957012176514, -5.9588446617126465, -5.666732311248779, -5.374619483947754, -5.082507133483887, -4.790394306182861, -4.498281955718994, -4.206169128417969, -3.9140567779541016, -3.6219441890716553, -3.329831600189209, -3.0377190113067627, -2.7456064224243164, -2.453494071960449, -2.161381244659424, -1.8692688941955566, -1.5771563053131104, -1.285043716430664, -0.9929311275482178, -0.7008185982704163, -0.40870606899261475, -0.11659348011016846, 0.17551910877227783, 0.46763157844543457, 0.7597441673278809, 1.0518567562103271, 1.3439693450927734, 1.6360819339752197, 1.9281944036483765, 2.220306873321533, 2.5124197006225586, 2.804532051086426, 3.096644639968872, 3.3887572288513184, 3.6808698177337646, 3.972982406616211, 4.265094757080078, 4.5572075843811035, 4.849319934844971, 5.141432762145996, 5.433545112609863, 5.7256574630737305, 6.017769813537598, 6.309882640838623, 6.60199499130249, 6.894107818603516, 7.186220169067383, 7.47833251953125, 7.770445346832275, 8.0625581741333]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 8.0, 16.0, 15.0, 15.0, 19.0, 26.0, 24.0, 26.0, 24.0, 39.0, 33.0, 44.0, 42.0, 59.0, 39.0, 44.0, 49.0, 68.0, 56.0, 37.0, 46.0, 39.0, 22.0, 39.0, 22.0, 27.0, 18.0, 18.0, 13.0, 14.0, 11.0, 10.0, 7.0, 7.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.697265625, -1.6486968994140625, -1.600128173828125, -1.5515594482421875, -1.50299072265625, -1.4544219970703125, -1.405853271484375, -1.3572845458984375, -1.3087158203125, -1.2601470947265625, -1.211578369140625, -1.1630096435546875, -1.11444091796875, -1.0658721923828125, -1.017303466796875, -0.9687347412109375, -0.920166015625, -0.8715972900390625, -0.823028564453125, -0.7744598388671875, -0.72589111328125, -0.6773223876953125, -0.628753662109375, -0.5801849365234375, -0.5316162109375, -0.4830474853515625, -0.434478759765625, -0.3859100341796875, -0.33734130859375, -0.2887725830078125, -0.240203857421875, -0.1916351318359375, -0.14306640625, -0.0944976806640625, -0.045928955078125, 0.0026397705078125, 0.05120849609375, 0.0997772216796875, 0.148345947265625, 0.1969146728515625, 0.2454833984375, 0.2940521240234375, 0.342620849609375, 0.3911895751953125, 0.43975830078125, 0.4883270263671875, 0.536895751953125, 0.5854644775390625, 0.634033203125, 0.6826019287109375, 0.731170654296875, 0.7797393798828125, 0.82830810546875, 0.8768768310546875, 0.925445556640625, 0.9740142822265625, 1.0225830078125, 1.0711517333984375, 1.119720458984375, 1.1682891845703125, 1.21685791015625, 1.2654266357421875, 1.313995361328125, 1.3625640869140625, 1.4111328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 13.0, 21.0, 24.0, 38.0, 64.0, 96.0, 132.0, 240.0, 412.0, 593.0, 993.0, 1696.0, 2824.0, 4729.0, 8118.0, 13967.0, 24226.0, 40895.0, 66488.0, 103969.0, 150387.0, 181974.0, 157042.0, 110075.0, 71912.0, 44387.0, 26386.0, 15328.0, 8865.0, 5093.0, 2986.0, 1743.0, 1048.0, 665.0, 411.0, 249.0, 149.0, 107.0, 75.0, 32.0, 33.0, 21.0, 10.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9072113037109375, -0.879364013671875, -0.8515167236328125, -0.82366943359375, -0.7958221435546875, -0.767974853515625, -0.7401275634765625, -0.7122802734375, -0.6844329833984375, -0.656585693359375, -0.6287384033203125, -0.60089111328125, -0.5730438232421875, -0.545196533203125, -0.5173492431640625, -0.489501953125, -0.4616546630859375, -0.433807373046875, -0.4059600830078125, -0.37811279296875, -0.3502655029296875, -0.322418212890625, -0.2945709228515625, -0.2667236328125, -0.2388763427734375, -0.211029052734375, -0.1831817626953125, -0.15533447265625, -0.1274871826171875, -0.099639892578125, -0.0717926025390625, -0.0439453125, -0.0160980224609375, 0.011749267578125, 0.0395965576171875, 0.06744384765625, 0.0952911376953125, 0.123138427734375, 0.1509857177734375, 0.1788330078125, 0.2066802978515625, 0.234527587890625, 0.2623748779296875, 0.29022216796875, 0.3180694580078125, 0.345916748046875, 0.3737640380859375, 0.401611328125, 0.4294586181640625, 0.457305908203125, 0.4851531982421875, 0.51300048828125, 0.5408477783203125, 0.568695068359375, 0.5965423583984375, 0.6243896484375, 0.6522369384765625, 0.680084228515625, 0.7079315185546875, 0.73577880859375, 0.7636260986328125, 0.791473388671875, 0.8193206787109375, 0.84716796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 18.0, 16.0, 10.0, 13.0, 9.0, 16.0, 25.0, 17.0, 23.0, 32.0, 36.0, 35.0, 38.0, 25.0, 40.0, 42.0, 37.0, 36.0, 1060.0, 45.0, 40.0, 39.0, 36.0, 30.0, 32.0, 27.0, 17.0, 29.0, 25.0, 25.0, 18.0, 16.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1083984375, -1.0740509033203125, -1.039703369140625, -1.0053558349609375, -0.97100830078125, -0.9366607666015625, -0.902313232421875, -0.8679656982421875, -0.8336181640625, -0.7992706298828125, -0.764923095703125, -0.7305755615234375, -0.69622802734375, -0.6618804931640625, -0.627532958984375, -0.5931854248046875, -0.558837890625, -0.5244903564453125, -0.490142822265625, -0.4557952880859375, -0.42144775390625, -0.3871002197265625, -0.352752685546875, -0.3184051513671875, -0.2840576171875, -0.2497100830078125, -0.215362548828125, -0.1810150146484375, -0.14666748046875, -0.1123199462890625, -0.077972412109375, -0.0436248779296875, -0.00927734375, 0.0250701904296875, 0.059417724609375, 0.0937652587890625, 0.12811279296875, 0.1624603271484375, 0.196807861328125, 0.2311553955078125, 0.2655029296875, 0.2998504638671875, 0.334197998046875, 0.3685455322265625, 0.40289306640625, 0.4372406005859375, 0.471588134765625, 0.5059356689453125, 0.540283203125, 0.5746307373046875, 0.608978271484375, 0.6433258056640625, 0.67767333984375, 0.7120208740234375, 0.746368408203125, 0.7807159423828125, 0.8150634765625, 0.8494110107421875, 0.883758544921875, 0.9181060791015625, 0.95245361328125, 0.9868011474609375, 1.021148681640625, 1.0554962158203125, 1.08984375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 23.0, 36.0, 54.0, 63.0, 100.0, 132.0, 215.0, 306.0, 407.0, 597.0, 933.0, 1320.0, 1940.0, 2878.0, 4258.0, 6208.0, 9379.0, 14858.0, 25536.0, 65595.0, 425459.0, 1350686.0, 103735.0, 32565.0, 17091.0, 10596.0, 7081.0, 4807.0, 3199.0, 2275.0, 1476.0, 1037.0, 719.0, 443.0, 290.0, 254.0, 190.0, 112.0, 76.0, 59.0, 41.0, 17.0, 17.0, 12.0, 13.0, 1.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.96875, -0.938629150390625, -0.90850830078125, -0.878387451171875, -0.8482666015625, -0.818145751953125, -0.78802490234375, -0.757904052734375, -0.727783203125, -0.697662353515625, -0.66754150390625, -0.637420654296875, -0.6072998046875, -0.577178955078125, -0.54705810546875, -0.516937255859375, -0.48681640625, -0.456695556640625, -0.42657470703125, -0.396453857421875, -0.3663330078125, -0.336212158203125, -0.30609130859375, -0.275970458984375, -0.245849609375, -0.215728759765625, -0.18560791015625, -0.155487060546875, -0.1253662109375, -0.095245361328125, -0.06512451171875, -0.035003662109375, -0.0048828125, 0.025238037109375, 0.05535888671875, 0.085479736328125, 0.1156005859375, 0.145721435546875, 0.17584228515625, 0.205963134765625, 0.236083984375, 0.266204833984375, 0.29632568359375, 0.326446533203125, 0.3565673828125, 0.386688232421875, 0.41680908203125, 0.446929931640625, 0.47705078125, 0.507171630859375, 0.53729248046875, 0.567413330078125, 0.5975341796875, 0.627655029296875, 0.65777587890625, 0.687896728515625, 0.718017578125, 0.748138427734375, 0.77825927734375, 0.808380126953125, 0.8385009765625, 0.868621826171875, 0.89874267578125, 0.928863525390625, 0.958984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 12.0, 15.0, 17.0, 14.0, 21.0, 38.0, 33.0, 46.0, 49.0, 46.0, 83.0, 77.0, 98.0, 66.0, 62.0, 57.0, 42.0, 35.0, 38.0, 29.0, 14.0, 17.0, 8.0, 12.0, 12.0, 5.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.12310791015625, -0.11988067626953125, -0.1166534423828125, -0.11342620849609375, -0.110198974609375, -0.10697174072265625, -0.1037445068359375, -0.10051727294921875, -0.0972900390625, -0.09406280517578125, -0.0908355712890625, -0.08760833740234375, -0.084381103515625, -0.08115386962890625, -0.0779266357421875, -0.07469940185546875, -0.07147216796875, -0.06824493408203125, -0.0650177001953125, -0.06179046630859375, -0.058563232421875, -0.05533599853515625, -0.0521087646484375, -0.04888153076171875, -0.045654296875, -0.04242706298828125, -0.0391998291015625, -0.03597259521484375, -0.032745361328125, -0.02951812744140625, -0.0262908935546875, -0.02306365966796875, -0.01983642578125, -0.01660919189453125, -0.0133819580078125, -0.01015472412109375, -0.006927490234375, -0.00370025634765625, -0.0004730224609375, 0.00275421142578125, 0.0059814453125, 0.00920867919921875, 0.0124359130859375, 0.01566314697265625, 0.018890380859375, 0.02211761474609375, 0.0253448486328125, 0.02857208251953125, 0.03179931640625, 0.03502655029296875, 0.0382537841796875, 0.04148101806640625, 0.044708251953125, 0.04793548583984375, 0.0511627197265625, 0.05438995361328125, 0.0576171875, 0.06084442138671875, 0.0640716552734375, 0.06729888916015625, 0.070526123046875, 0.07375335693359375, 0.0769805908203125, 0.08020782470703125, 0.08343505859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 12.0, 12.0, 30.0, 24.0, 50.0, 83.0, 128.0, 281.0, 1032.0, 6918.0, 170311.0, 847865.0, 18855.0, 2072.0, 379.0, 163.0, 86.0, 57.0, 41.0, 23.0, 28.0, 16.0, 10.0, 8.0, 10.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4230194091796875, -1.366546630859375, -1.3100738525390625, -1.25360107421875, -1.1971282958984375, -1.140655517578125, -1.0841827392578125, -1.0277099609375, -0.9712371826171875, -0.914764404296875, -0.8582916259765625, -0.80181884765625, -0.7453460693359375, -0.688873291015625, -0.6324005126953125, -0.575927734375, -0.5194549560546875, -0.462982177734375, -0.4065093994140625, -0.35003662109375, -0.2935638427734375, -0.237091064453125, -0.1806182861328125, -0.1241455078125, -0.0676727294921875, -0.011199951171875, 0.0452728271484375, 0.10174560546875, 0.1582183837890625, 0.214691162109375, 0.2711639404296875, 0.32763671875, 0.3841094970703125, 0.440582275390625, 0.4970550537109375, 0.55352783203125, 0.6100006103515625, 0.666473388671875, 0.7229461669921875, 0.7794189453125, 0.8358917236328125, 0.892364501953125, 0.9488372802734375, 1.00531005859375, 1.0617828369140625, 1.118255615234375, 1.1747283935546875, 1.231201171875, 1.2876739501953125, 1.344146728515625, 1.4006195068359375, 1.45709228515625, 1.5135650634765625, 1.570037841796875, 1.6265106201171875, 1.6829833984375, 1.7394561767578125, 1.795928955078125, 1.8524017333984375, 1.90887451171875, 1.9653472900390625, 2.021820068359375, 2.0782928466796875, 2.134765625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 10.0, 17.0, 32.0, 49.0, 50.0, 90.0, 136.0, 155.0, 138.0, 106.0, 64.0, 34.0, 33.0, 24.0, 16.0, 10.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9815634489059448, -0.9584847688674927, -0.9354060292243958, -0.9123273491859436, -0.8892486095428467, -0.8661699295043945, -0.8430912494659424, -0.8200125694274902, -0.7969338297843933, -0.7738551497459412, -0.7507764101028442, -0.7276977300643921, -0.7046190500259399, -0.681540310382843, -0.6584616303443909, -0.635382890701294, -0.6123042106628418, -0.5892255306243896, -0.5661467909812927, -0.5430681109428406, -0.5199893712997437, -0.4969106912612915, -0.47383201122283936, -0.4507533013820648, -0.4276745915412903, -0.40459588170051575, -0.3815171718597412, -0.35843849182128906, -0.3353597819805145, -0.31228107213974, -0.28920239210128784, -0.2661236822605133, -0.24304494261741638, -0.21996623277664185, -0.1968875378370285, -0.17380884289741516, -0.15073013305664062, -0.1276514232158661, -0.10457272827625275, -0.0814940333366394, -0.05841532349586487, -0.03533662110567093, -0.01225791871547699, 0.01082078367471695, 0.03389948606491089, 0.05697818845510483, 0.08005689084529877, 0.10313558578491211, 0.12621429562568665, 0.14929300546646118, 0.17237170040607452, 0.19545039534568787, 0.2185291051864624, 0.24160781502723694, 0.2646865248680115, 0.2877652049064636, 0.31084391474723816, 0.3339226245880127, 0.35700130462646484, 0.3800800144672394, 0.4031587243080139, 0.42623743414878845, 0.449316143989563, 0.47239482402801514, 0.4954735338687897]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 8.0, 5.0, 14.0, 18.0, 27.0, 40.0, 35.0, 42.0, 45.0, 50.0, 70.0, 57.0, 80.0, 77.0, 57.0, 56.0, 59.0, 43.0, 56.0, 38.0, 28.0, 27.0, 24.0, 14.0, 9.0, 10.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7357281446456909, -0.7173859477043152, -0.6990438103675842, -0.6807016134262085, -0.6623594164848328, -0.644017219543457, -0.6256750822067261, -0.6073328852653503, -0.5889906883239746, -0.5706484913825989, -0.5523063540458679, -0.5339641571044922, -0.5156219601631165, -0.4972797930240631, -0.47893762588500977, -0.46059542894363403, -0.4422532618045807, -0.42391109466552734, -0.4055688977241516, -0.38722673058509827, -0.36888453364372253, -0.3505423665046692, -0.33220016956329346, -0.3138580024242401, -0.29551583528518677, -0.2771736681461334, -0.2588314712047577, -0.24048930406570435, -0.2221471071243286, -0.20380493998527527, -0.18546275794506073, -0.1671205759048462, -0.14877837896347046, -0.13043619692325592, -0.11209401488304138, -0.09375184029340744, -0.0754096582531929, -0.05706747621297836, -0.03872530162334442, -0.020383119583129883, -0.0020409375429153442, 0.016301242634654045, 0.034643422812223434, 0.052985601127147675, 0.07132778316736221, 0.08966996520757675, 0.1080121397972107, 0.12635432183742523, 0.14469650387763977, 0.1630386859178543, 0.18138086795806885, 0.1997230350971222, 0.21806523203849792, 0.23640739917755127, 0.254749596118927, 0.27309176325798035, 0.2914339303970337, 0.30977609753608704, 0.32811829447746277, 0.3464604616165161, 0.36480265855789185, 0.3831448256969452, 0.40148699283599854, 0.41982918977737427, 0.43817138671875]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 30.0, 20.0, 30.0, 41.0, 53.0, 49.0, 52.0, 51.0, 72.0, 76.0, 72.0, 75.0, 67.0, 58.0, 46.0, 46.0, 31.0, 22.0, 29.0, 17.0, 14.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0], "bins": [-3.1796875, -3.1104736328125, -3.041259765625, -2.9720458984375, -2.90283203125, -2.8336181640625, -2.764404296875, -2.6951904296875, -2.6259765625, -2.5567626953125, -2.487548828125, -2.4183349609375, -2.34912109375, -2.2799072265625, -2.210693359375, -2.1414794921875, -2.072265625, -2.0030517578125, -1.933837890625, -1.8646240234375, -1.79541015625, -1.7261962890625, -1.656982421875, -1.5877685546875, -1.5185546875, -1.4493408203125, -1.380126953125, -1.3109130859375, -1.24169921875, -1.1724853515625, -1.103271484375, -1.0340576171875, -0.96484375, -0.8956298828125, -0.826416015625, -0.7572021484375, -0.68798828125, -0.6187744140625, -0.549560546875, -0.4803466796875, -0.4111328125, -0.3419189453125, -0.272705078125, -0.2034912109375, -0.13427734375, -0.0650634765625, 0.004150390625, 0.0733642578125, 0.142578125, 0.2117919921875, 0.281005859375, 0.3502197265625, 0.41943359375, 0.4886474609375, 0.557861328125, 0.6270751953125, 0.6962890625, 0.7655029296875, 0.834716796875, 0.9039306640625, 0.97314453125, 1.0423583984375, 1.111572265625, 1.1807861328125, 1.25]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 9.0, 19.0, 23.0, 41.0, 56.0, 98.0, 162.0, 235.0, 417.0, 765.0, 1401.0, 2709.0, 5753.0, 13653.0, 38859.0, 144011.0, 524645.0, 226741.0, 55827.0, 18486.0, 7447.0, 3371.0, 1735.0, 894.0, 453.0, 295.0, 156.0, 95.0, 60.0, 43.0, 31.0, 15.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.837890625, -2.735260009765625, -2.63262939453125, -2.529998779296875, -2.4273681640625, -2.324737548828125, -2.22210693359375, -2.119476318359375, -2.016845703125, -1.914215087890625, -1.81158447265625, -1.708953857421875, -1.6063232421875, -1.503692626953125, -1.40106201171875, -1.298431396484375, -1.19580078125, -1.093170166015625, -0.99053955078125, -0.887908935546875, -0.7852783203125, -0.682647705078125, -0.58001708984375, -0.477386474609375, -0.374755859375, -0.272125244140625, -0.16949462890625, -0.066864013671875, 0.0357666015625, 0.138397216796875, 0.24102783203125, 0.343658447265625, 0.4462890625, 0.548919677734375, 0.65155029296875, 0.754180908203125, 0.8568115234375, 0.959442138671875, 1.06207275390625, 1.164703369140625, 1.267333984375, 1.369964599609375, 1.47259521484375, 1.575225830078125, 1.6778564453125, 1.780487060546875, 1.88311767578125, 1.985748291015625, 2.08837890625, 2.191009521484375, 2.29364013671875, 2.396270751953125, 2.4989013671875, 2.601531982421875, 2.70416259765625, 2.806793212890625, 2.909423828125, 3.012054443359375, 3.11468505859375, 3.217315673828125, 3.3199462890625, 3.422576904296875, 3.52520751953125, 3.627838134765625, 3.73046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 25.0, 14.0, 22.0, 25.0, 17.0, 16.0, 26.0, 21.0, 35.0, 40.0, 68.0, 68.0, 94.0, 147.0, 286.0, 1343.0, 198.0, 89.0, 74.0, 58.0, 29.0, 39.0, 33.0, 33.0, 26.0, 26.0, 19.0, 23.0, 20.0, 15.0, 8.0, 10.0, 13.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.955078125, -3.827789306640625, -3.70050048828125, -3.573211669921875, -3.4459228515625, -3.318634033203125, -3.19134521484375, -3.064056396484375, -2.936767578125, -2.809478759765625, -2.68218994140625, -2.554901123046875, -2.4276123046875, -2.300323486328125, -2.17303466796875, -2.045745849609375, -1.91845703125, -1.791168212890625, -1.66387939453125, -1.536590576171875, -1.4093017578125, -1.282012939453125, -1.15472412109375, -1.027435302734375, -0.900146484375, -0.772857666015625, -0.64556884765625, -0.518280029296875, -0.3909912109375, -0.263702392578125, -0.13641357421875, -0.009124755859375, 0.1181640625, 0.245452880859375, 0.37274169921875, 0.500030517578125, 0.6273193359375, 0.754608154296875, 0.88189697265625, 1.009185791015625, 1.136474609375, 1.263763427734375, 1.39105224609375, 1.518341064453125, 1.6456298828125, 1.772918701171875, 1.90020751953125, 2.027496337890625, 2.15478515625, 2.282073974609375, 2.40936279296875, 2.536651611328125, 2.6639404296875, 2.791229248046875, 2.91851806640625, 3.045806884765625, 3.173095703125, 3.300384521484375, 3.42767333984375, 3.554962158203125, 3.6822509765625, 3.809539794921875, 3.93682861328125, 4.064117431640625, 4.19140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 3.0, 2.0, 11.0, 1.0, 16.0, 15.0, 17.0, 21.0, 25.0, 30.0, 41.0, 52.0, 53.0, 68.0, 94.0, 111.0, 208.0, 350.0, 655.0, 1977.0, 9764.0, 99632.0, 2627056.0, 378176.0, 21618.0, 3466.0, 979.0, 403.0, 234.0, 139.0, 131.0, 75.0, 53.0, 47.0, 35.0, 27.0, 27.0, 15.0, 23.0, 10.0, 9.0, 3.0, 7.0, 11.0, 5.0, 6.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.16436767578125, -7.9146728515625, -7.66497802734375, -7.415283203125, -7.16558837890625, -6.9158935546875, -6.66619873046875, -6.41650390625, -6.16680908203125, -5.9171142578125, -5.66741943359375, -5.417724609375, -5.16802978515625, -4.9183349609375, -4.66864013671875, -4.4189453125, -4.16925048828125, -3.9195556640625, -3.66986083984375, -3.420166015625, -3.17047119140625, -2.9207763671875, -2.67108154296875, -2.42138671875, -2.17169189453125, -1.9219970703125, -1.67230224609375, -1.422607421875, -1.17291259765625, -0.9232177734375, -0.67352294921875, -0.423828125, -0.17413330078125, 0.0755615234375, 0.32525634765625, 0.574951171875, 0.82464599609375, 1.0743408203125, 1.32403564453125, 1.57373046875, 1.82342529296875, 2.0731201171875, 2.32281494140625, 2.572509765625, 2.82220458984375, 3.0718994140625, 3.32159423828125, 3.5712890625, 3.82098388671875, 4.0706787109375, 4.32037353515625, 4.570068359375, 4.81976318359375, 5.0694580078125, 5.31915283203125, 5.56884765625, 5.81854248046875, 6.0682373046875, 6.31793212890625, 6.567626953125, 6.81732177734375, 7.0670166015625, 7.31671142578125, 7.56640625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 308.0, 705.0, 1.0, 1.0], "bins": [-339.839599609375, -334.2760925292969, -328.7126159667969, -323.14910888671875, -317.58563232421875, -312.0221252441406, -306.4586181640625, -300.8951416015625, -295.3316345214844, -289.76812744140625, -284.20465087890625, -278.6411437988281, -273.07763671875, -267.51416015625, -261.9506530761719, -256.3871765136719, -250.82366943359375, -245.2601776123047, -239.69668579101562, -234.1331787109375, -228.56968688964844, -223.00619506835938, -217.44268798828125, -211.8791961669922, -206.31570434570312, -200.75221252441406, -195.188720703125, -189.62521362304688, -184.0617218017578, -178.49822998046875, -172.93472290039062, -167.37123107910156, -161.8077392578125, -156.24424743652344, -150.68075561523438, -145.11724853515625, -139.5537567138672, -133.99026489257812, -128.4267578125, -122.86326599121094, -117.29977416992188, -111.73628234863281, -106.17278289794922, -100.60928344726562, -95.04579162597656, -89.4822998046875, -83.9188003540039, -78.35530090332031, -72.79180908203125, -67.22831726074219, -61.664817810058594, -56.101322174072266, -50.53782653808594, -44.97433090209961, -39.41083526611328, -33.84733963012695, -28.28384017944336, -22.72034454345703, -17.156848907470703, -11.593353271484375, -6.029857635498047, -0.46636199951171875, 5.097133636474609, 10.660629272460938, 16.224124908447266]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 4.0, 15.0, 3.0, 14.0, 19.0, 15.0, 13.0, 22.0, 28.0, 22.0, 26.0, 35.0, 37.0, 31.0, 42.0, 33.0, 34.0, 50.0, 50.0, 55.0, 42.0, 39.0, 47.0, 33.0, 33.0, 32.0, 33.0, 27.0, 35.0, 17.0, 22.0, 18.0, 11.0, 7.0, 10.0, 10.0, 7.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.351264953613281, -14.917603492736816, -14.483942031860352, -14.050280570983887, -13.616619110107422, -13.182957649230957, -12.749296188354492, -12.315633773803711, -11.881973266601562, -11.448311805725098, -11.014650344848633, -10.580988883972168, -10.147327423095703, -9.713665962219238, -9.280004501342773, -8.846342086791992, -8.412680625915527, -7.9790191650390625, -7.545357704162598, -7.111696243286133, -6.678034782409668, -6.244373321533203, -5.81071138381958, -5.377049922943115, -4.94338846206665, -4.5097270011901855, -4.076065540313721, -3.6424038410186768, -3.208742380142212, -2.775080919265747, -2.341419219970703, -1.9077577590942383, -1.4740962982177734, -1.0404348373413086, -0.6067732572555542, -0.1731116771697998, 0.26054978370666504, 0.6942112445831299, 1.1278729438781738, 1.5615344047546387, 1.9951958656311035, 2.4288573265075684, 2.862518787384033, 3.296180486679077, 3.729841947555542, 4.163503646850586, 4.597165107727051, 5.030826568603516, 5.4644880294799805, 5.898149490356445, 6.33181095123291, 6.765472412109375, 7.19913387298584, 7.632795333862305, 8.066457748413086, 8.500118255615234, 8.933780670166016, 9.36744213104248, 9.801103591918945, 10.23476505279541, 10.668426513671875, 11.10208797454834, 11.535749435424805, 11.969411849975586, 12.403072357177734]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 8.0, 14.0, 11.0, 19.0, 26.0, 25.0, 49.0, 40.0, 40.0, 57.0, 71.0, 53.0, 65.0, 61.0, 61.0, 68.0, 61.0, 45.0, 42.0, 38.0, 35.0, 31.0, 19.0, 11.0, 13.0, 13.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.025390625, -2.9557647705078125, -2.886138916015625, -2.8165130615234375, -2.74688720703125, -2.6772613525390625, -2.607635498046875, -2.5380096435546875, -2.4683837890625, -2.3987579345703125, -2.329132080078125, -2.2595062255859375, -2.18988037109375, -2.1202545166015625, -2.050628662109375, -1.9810028076171875, -1.911376953125, -1.8417510986328125, -1.772125244140625, -1.7024993896484375, -1.63287353515625, -1.5632476806640625, -1.493621826171875, -1.4239959716796875, -1.3543701171875, -1.2847442626953125, -1.215118408203125, -1.1454925537109375, -1.07586669921875, -1.0062408447265625, -0.936614990234375, -0.8669891357421875, -0.79736328125, -0.7277374267578125, -0.658111572265625, -0.5884857177734375, -0.51885986328125, -0.4492340087890625, -0.379608154296875, -0.3099822998046875, -0.2403564453125, -0.1707305908203125, -0.101104736328125, -0.0314788818359375, 0.03814697265625, 0.1077728271484375, 0.177398681640625, 0.2470245361328125, 0.316650390625, 0.3862762451171875, 0.455902099609375, 0.5255279541015625, 0.59515380859375, 0.6647796630859375, 0.734405517578125, 0.8040313720703125, 0.8736572265625, 0.9432830810546875, 1.012908935546875, 1.0825347900390625, 1.15216064453125, 1.2217864990234375, 1.291412353515625, 1.3610382080078125, 1.4306640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 12.0, 9.0, 9.0, 16.0, 29.0, 16.0, 45.0, 66.0, 93.0, 171.0, 379.0, 1046.0, 3059.0, 11998.0, 85074.0, 2615493.0, 1409480.0, 53984.0, 9261.0, 2489.0, 898.0, 303.0, 139.0, 81.0, 36.0, 30.0, 22.0, 14.0, 15.0, 6.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-9.234375, -9.01910400390625, -8.8038330078125, -8.58856201171875, -8.373291015625, -8.15802001953125, -7.9427490234375, -7.72747802734375, -7.51220703125, -7.29693603515625, -7.0816650390625, -6.86639404296875, -6.651123046875, -6.43585205078125, -6.2205810546875, -6.00531005859375, -5.7900390625, -5.57476806640625, -5.3594970703125, -5.14422607421875, -4.928955078125, -4.71368408203125, -4.4984130859375, -4.28314208984375, -4.06787109375, -3.85260009765625, -3.6373291015625, -3.42205810546875, -3.206787109375, -2.99151611328125, -2.7762451171875, -2.56097412109375, -2.345703125, -2.13043212890625, -1.9151611328125, -1.69989013671875, -1.484619140625, -1.26934814453125, -1.0540771484375, -0.83880615234375, -0.62353515625, -0.40826416015625, -0.1929931640625, 0.02227783203125, 0.237548828125, 0.45281982421875, 0.6680908203125, 0.88336181640625, 1.0986328125, 1.31390380859375, 1.5291748046875, 1.74444580078125, 1.959716796875, 2.17498779296875, 2.3902587890625, 2.60552978515625, 2.82080078125, 3.03607177734375, 3.2513427734375, 3.46661376953125, 3.681884765625, 3.89715576171875, 4.1124267578125, 4.32769775390625, 4.54296875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 9.0, 12.0, 12.0, 14.0, 31.0, 45.0, 51.0, 50.0, 88.0, 101.0, 122.0, 175.0, 257.0, 381.0, 501.0, 500.0, 456.0, 350.0, 218.0, 178.0, 139.0, 89.0, 60.0, 57.0, 36.0, 28.0, 21.0, 22.0, 15.0, 13.0, 8.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.56683349609375, -2.4656982421875, -2.36456298828125, -2.263427734375, -2.16229248046875, -2.0611572265625, -1.96002197265625, -1.85888671875, -1.75775146484375, -1.6566162109375, -1.55548095703125, -1.454345703125, -1.35321044921875, -1.2520751953125, -1.15093994140625, -1.0498046875, -0.94866943359375, -0.8475341796875, -0.74639892578125, -0.645263671875, -0.54412841796875, -0.4429931640625, -0.34185791015625, -0.24072265625, -0.13958740234375, -0.0384521484375, 0.06268310546875, 0.163818359375, 0.26495361328125, 0.3660888671875, 0.46722412109375, 0.568359375, 0.66949462890625, 0.7706298828125, 0.87176513671875, 0.972900390625, 1.07403564453125, 1.1751708984375, 1.27630615234375, 1.37744140625, 1.47857666015625, 1.5797119140625, 1.68084716796875, 1.781982421875, 1.88311767578125, 1.9842529296875, 2.08538818359375, 2.1865234375, 2.28765869140625, 2.3887939453125, 2.48992919921875, 2.591064453125, 2.69219970703125, 2.7933349609375, 2.89447021484375, 2.99560546875, 3.09674072265625, 3.1978759765625, 3.29901123046875, 3.400146484375, 3.50128173828125, 3.6024169921875, 3.70355224609375, 3.8046875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 5.0, 6.0, 9.0, 15.0, 21.0, 28.0, 19.0, 35.0, 50.0, 87.0, 107.0, 151.0, 283.0, 608.0, 2031.0, 10866.0, 95935.0, 2735552.0, 1281536.0, 57001.0, 7132.0, 1537.0, 509.0, 261.0, 122.0, 105.0, 62.0, 59.0, 42.0, 30.0, 16.0, 10.0, 16.0, 10.0, 5.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.291015625, -9.99609375, -9.701171875, -9.40625, -9.111328125, -8.81640625, -8.521484375, -8.2265625, -7.931640625, -7.63671875, -7.341796875, -7.046875, -6.751953125, -6.45703125, -6.162109375, -5.8671875, -5.572265625, -5.27734375, -4.982421875, -4.6875, -4.392578125, -4.09765625, -3.802734375, -3.5078125, -3.212890625, -2.91796875, -2.623046875, -2.328125, -2.033203125, -1.73828125, -1.443359375, -1.1484375, -0.853515625, -0.55859375, -0.263671875, 0.03125, 0.326171875, 0.62109375, 0.916015625, 1.2109375, 1.505859375, 1.80078125, 2.095703125, 2.390625, 2.685546875, 2.98046875, 3.275390625, 3.5703125, 3.865234375, 4.16015625, 4.455078125, 4.75, 5.044921875, 5.33984375, 5.634765625, 5.9296875, 6.224609375, 6.51953125, 6.814453125, 7.109375, 7.404296875, 7.69921875, 7.994140625, 8.2890625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 10.0, 14.0, 26.0, 45.0, 85.0, 150.0, 207.0, 193.0, 125.0, 74.0, 46.0, 23.0, 7.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.37080383300781, -37.41209030151367, -36.453372955322266, -35.494659423828125, -34.535945892333984, -33.57722854614258, -32.61851501464844, -31.659799575805664, -30.70108413696289, -29.742368698120117, -28.783655166625977, -27.824939727783203, -26.86622428894043, -25.907508850097656, -24.948795318603516, -23.990079879760742, -23.0313663482666, -22.072650909423828, -21.113937377929688, -20.155221939086914, -19.19650650024414, -18.23779296875, -17.279077529907227, -16.320362091064453, -15.361647605895996, -14.402933120727539, -13.444217681884766, -12.485503196716309, -11.526788711547852, -10.568073272705078, -9.609358787536621, -8.650644302368164, -7.691930770874023, -6.733215808868408, -5.774500846862793, -4.815786361694336, -3.8570713996887207, -2.8983564376831055, -1.9396419525146484, -0.9809269905090332, -0.02221202850341797, 0.9365028142929077, 1.8952176570892334, 2.8539323806762695, 3.8126473426818848, 4.7713623046875, 5.730076789855957, 6.688791751861572, 7.6475067138671875, 8.606221199035645, 9.564936637878418, 10.523651123046875, 11.482366561889648, 12.441081047058105, 13.399795532226562, 14.358510971069336, 15.317225456237793, 16.27593994140625, 17.234655380249023, 18.193370819091797, 19.152084350585938, 20.11079978942871, 21.069515228271484, 22.028228759765625, 22.9869441986084]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 9.0, 16.0, 16.0, 17.0, 11.0, 14.0, 26.0, 22.0, 23.0, 27.0, 25.0, 40.0, 31.0, 35.0, 36.0, 41.0, 41.0, 53.0, 29.0, 46.0, 33.0, 36.0, 36.0, 33.0, 27.0, 28.0, 27.0, 25.0, 26.0, 27.0, 14.0, 13.0, 10.0, 10.0, 9.0, 13.0, 6.0, 6.0, 13.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.077351570129395, -9.769559860229492, -9.461769104003906, -9.153977394104004, -8.846185684204102, -8.538394927978516, -8.230603218078613, -7.922811508178711, -7.615020275115967, -7.307229042053223, -6.99943733215332, -6.691646099090576, -6.383854866027832, -6.07606315612793, -5.7682719230651855, -5.460480690002441, -5.152688980102539, -4.844897747039795, -4.537106037139893, -4.229314804077148, -3.921523332595825, -3.613731861114502, -3.305940628051758, -2.9981491565704346, -2.6903576850891113, -2.382566213607788, -2.074774742126465, -1.7669835090637207, -1.4591920375823975, -1.1514005661010742, -0.8436092138290405, -0.5358178615570068, -0.2280254364013672, 0.07976597547531128, 0.38755738735198975, 0.6953487992286682, 1.0031402111053467, 1.31093168258667, 1.6187230348587036, 1.9265143871307373, 2.2343058586120605, 2.542097330093384, 2.849888801574707, 3.157680034637451, 3.4654715061187744, 3.7732629776000977, 4.081054210662842, 4.388845443725586, 4.696637153625488, 5.004428386688232, 5.312220096588135, 5.620011329650879, 5.927803039550781, 6.235594272613525, 6.5433855056762695, 6.851177215576172, 7.158968448638916, 7.46675968170166, 7.7745513916015625, 8.082343101501465, 8.39013385772705, 8.697925567626953, 9.005717277526855, 9.313508033752441, 9.621299743652344]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 17.0, 8.0, 12.0, 18.0, 24.0, 31.0, 31.0, 33.0, 39.0, 50.0, 65.0, 56.0, 58.0, 56.0, 57.0, 53.0, 60.0, 65.0, 46.0, 46.0, 34.0, 37.0, 29.0, 15.0, 20.0, 16.0, 4.0, 7.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0], "bins": [-2.7734375, -2.710174560546875, -2.64691162109375, -2.583648681640625, -2.5203857421875, -2.457122802734375, -2.39385986328125, -2.330596923828125, -2.267333984375, -2.204071044921875, -2.14080810546875, -2.077545166015625, -2.0142822265625, -1.951019287109375, -1.88775634765625, -1.824493408203125, -1.76123046875, -1.697967529296875, -1.63470458984375, -1.571441650390625, -1.5081787109375, -1.444915771484375, -1.38165283203125, -1.318389892578125, -1.255126953125, -1.191864013671875, -1.12860107421875, -1.065338134765625, -1.0020751953125, -0.938812255859375, -0.87554931640625, -0.812286376953125, -0.7490234375, -0.685760498046875, -0.62249755859375, -0.559234619140625, -0.4959716796875, -0.432708740234375, -0.36944580078125, -0.306182861328125, -0.242919921875, -0.179656982421875, -0.11639404296875, -0.053131103515625, 0.0101318359375, 0.073394775390625, 0.13665771484375, 0.199920654296875, 0.26318359375, 0.326446533203125, 0.38970947265625, 0.452972412109375, 0.5162353515625, 0.579498291015625, 0.64276123046875, 0.706024169921875, 0.769287109375, 0.832550048828125, 0.89581298828125, 0.959075927734375, 1.0223388671875, 1.085601806640625, 1.14886474609375, 1.212127685546875, 1.275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 14.0, 7.0, 12.0, 20.0, 44.0, 66.0, 144.0, 300.0, 616.0, 1715.0, 4784.0, 13293.0, 38175.0, 105157.0, 229050.0, 305972.0, 207756.0, 90395.0, 33169.0, 11267.0, 4024.0, 1497.0, 585.0, 229.0, 112.0, 44.0, 28.0, 27.0, 14.0, 8.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5215301513671875, -1.469818115234375, -1.4181060791015625, -1.36639404296875, -1.3146820068359375, -1.262969970703125, -1.2112579345703125, -1.1595458984375, -1.1078338623046875, -1.056121826171875, -1.0044097900390625, -0.95269775390625, -0.9009857177734375, -0.849273681640625, -0.7975616455078125, -0.745849609375, -0.6941375732421875, -0.642425537109375, -0.5907135009765625, -0.53900146484375, -0.4872894287109375, -0.435577392578125, -0.3838653564453125, -0.3321533203125, -0.2804412841796875, -0.228729248046875, -0.1770172119140625, -0.12530517578125, -0.0735931396484375, -0.021881103515625, 0.0298309326171875, 0.08154296875, 0.1332550048828125, 0.184967041015625, 0.2366790771484375, 0.28839111328125, 0.3401031494140625, 0.391815185546875, 0.4435272216796875, 0.4952392578125, 0.5469512939453125, 0.598663330078125, 0.6503753662109375, 0.70208740234375, 0.7537994384765625, 0.805511474609375, 0.8572235107421875, 0.908935546875, 0.9606475830078125, 1.012359619140625, 1.0640716552734375, 1.11578369140625, 1.1674957275390625, 1.219207763671875, 1.2709197998046875, 1.3226318359375, 1.3743438720703125, 1.426055908203125, 1.4777679443359375, 1.52947998046875, 1.5811920166015625, 1.632904052734375, 1.6846160888671875, 1.736328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 6.0, 5.0, 7.0, 15.0, 11.0, 18.0, 20.0, 21.0, 33.0, 35.0, 43.0, 35.0, 42.0, 44.0, 40.0, 47.0, 1066.0, 56.0, 54.0, 48.0, 49.0, 40.0, 43.0, 29.0, 29.0, 37.0, 24.0, 29.0, 16.0, 17.0, 18.0, 11.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32708740234375, -1.2840576171875, -1.24102783203125, -1.197998046875, -1.15496826171875, -1.1119384765625, -1.06890869140625, -1.02587890625, -0.98284912109375, -0.9398193359375, -0.89678955078125, -0.853759765625, -0.81072998046875, -0.7677001953125, -0.72467041015625, -0.681640625, -0.63861083984375, -0.5955810546875, -0.55255126953125, -0.509521484375, -0.46649169921875, -0.4234619140625, -0.38043212890625, -0.33740234375, -0.29437255859375, -0.2513427734375, -0.20831298828125, -0.165283203125, -0.12225341796875, -0.0792236328125, -0.03619384765625, 0.0068359375, 0.04986572265625, 0.0928955078125, 0.13592529296875, 0.178955078125, 0.22198486328125, 0.2650146484375, 0.30804443359375, 0.35107421875, 0.39410400390625, 0.4371337890625, 0.48016357421875, 0.523193359375, 0.56622314453125, 0.6092529296875, 0.65228271484375, 0.6953125, 0.73834228515625, 0.7813720703125, 0.82440185546875, 0.867431640625, 0.91046142578125, 0.9534912109375, 0.99652099609375, 1.03955078125, 1.08258056640625, 1.1256103515625, 1.16864013671875, 1.211669921875, 1.25469970703125, 1.2977294921875, 1.34075927734375, 1.3837890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 9.0, 5.0, 9.0, 17.0, 25.0, 29.0, 42.0, 84.0, 114.0, 197.0, 284.0, 452.0, 676.0, 1013.0, 1574.0, 2515.0, 3828.0, 5957.0, 9232.0, 14846.0, 26090.0, 72936.0, 1311719.0, 528616.0, 56340.0, 23145.0, 13476.0, 8493.0, 5540.0, 3542.0, 2270.0, 1411.0, 916.0, 610.0, 363.0, 268.0, 168.0, 112.0, 74.0, 41.0, 31.0, 24.0, 14.0, 9.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9939422607421875, -0.959564208984375, -0.9251861572265625, -0.89080810546875, -0.8564300537109375, -0.822052001953125, -0.7876739501953125, -0.7532958984375, -0.7189178466796875, -0.684539794921875, -0.6501617431640625, -0.61578369140625, -0.5814056396484375, -0.547027587890625, -0.5126495361328125, -0.478271484375, -0.4438934326171875, -0.409515380859375, -0.3751373291015625, -0.34075927734375, -0.3063812255859375, -0.272003173828125, -0.2376251220703125, -0.2032470703125, -0.1688690185546875, -0.134490966796875, -0.1001129150390625, -0.06573486328125, -0.0313568115234375, 0.003021240234375, 0.0373992919921875, 0.07177734375, 0.1061553955078125, 0.140533447265625, 0.1749114990234375, 0.20928955078125, 0.2436676025390625, 0.278045654296875, 0.3124237060546875, 0.3468017578125, 0.3811798095703125, 0.415557861328125, 0.4499359130859375, 0.48431396484375, 0.5186920166015625, 0.553070068359375, 0.5874481201171875, 0.621826171875, 0.6562042236328125, 0.690582275390625, 0.7249603271484375, 0.75933837890625, 0.7937164306640625, 0.828094482421875, 0.8624725341796875, 0.8968505859375, 0.9312286376953125, 0.965606689453125, 0.9999847412109375, 1.03436279296875, 1.0687408447265625, 1.103118896484375, 1.1374969482421875, 1.171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 6.0, 16.0, 4.0, 11.0, 25.0, 25.0, 37.0, 64.0, 80.0, 105.0, 116.0, 91.0, 97.0, 74.0, 64.0, 36.0, 27.0, 18.0, 20.0, 19.0, 7.0, 2.0, 4.0, 7.0, 2.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11663818359375, -0.11246013641357422, -0.10828208923339844, -0.10410404205322266, -0.09992599487304688, -0.0957479476928711, -0.09156990051269531, -0.08739185333251953, -0.08321380615234375, -0.07903575897216797, -0.07485771179199219, -0.0706796646118164, -0.06650161743164062, -0.062323570251464844, -0.05814552307128906, -0.05396747589111328, -0.0497894287109375, -0.04561138153076172, -0.04143333435058594, -0.037255287170410156, -0.033077239990234375, -0.028899192810058594, -0.024721145629882812, -0.02054309844970703, -0.01636505126953125, -0.012187004089355469, -0.008008956909179688, -0.0038309097290039062, 0.000347137451171875, 0.004525184631347656, 0.008703231811523438, 0.012881278991699219, 0.017059326171875, 0.02123737335205078, 0.025415420532226562, 0.029593467712402344, 0.033771514892578125, 0.037949562072753906, 0.04212760925292969, 0.04630565643310547, 0.05048370361328125, 0.05466175079345703, 0.05883979797363281, 0.0630178451538086, 0.06719589233398438, 0.07137393951416016, 0.07555198669433594, 0.07973003387451172, 0.0839080810546875, 0.08808612823486328, 0.09226417541503906, 0.09644222259521484, 0.10062026977539062, 0.1047983169555664, 0.10897636413574219, 0.11315441131591797, 0.11733245849609375, 0.12151050567626953, 0.1256885528564453, 0.1298666000366211, 0.13404464721679688, 0.13822269439697266, 0.14240074157714844, 0.14657878875732422, 0.1507568359375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 8.0, 6.0, 9.0, 7.0, 23.0, 15.0, 30.0, 34.0, 51.0, 73.0, 129.0, 279.0, 1245.0, 17482.0, 979857.0, 46290.0, 2200.0, 369.0, 160.0, 74.0, 56.0, 41.0, 16.0, 13.0, 18.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.50390625, -2.435516357421875, -2.36712646484375, -2.298736572265625, -2.2303466796875, -2.161956787109375, -2.09356689453125, -2.025177001953125, -1.956787109375, -1.888397216796875, -1.82000732421875, -1.751617431640625, -1.6832275390625, -1.614837646484375, -1.54644775390625, -1.478057861328125, -1.40966796875, -1.341278076171875, -1.27288818359375, -1.204498291015625, -1.1361083984375, -1.067718505859375, -0.99932861328125, -0.930938720703125, -0.862548828125, -0.794158935546875, -0.72576904296875, -0.657379150390625, -0.5889892578125, -0.520599365234375, -0.45220947265625, -0.383819580078125, -0.3154296875, -0.247039794921875, -0.17864990234375, -0.110260009765625, -0.0418701171875, 0.026519775390625, 0.09490966796875, 0.163299560546875, 0.231689453125, 0.300079345703125, 0.36846923828125, 0.436859130859375, 0.5052490234375, 0.573638916015625, 0.64202880859375, 0.710418701171875, 0.77880859375, 0.847198486328125, 0.91558837890625, 0.983978271484375, 1.0523681640625, 1.120758056640625, 1.18914794921875, 1.257537841796875, 1.325927734375, 1.394317626953125, 1.46270751953125, 1.531097412109375, 1.5994873046875, 1.667877197265625, 1.73626708984375, 1.804656982421875, 1.873046875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 34.0, 113.0, 447.0, 319.0, 78.0, 15.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3178937435150146, -1.2626017332077026, -1.2073097229003906, -1.1520177125930786, -1.0967257022857666, -1.0414336919784546, -0.9861416816711426, -0.9308496713638306, -0.8755576610565186, -0.8202656507492065, -0.7649736404418945, -0.7096816301345825, -0.6543896198272705, -0.5990976095199585, -0.5438055992126465, -0.4885135889053345, -0.43322157859802246, -0.37792956829071045, -0.32263755798339844, -0.2673455476760864, -0.21205353736877441, -0.1567615270614624, -0.10146951675415039, -0.04617750644683838, 0.009114503860473633, 0.06440651416778564, 0.11969852447509766, 0.17499053478240967, 0.23028254508972168, 0.2855745553970337, 0.3408665657043457, 0.3961585760116577, 0.4514505863189697, 0.5067425966262817, 0.5620346069335938, 0.6173266172409058, 0.6726186275482178, 0.7279106378555298, 0.7832026481628418, 0.8384946584701538, 0.8937866687774658, 0.9490786790847778, 1.0043706893920898, 1.0596626996994019, 1.1149547100067139, 1.1702467203140259, 1.225538730621338, 1.28083074092865, 1.336122751235962, 1.391414761543274, 1.446706771850586, 1.501998782157898, 1.55729079246521, 1.612582802772522, 1.667874813079834, 1.723166823387146, 1.778458833694458, 1.83375084400177, 1.889042854309082, 1.944334864616394, 1.999626874923706, 2.0549187660217285, 2.11021089553833, 2.1655030250549316, 2.220794916152954]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 5.0, 12.0, 14.0, 13.0, 22.0, 31.0, 39.0, 39.0, 31.0, 56.0, 55.0, 57.0, 60.0, 69.0, 68.0, 58.0, 53.0, 53.0, 49.0, 45.0, 39.0, 28.0, 29.0, 23.0, 15.0, 13.0, 5.0, 7.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.4890289306640625, -0.4769285023212433, -0.46482810378074646, -0.45272767543792725, -0.4406272768974304, -0.4285268485546112, -0.416426420211792, -0.40432602167129517, -0.39222559332847595, -0.38012516498565674, -0.3680247664451599, -0.3559243381023407, -0.34382393956184387, -0.33172351121902466, -0.31962311267852783, -0.3075226843357086, -0.2954222559928894, -0.2833218276500702, -0.27122142910957336, -0.25912100076675415, -0.24702058732509613, -0.2349201738834381, -0.2228197604417801, -0.21071934700012207, -0.19861894845962524, -0.18651853501796722, -0.1744181215763092, -0.16231769323349, -0.15021727979183197, -0.13811686635017395, -0.12601645290851593, -0.11391603201627731, -0.1018156111240387, -0.08971519768238068, -0.07761477679014206, -0.06551436334848404, -0.05341394618153572, -0.0413135290145874, -0.029213115572929382, -0.017112694680690765, -0.005012281239032745, 0.0070881349965929985, 0.019188551232218742, 0.03128896653652191, 0.04338938370347023, 0.05548980087041855, 0.06759021431207657, 0.07969063520431519, 0.0917910486459732, 0.10389146208763123, 0.11599188297986984, 0.12809228897094727, 0.14019271731376648, 0.1522931307554245, 0.16439354419708252, 0.17649397253990173, 0.18859437108039856, 0.20069478452205658, 0.2127951979637146, 0.2248956263065338, 0.23699603974819183, 0.24909645318984985, 0.2611968517303467, 0.2732972800731659, 0.2853977084159851]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 7.0, 15.0, 11.0, 15.0, 20.0, 26.0, 24.0, 37.0, 42.0, 35.0, 58.0, 57.0, 51.0, 51.0, 62.0, 40.0, 42.0, 54.0, 50.0, 51.0, 48.0, 37.0, 31.0, 27.0, 23.0, 24.0, 14.0, 16.0, 5.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-2.30078125, -2.243133544921875, -2.18548583984375, -2.127838134765625, -2.0701904296875, -2.012542724609375, -1.95489501953125, -1.897247314453125, -1.839599609375, -1.781951904296875, -1.72430419921875, -1.666656494140625, -1.6090087890625, -1.551361083984375, -1.49371337890625, -1.436065673828125, -1.37841796875, -1.320770263671875, -1.26312255859375, -1.205474853515625, -1.1478271484375, -1.090179443359375, -1.03253173828125, -0.974884033203125, -0.917236328125, -0.859588623046875, -0.80194091796875, -0.744293212890625, -0.6866455078125, -0.628997802734375, -0.57135009765625, -0.513702392578125, -0.4560546875, -0.398406982421875, -0.34075927734375, -0.283111572265625, -0.2254638671875, -0.167816162109375, -0.11016845703125, -0.052520751953125, 0.005126953125, 0.062774658203125, 0.12042236328125, 0.178070068359375, 0.2357177734375, 0.293365478515625, 0.35101318359375, 0.408660888671875, 0.46630859375, 0.523956298828125, 0.58160400390625, 0.639251708984375, 0.6968994140625, 0.754547119140625, 0.81219482421875, 0.869842529296875, 0.927490234375, 0.985137939453125, 1.04278564453125, 1.100433349609375, 1.1580810546875, 1.215728759765625, 1.27337646484375, 1.331024169921875, 1.388671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 10.0, 13.0, 15.0, 27.0, 22.0, 47.0, 65.0, 118.0, 155.0, 281.0, 486.0, 952.0, 1933.0, 4221.0, 10191.0, 30103.0, 105209.0, 394514.0, 360890.0, 94341.0, 27732.0, 9528.0, 3879.0, 1732.0, 924.0, 476.0, 236.0, 158.0, 92.0, 75.0, 42.0, 24.0, 22.0, 3.0, 8.0, 3.0, 8.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.791015625, -2.691192626953125, -2.59136962890625, -2.491546630859375, -2.3917236328125, -2.291900634765625, -2.19207763671875, -2.092254638671875, -1.992431640625, -1.892608642578125, -1.79278564453125, -1.692962646484375, -1.5931396484375, -1.493316650390625, -1.39349365234375, -1.293670654296875, -1.19384765625, -1.094024658203125, -0.99420166015625, -0.894378662109375, -0.7945556640625, -0.694732666015625, -0.59490966796875, -0.495086669921875, -0.395263671875, -0.295440673828125, -0.19561767578125, -0.095794677734375, 0.0040283203125, 0.103851318359375, 0.20367431640625, 0.303497314453125, 0.4033203125, 0.503143310546875, 0.60296630859375, 0.702789306640625, 0.8026123046875, 0.902435302734375, 1.00225830078125, 1.102081298828125, 1.201904296875, 1.301727294921875, 1.40155029296875, 1.501373291015625, 1.6011962890625, 1.701019287109375, 1.80084228515625, 1.900665283203125, 2.00048828125, 2.100311279296875, 2.20013427734375, 2.299957275390625, 2.3997802734375, 2.499603271484375, 2.59942626953125, 2.699249267578125, 2.799072265625, 2.898895263671875, 2.99871826171875, 3.098541259765625, 3.1983642578125, 3.298187255859375, 3.39801025390625, 3.497833251953125, 3.59765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 10.0, 15.0, 11.0, 22.0, 19.0, 37.0, 43.0, 28.0, 28.0, 68.0, 67.0, 74.0, 128.0, 213.0, 1423.0, 262.0, 151.0, 64.0, 63.0, 55.0, 31.0, 21.0, 31.0, 30.0, 23.0, 27.0, 17.0, 12.0, 16.0, 9.0, 6.0, 4.0, 4.0, 7.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.80859375, -5.64605712890625, -5.4835205078125, -5.32098388671875, -5.158447265625, -4.99591064453125, -4.8333740234375, -4.67083740234375, -4.50830078125, -4.34576416015625, -4.1832275390625, -4.02069091796875, -3.858154296875, -3.69561767578125, -3.5330810546875, -3.37054443359375, -3.2080078125, -3.04547119140625, -2.8829345703125, -2.72039794921875, -2.557861328125, -2.39532470703125, -2.2327880859375, -2.07025146484375, -1.90771484375, -1.74517822265625, -1.5826416015625, -1.42010498046875, -1.257568359375, -1.09503173828125, -0.9324951171875, -0.76995849609375, -0.607421875, -0.44488525390625, -0.2823486328125, -0.11981201171875, 0.042724609375, 0.20526123046875, 0.3677978515625, 0.53033447265625, 0.69287109375, 0.85540771484375, 1.0179443359375, 1.18048095703125, 1.343017578125, 1.50555419921875, 1.6680908203125, 1.83062744140625, 1.9931640625, 2.15570068359375, 2.3182373046875, 2.48077392578125, 2.643310546875, 2.80584716796875, 2.9683837890625, 3.13092041015625, 3.29345703125, 3.45599365234375, 3.6185302734375, 3.78106689453125, 3.943603515625, 4.10614013671875, 4.2686767578125, 4.43121337890625, 4.59375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 10.0, 17.0, 10.0, 22.0, 29.0, 40.0, 37.0, 77.0, 80.0, 103.0, 135.0, 156.0, 324.0, 761.0, 3720.0, 48759.0, 2769228.0, 310006.0, 9340.0, 1428.0, 482.0, 248.0, 179.0, 136.0, 87.0, 63.0, 40.0, 53.0, 31.0, 17.0, 20.0, 12.0, 12.0, 14.0, 5.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.0897216796875, -8.773193359375, -8.4566650390625, -8.14013671875, -7.8236083984375, -7.507080078125, -7.1905517578125, -6.8740234375, -6.5574951171875, -6.240966796875, -5.9244384765625, -5.60791015625, -5.2913818359375, -4.974853515625, -4.6583251953125, -4.341796875, -4.0252685546875, -3.708740234375, -3.3922119140625, -3.07568359375, -2.7591552734375, -2.442626953125, -2.1260986328125, -1.8095703125, -1.4930419921875, -1.176513671875, -0.8599853515625, -0.54345703125, -0.2269287109375, 0.089599609375, 0.4061279296875, 0.72265625, 1.0391845703125, 1.355712890625, 1.6722412109375, 1.98876953125, 2.3052978515625, 2.621826171875, 2.9383544921875, 3.2548828125, 3.5714111328125, 3.887939453125, 4.2044677734375, 4.52099609375, 4.8375244140625, 5.154052734375, 5.4705810546875, 5.787109375, 6.1036376953125, 6.420166015625, 6.7366943359375, 7.05322265625, 7.3697509765625, 7.686279296875, 8.0028076171875, 8.3193359375, 8.6358642578125, 8.952392578125, 9.2689208984375, 9.58544921875, 9.9019775390625, 10.218505859375, 10.5350341796875, 10.8515625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 90.0, 697.0, 216.0, 12.0], "bins": [-134.36468505859375, -132.18492126464844, -130.00514221191406, -127.82537841796875, -125.64561462402344, -123.4658432006836, -121.28607940673828, -119.10630798339844, -116.92654418945312, -114.74677276611328, -112.56700897216797, -110.38723754882812, -108.20747375488281, -106.02770233154297, -103.84793853759766, -101.66816711425781, -99.48839569091797, -97.30862426757812, -95.12886047363281, -92.94908905029297, -90.76932525634766, -88.58955383300781, -86.4097900390625, -84.23001861572266, -82.05024719238281, -79.87047576904297, -77.69071197509766, -75.51094055175781, -73.3311767578125, -71.15140533447266, -68.97164154052734, -66.7918701171875, -64.61210632324219, -62.43233871459961, -60.25257110595703, -58.07280349731445, -55.893035888671875, -53.71326446533203, -51.53349685668945, -49.353729248046875, -47.17395782470703, -44.99419021606445, -42.814422607421875, -40.6346549987793, -38.45488739013672, -36.275115966796875, -34.0953483581543, -31.91558074951172, -29.735815048217773, -27.556047439575195, -25.376277923583984, -23.196510314941406, -21.016742706298828, -18.83697509765625, -16.657207489013672, -14.477437973022461, -12.297670364379883, -10.117902755737305, -7.93813419342041, -5.758366107940674, -3.5785980224609375, -1.3988304138183594, 0.7809381484985352, 2.9607067108154297, 5.140474319458008]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 9.0, 7.0, 9.0, 10.0, 18.0, 13.0, 12.0, 13.0, 25.0, 29.0, 36.0, 27.0, 31.0, 35.0, 41.0, 42.0, 28.0, 35.0, 49.0, 45.0, 39.0, 41.0, 42.0, 30.0, 50.0, 36.0, 31.0, 37.0, 20.0, 23.0, 22.0, 12.0, 15.0, 24.0, 11.0, 9.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.524447441101074, -13.106252670288086, -12.688056945800781, -12.269862174987793, -11.851666450500488, -11.4334716796875, -11.015275955200195, -10.597081184387207, -10.178886413574219, -9.76069164276123, -9.342495918273926, -8.924301147460938, -8.506105422973633, -8.087910652160645, -7.669715404510498, -7.251520156860352, -6.833324909210205, -6.415129661560059, -5.996934413909912, -5.578739166259766, -5.160544395446777, -4.742349147796631, -4.324153900146484, -3.905958890914917, -3.4877636432647705, -3.069568395614624, -2.6513733863830566, -2.23317813873291, -1.8149830102920532, -1.3967878818511963, -0.9785926342010498, -0.5603976249694824, -0.14220237731933594, 0.2759927809238434, 0.6941879391670227, 1.1123831272125244, 1.5305782556533813, 1.9487733840942383, 2.3669686317443848, 2.785163640975952, 3.2033588886260986, 3.621554136276245, 4.0397491455078125, 4.457944393157959, 4.8761396408081055, 5.294334411621094, 5.712530136108398, 6.130724906921387, 6.548920154571533, 6.96711540222168, 7.385310649871826, 7.803505897521973, 8.221700668334961, 8.639896392822266, 9.058091163635254, 9.476285934448242, 9.894481658935547, 10.312676429748535, 10.73087215423584, 11.149066925048828, 11.567262649536133, 11.985457420349121, 12.40365219116211, 12.821847915649414, 13.240042686462402]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 13.0, 12.0, 15.0, 15.0, 27.0, 44.0, 37.0, 38.0, 50.0, 63.0, 55.0, 62.0, 58.0, 58.0, 53.0, 54.0, 71.0, 62.0, 26.0, 39.0, 28.0, 29.0, 17.0, 17.0, 19.0, 14.0, 5.0, 5.0, 9.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0], "bins": [-2.966796875, -2.8966064453125, -2.826416015625, -2.7562255859375, -2.68603515625, -2.6158447265625, -2.545654296875, -2.4754638671875, -2.4052734375, -2.3350830078125, -2.264892578125, -2.1947021484375, -2.12451171875, -2.0543212890625, -1.984130859375, -1.9139404296875, -1.84375, -1.7735595703125, -1.703369140625, -1.6331787109375, -1.56298828125, -1.4927978515625, -1.422607421875, -1.3524169921875, -1.2822265625, -1.2120361328125, -1.141845703125, -1.0716552734375, -1.00146484375, -0.9312744140625, -0.861083984375, -0.7908935546875, -0.720703125, -0.6505126953125, -0.580322265625, -0.5101318359375, -0.43994140625, -0.3697509765625, -0.299560546875, -0.2293701171875, -0.1591796875, -0.0889892578125, -0.018798828125, 0.0513916015625, 0.12158203125, 0.1917724609375, 0.261962890625, 0.3321533203125, 0.40234375, 0.4725341796875, 0.542724609375, 0.6129150390625, 0.68310546875, 0.7532958984375, 0.823486328125, 0.8936767578125, 0.9638671875, 1.0340576171875, 1.104248046875, 1.1744384765625, 1.24462890625, 1.3148193359375, 1.385009765625, 1.4552001953125, 1.525390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 16.0, 27.0, 37.0, 51.0, 114.0, 179.0, 333.0, 598.0, 1283.0, 2831.0, 6708.0, 19174.0, 74847.0, 624383.0, 2866093.0, 498922.0, 67850.0, 18894.0, 6712.0, 2723.0, 1237.0, 571.0, 306.0, 162.0, 82.0, 38.0, 35.0, 24.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.82867431640625, -4.6925048828125, -4.55633544921875, -4.420166015625, -4.28399658203125, -4.1478271484375, -4.01165771484375, -3.87548828125, -3.73931884765625, -3.6031494140625, -3.46697998046875, -3.330810546875, -3.19464111328125, -3.0584716796875, -2.92230224609375, -2.7861328125, -2.64996337890625, -2.5137939453125, -2.37762451171875, -2.241455078125, -2.10528564453125, -1.9691162109375, -1.83294677734375, -1.69677734375, -1.56060791015625, -1.4244384765625, -1.28826904296875, -1.152099609375, -1.01593017578125, -0.8797607421875, -0.74359130859375, -0.607421875, -0.47125244140625, -0.3350830078125, -0.19891357421875, -0.062744140625, 0.07342529296875, 0.2095947265625, 0.34576416015625, 0.48193359375, 0.61810302734375, 0.7542724609375, 0.89044189453125, 1.026611328125, 1.16278076171875, 1.2989501953125, 1.43511962890625, 1.5712890625, 1.70745849609375, 1.8436279296875, 1.97979736328125, 2.115966796875, 2.25213623046875, 2.3883056640625, 2.52447509765625, 2.66064453125, 2.79681396484375, 2.9329833984375, 3.06915283203125, 3.205322265625, 3.34149169921875, 3.4776611328125, 3.61383056640625, 3.75]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 3.0, 11.0, 8.0, 9.0, 12.0, 22.0, 25.0, 23.0, 55.0, 39.0, 60.0, 73.0, 116.0, 159.0, 208.0, 302.0, 445.0, 535.0, 538.0, 385.0, 272.0, 201.0, 138.0, 100.0, 86.0, 49.0, 36.0, 41.0, 25.0, 25.0, 11.0, 13.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-3.689453125, -3.58660888671875, -3.4837646484375, -3.38092041015625, -3.278076171875, -3.17523193359375, -3.0723876953125, -2.96954345703125, -2.86669921875, -2.76385498046875, -2.6610107421875, -2.55816650390625, -2.455322265625, -2.35247802734375, -2.2496337890625, -2.14678955078125, -2.0439453125, -1.94110107421875, -1.8382568359375, -1.73541259765625, -1.632568359375, -1.52972412109375, -1.4268798828125, -1.32403564453125, -1.22119140625, -1.11834716796875, -1.0155029296875, -0.91265869140625, -0.809814453125, -0.70697021484375, -0.6041259765625, -0.50128173828125, -0.3984375, -0.29559326171875, -0.1927490234375, -0.08990478515625, 0.012939453125, 0.11578369140625, 0.2186279296875, 0.32147216796875, 0.42431640625, 0.52716064453125, 0.6300048828125, 0.73284912109375, 0.835693359375, 0.93853759765625, 1.0413818359375, 1.14422607421875, 1.2470703125, 1.34991455078125, 1.4527587890625, 1.55560302734375, 1.658447265625, 1.76129150390625, 1.8641357421875, 1.96697998046875, 2.06982421875, 2.17266845703125, 2.2755126953125, 2.37835693359375, 2.481201171875, 2.58404541015625, 2.6868896484375, 2.78973388671875, 2.892578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 12.0, 15.0, 26.0, 22.0, 35.0, 56.0, 63.0, 101.0, 180.0, 306.0, 613.0, 1430.0, 5770.0, 36065.0, 530053.0, 3423588.0, 172690.0, 17536.0, 3443.0, 1094.0, 410.0, 244.0, 157.0, 89.0, 70.0, 40.0, 35.0, 31.0, 16.0, 16.0, 6.0, 10.0, 11.0, 4.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3046875, -8.011474609375, -7.71826171875, -7.425048828125, -7.1318359375, -6.838623046875, -6.54541015625, -6.252197265625, -5.958984375, -5.665771484375, -5.37255859375, -5.079345703125, -4.7861328125, -4.492919921875, -4.19970703125, -3.906494140625, -3.61328125, -3.320068359375, -3.02685546875, -2.733642578125, -2.4404296875, -2.147216796875, -1.85400390625, -1.560791015625, -1.267578125, -0.974365234375, -0.68115234375, -0.387939453125, -0.0947265625, 0.198486328125, 0.49169921875, 0.784912109375, 1.078125, 1.371337890625, 1.66455078125, 1.957763671875, 2.2509765625, 2.544189453125, 2.83740234375, 3.130615234375, 3.423828125, 3.717041015625, 4.01025390625, 4.303466796875, 4.5966796875, 4.889892578125, 5.18310546875, 5.476318359375, 5.76953125, 6.062744140625, 6.35595703125, 6.649169921875, 6.9423828125, 7.235595703125, 7.52880859375, 7.822021484375, 8.115234375, 8.408447265625, 8.70166015625, 8.994873046875, 9.2880859375, 9.581298828125, 9.87451171875, 10.167724609375, 10.4609375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 20.0, 46.0, 91.0, 180.0, 235.0, 205.0, 120.0, 62.0, 28.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.397518157958984, -32.31162643432617, -31.22573471069336, -30.139842987060547, -29.053951263427734, -27.968059539794922, -26.88216781616211, -25.796276092529297, -24.710384368896484, -23.624492645263672, -22.53860092163086, -21.452709197998047, -20.366817474365234, -19.280925750732422, -18.19503402709961, -17.109142303466797, -16.023250579833984, -14.937358856201172, -13.85146713256836, -12.765575408935547, -11.679683685302734, -10.593791961669922, -9.50790023803711, -8.422008514404297, -7.336116790771484, -6.250225067138672, -5.164333343505859, -4.078441619873047, -2.9925498962402344, -1.9066581726074219, -0.8207664489746094, 0.2651252746582031, 1.3510169982910156, 2.436908721923828, 3.5228004455566406, 4.608692169189453, 5.694583892822266, 6.780475616455078, 7.866367340087891, 8.952259063720703, 10.038150787353516, 11.124042510986328, 12.20993423461914, 13.295825958251953, 14.381717681884766, 15.467609405517578, 16.55350112915039, 17.639392852783203, 18.725284576416016, 19.811176300048828, 20.89706802368164, 21.982959747314453, 23.068851470947266, 24.154743194580078, 25.24063491821289, 26.326526641845703, 27.412418365478516, 28.498310089111328, 29.58420181274414, 30.670093536376953, 31.755985260009766, 32.84187698364258, 33.92776870727539, 35.0136604309082, 36.099552154541016]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 16.0, 12.0, 7.0, 14.0, 22.0, 30.0, 22.0, 29.0, 36.0, 40.0, 40.0, 49.0, 47.0, 56.0, 44.0, 54.0, 59.0, 55.0, 49.0, 34.0, 51.0, 44.0, 33.0, 33.0, 25.0, 19.0, 23.0, 16.0, 8.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.893991470336914, -16.441286087036133, -15.988581657409668, -15.535876274108887, -15.083171844482422, -14.63046646118164, -14.17776107788086, -13.725056648254395, -13.272351264953613, -12.819645881652832, -12.366941452026367, -11.914236068725586, -11.461531639099121, -11.00882625579834, -10.556121826171875, -10.103416442871094, -9.650711059570312, -9.198005676269531, -8.745301246643066, -8.292595863342285, -7.839890956878662, -7.387186050415039, -6.934481143951416, -6.481776237487793, -6.029071807861328, -5.576366901397705, -5.123661994934082, -4.670956611633301, -4.218251705169678, -3.7655467987060547, -3.3128418922424316, -2.8601367473602295, -2.4074316024780273, -1.9547265768051147, -1.5020215511322021, -1.049316644668579, -0.5966116189956665, -0.1439065933227539, 0.30879831314086914, 0.7615034580230713, 1.2142083644866943, 1.666913390159607, 2.1196184158325195, 2.5723233222961426, 3.0250282287597656, 3.4777333736419678, 3.930438280105591, 4.383143424987793, 4.835848331451416, 5.288553237915039, 5.741258144378662, 6.193963050842285, 6.646668434143066, 7.0993733406066895, 7.5520782470703125, 8.004783630371094, 8.457488059997559, 8.91019344329834, 9.362897872924805, 9.815603256225586, 10.26830768585205, 10.721013069152832, 11.173717498779297, 11.626422882080078, 12.07912826538086]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 14.0, 19.0, 28.0, 30.0, 36.0, 33.0, 54.0, 45.0, 55.0, 55.0, 70.0, 55.0, 58.0, 46.0, 68.0, 44.0, 53.0, 40.0, 34.0, 36.0, 22.0, 19.0, 17.0, 17.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.5405731201171875, -2.473724365234375, -2.4068756103515625, -2.34002685546875, -2.2731781005859375, -2.206329345703125, -2.1394805908203125, -2.0726318359375, -2.0057830810546875, -1.938934326171875, -1.8720855712890625, -1.80523681640625, -1.7383880615234375, -1.671539306640625, -1.6046905517578125, -1.537841796875, -1.4709930419921875, -1.404144287109375, -1.3372955322265625, -1.27044677734375, -1.2035980224609375, -1.136749267578125, -1.0699005126953125, -1.0030517578125, -0.9362030029296875, -0.869354248046875, -0.8025054931640625, -0.73565673828125, -0.6688079833984375, -0.601959228515625, -0.5351104736328125, -0.46826171875, -0.4014129638671875, -0.334564208984375, -0.2677154541015625, -0.20086669921875, -0.1340179443359375, -0.067169189453125, -0.0003204345703125, 0.0665283203125, 0.1333770751953125, 0.200225830078125, 0.2670745849609375, 0.33392333984375, 0.4007720947265625, 0.467620849609375, 0.5344696044921875, 0.601318359375, 0.6681671142578125, 0.735015869140625, 0.8018646240234375, 0.86871337890625, 0.9355621337890625, 1.002410888671875, 1.0692596435546875, 1.1361083984375, 1.2029571533203125, 1.269805908203125, 1.3366546630859375, 1.40350341796875, 1.4703521728515625, 1.537200927734375, 1.6040496826171875, 1.6708984375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 11.0, 11.0, 21.0, 21.0, 50.0, 76.0, 90.0, 155.0, 244.0, 374.0, 670.0, 1070.0, 1974.0, 3733.0, 7343.0, 15197.0, 32493.0, 69858.0, 144586.0, 246136.0, 245936.0, 144736.0, 70301.0, 32589.0, 15184.0, 7248.0, 3610.0, 1995.0, 1122.0, 620.0, 374.0, 240.0, 157.0, 92.0, 79.0, 55.0, 29.0, 23.0, 19.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1416015625, -1.105926513671875, -1.07025146484375, -1.034576416015625, -0.9989013671875, -0.963226318359375, -0.92755126953125, -0.891876220703125, -0.856201171875, -0.820526123046875, -0.78485107421875, -0.749176025390625, -0.7135009765625, -0.677825927734375, -0.64215087890625, -0.606475830078125, -0.57080078125, -0.535125732421875, -0.49945068359375, -0.463775634765625, -0.4281005859375, -0.392425537109375, -0.35675048828125, -0.321075439453125, -0.285400390625, -0.249725341796875, -0.21405029296875, -0.178375244140625, -0.1427001953125, -0.107025146484375, -0.07135009765625, -0.035675048828125, 0.0, 0.035675048828125, 0.07135009765625, 0.107025146484375, 0.1427001953125, 0.178375244140625, 0.21405029296875, 0.249725341796875, 0.285400390625, 0.321075439453125, 0.35675048828125, 0.392425537109375, 0.4281005859375, 0.463775634765625, 0.49945068359375, 0.535125732421875, 0.57080078125, 0.606475830078125, 0.64215087890625, 0.677825927734375, 0.7135009765625, 0.749176025390625, 0.78485107421875, 0.820526123046875, 0.856201171875, 0.891876220703125, 0.92755126953125, 0.963226318359375, 0.9989013671875, 1.034576416015625, 1.07025146484375, 1.105926513671875, 1.1416015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 1.0, 17.0, 5.0, 15.0, 12.0, 15.0, 11.0, 19.0, 16.0, 23.0, 30.0, 26.0, 43.0, 40.0, 42.0, 47.0, 46.0, 34.0, 1067.0, 54.0, 41.0, 32.0, 43.0, 28.0, 37.0, 43.0, 25.0, 26.0, 38.0, 26.0, 22.0, 21.0, 16.0, 10.0, 14.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.226226806640625, -1.18389892578125, -1.141571044921875, -1.0992431640625, -1.056915283203125, -1.01458740234375, -0.972259521484375, -0.929931640625, -0.887603759765625, -0.84527587890625, -0.802947998046875, -0.7606201171875, -0.718292236328125, -0.67596435546875, -0.633636474609375, -0.59130859375, -0.548980712890625, -0.50665283203125, -0.464324951171875, -0.4219970703125, -0.379669189453125, -0.33734130859375, -0.295013427734375, -0.252685546875, -0.210357666015625, -0.16802978515625, -0.125701904296875, -0.0833740234375, -0.041046142578125, 0.00128173828125, 0.043609619140625, 0.0859375, 0.128265380859375, 0.17059326171875, 0.212921142578125, 0.2552490234375, 0.297576904296875, 0.33990478515625, 0.382232666015625, 0.424560546875, 0.466888427734375, 0.50921630859375, 0.551544189453125, 0.5938720703125, 0.636199951171875, 0.67852783203125, 0.720855712890625, 0.76318359375, 0.805511474609375, 0.84783935546875, 0.890167236328125, 0.9324951171875, 0.974822998046875, 1.01715087890625, 1.059478759765625, 1.101806640625, 1.144134521484375, 1.18646240234375, 1.228790283203125, 1.2711181640625, 1.313446044921875, 1.35577392578125, 1.398101806640625, 1.4404296875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 14.0, 19.0, 22.0, 33.0, 37.0, 58.0, 92.0, 159.0, 196.0, 308.0, 419.0, 674.0, 956.0, 1361.0, 2142.0, 3104.0, 4850.0, 7674.0, 12469.0, 21644.0, 48651.0, 285415.0, 1514618.0, 113467.0, 32843.0, 17030.0, 10130.0, 6392.0, 4076.0, 2724.0, 1856.0, 1211.0, 809.0, 536.0, 360.0, 238.0, 156.0, 113.0, 99.0, 51.0, 33.0, 29.0, 19.0, 18.0, 4.0, 8.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.099609375, -1.0675430297851562, -1.0354766845703125, -1.0034103393554688, -0.971343994140625, -0.9392776489257812, -0.9072113037109375, -0.8751449584960938, -0.84307861328125, -0.8110122680664062, -0.7789459228515625, -0.7468795776367188, -0.714813232421875, -0.6827468872070312, -0.6506805419921875, -0.6186141967773438, -0.5865478515625, -0.5544815063476562, -0.5224151611328125, -0.49034881591796875, -0.458282470703125, -0.42621612548828125, -0.3941497802734375, -0.36208343505859375, -0.33001708984375, -0.29795074462890625, -0.2658843994140625, -0.23381805419921875, -0.201751708984375, -0.16968536376953125, -0.1376190185546875, -0.10555267333984375, -0.073486328125, -0.04141998291015625, -0.0093536376953125, 0.02271270751953125, 0.054779052734375, 0.08684539794921875, 0.1189117431640625, 0.15097808837890625, 0.18304443359375, 0.21511077880859375, 0.2471771240234375, 0.27924346923828125, 0.311309814453125, 0.34337615966796875, 0.3754425048828125, 0.40750885009765625, 0.4395751953125, 0.47164154052734375, 0.5037078857421875, 0.5357742309570312, 0.567840576171875, 0.5999069213867188, 0.6319732666015625, 0.6640396118164062, 0.69610595703125, 0.7281723022460938, 0.7602386474609375, 0.7923049926757812, 0.824371337890625, 0.8564376831054688, 0.8885040283203125, 0.9205703735351562, 0.95263671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 16.0, 32.0, 42.0, 48.0, 98.0, 110.0, 163.0, 146.0, 112.0, 75.0, 51.0, 25.0, 25.0, 17.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.258544921875, -0.25188255310058594, -0.24522018432617188, -0.2385578155517578, -0.23189544677734375, -0.2252330780029297, -0.21857070922851562, -0.21190834045410156, -0.2052459716796875, -0.19858360290527344, -0.19192123413085938, -0.1852588653564453, -0.17859649658203125, -0.1719341278076172, -0.16527175903320312, -0.15860939025878906, -0.151947021484375, -0.14528465270996094, -0.13862228393554688, -0.1319599151611328, -0.12529754638671875, -0.11863517761230469, -0.11197280883789062, -0.10531044006347656, -0.0986480712890625, -0.09198570251464844, -0.08532333374023438, -0.07866096496582031, -0.07199859619140625, -0.06533622741699219, -0.058673858642578125, -0.05201148986816406, -0.04534912109375, -0.03868675231933594, -0.032024383544921875, -0.025362014770507812, -0.01869964599609375, -0.012037277221679688, -0.005374908447265625, 0.0012874603271484375, 0.0079498291015625, 0.014612197875976562, 0.021274566650390625, 0.027936935424804688, 0.03459930419921875, 0.04126167297363281, 0.047924041748046875, 0.05458641052246094, 0.061248779296875, 0.06791114807128906, 0.07457351684570312, 0.08123588562011719, 0.08789825439453125, 0.09456062316894531, 0.10122299194335938, 0.10788536071777344, 0.1145477294921875, 0.12121009826660156, 0.12787246704101562, 0.1345348358154297, 0.14119720458984375, 0.1478595733642578, 0.15452194213867188, 0.16118431091308594, 0.1678466796875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 13.0, 21.0, 33.0, 43.0, 95.0, 200.0, 1350.0, 883465.0, 162181.0, 765.0, 159.0, 84.0, 47.0, 33.0, 20.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.6171875, -3.47760009765625, -3.3380126953125, -3.19842529296875, -3.058837890625, -2.91925048828125, -2.7796630859375, -2.64007568359375, -2.50048828125, -2.36090087890625, -2.2213134765625, -2.08172607421875, -1.942138671875, -1.80255126953125, -1.6629638671875, -1.52337646484375, -1.3837890625, -1.24420166015625, -1.1046142578125, -0.96502685546875, -0.825439453125, -0.68585205078125, -0.5462646484375, -0.40667724609375, -0.26708984375, -0.12750244140625, 0.0120849609375, 0.15167236328125, 0.291259765625, 0.43084716796875, 0.5704345703125, 0.71002197265625, 0.849609375, 0.98919677734375, 1.1287841796875, 1.26837158203125, 1.407958984375, 1.54754638671875, 1.6871337890625, 1.82672119140625, 1.96630859375, 2.10589599609375, 2.2454833984375, 2.38507080078125, 2.524658203125, 2.66424560546875, 2.8038330078125, 2.94342041015625, 3.0830078125, 3.22259521484375, 3.3621826171875, 3.50177001953125, 3.641357421875, 3.78094482421875, 3.9205322265625, 4.06011962890625, 4.19970703125, 4.33929443359375, 4.4788818359375, 4.61846923828125, 4.758056640625, 4.89764404296875, 5.0372314453125, 5.17681884765625, 5.31640625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 21.0, 76.0, 231.0, 431.0, 175.0, 46.0, 19.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8177696466445923, -1.763284683227539, -1.7087998390197754, -1.6543148756027222, -1.599829912185669, -1.5453450679779053, -1.490860104560852, -1.4363751411437988, -1.3818902969360352, -1.327405333518982, -1.2729204893112183, -1.218435525894165, -1.1639506816864014, -1.1094657182693481, -1.054980754852295, -1.0004959106445312, -0.946010947227478, -0.8915260434150696, -0.8370411396026611, -0.7825561761856079, -0.7280712723731995, -0.673586368560791, -0.6191014051437378, -0.5646165013313293, -0.5101315975189209, -0.45564669370651245, -0.4011617600917816, -0.3466768264770508, -0.29219192266464233, -0.2377070188522339, -0.18322208523750305, -0.12873715162277222, -0.07425224781036377, -0.01976732909679413, 0.03471758961677551, 0.08920250833034515, 0.1436874270439148, 0.19817233085632324, 0.2526572644710541, 0.3071421980857849, 0.36162710189819336, 0.4161120057106018, 0.47059693932533264, 0.5250818729400635, 0.5795667767524719, 0.6340516805648804, 0.6885366439819336, 0.743021547794342, 0.7975064516067505, 0.8519913554191589, 0.9064762592315674, 0.9609612226486206, 1.0154461860656738, 1.0699310302734375, 1.1244159936904907, 1.178900957107544, 1.2333858013153076, 1.2878707647323608, 1.3423556089401245, 1.3968405723571777, 1.4513254165649414, 1.5058103799819946, 1.5602953433990479, 1.6147801876068115, 1.6692651510238647]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 8.0, 6.0, 13.0, 9.0, 19.0, 31.0, 23.0, 36.0, 50.0, 40.0, 41.0, 58.0, 51.0, 54.0, 56.0, 41.0, 49.0, 47.0, 52.0, 48.0, 53.0, 37.0, 35.0, 24.0, 21.0, 24.0, 17.0, 11.0, 8.0, 9.0, 11.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4721947908401489, -0.4602656066417694, -0.4483364224433899, -0.43640726804733276, -0.42447808384895325, -0.41254889965057373, -0.4006197452545166, -0.3886905610561371, -0.37676137685775757, -0.36483219265937805, -0.35290300846099854, -0.3409738540649414, -0.3290446698665619, -0.3171154856681824, -0.30518633127212524, -0.2932571470737457, -0.2813279628753662, -0.2693987786769867, -0.2574695944786072, -0.24554044008255005, -0.23361125588417053, -0.22168207168579102, -0.2097529023885727, -0.19782373309135437, -0.18589454889297485, -0.17396536469459534, -0.16203619539737701, -0.1501070261001587, -0.13817784190177917, -0.12624865770339966, -0.11431948840618134, -0.10239031165838242, -0.0904611349105835, -0.07853195816278458, -0.06660278141498566, -0.05467360466718674, -0.04274442791938782, -0.030815251171588898, -0.018886074423789978, -0.006956897675991058, 0.004972279071807861, 0.01690145581960678, 0.0288306325674057, 0.04075980931520462, 0.05268898606300354, 0.06461816281080246, 0.07654733955860138, 0.0884765163064003, 0.10040569305419922, 0.11233486980199814, 0.12426404654979706, 0.13619321584701538, 0.1481224000453949, 0.16005158424377441, 0.17198075354099274, 0.18390992283821106, 0.19583910703659058, 0.2077682912349701, 0.21969746053218842, 0.23162662982940674, 0.24355581402778625, 0.25548499822616577, 0.2674141526222229, 0.2793433368206024, 0.29127252101898193]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 12.0, 11.0, 14.0, 11.0, 14.0, 22.0, 22.0, 34.0, 23.0, 40.0, 40.0, 45.0, 47.0, 50.0, 49.0, 37.0, 43.0, 41.0, 32.0, 47.0, 53.0, 34.0, 33.0, 36.0, 33.0, 31.0, 25.0, 19.0, 25.0, 11.0, 8.0, 11.0, 11.0, 11.0, 3.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.8046875, -1.752716064453125, -1.70074462890625, -1.648773193359375, -1.5968017578125, -1.544830322265625, -1.49285888671875, -1.440887451171875, -1.388916015625, -1.336944580078125, -1.28497314453125, -1.233001708984375, -1.1810302734375, -1.129058837890625, -1.07708740234375, -1.025115966796875, -0.97314453125, -0.921173095703125, -0.86920166015625, -0.817230224609375, -0.7652587890625, -0.713287353515625, -0.66131591796875, -0.609344482421875, -0.557373046875, -0.505401611328125, -0.45343017578125, -0.401458740234375, -0.3494873046875, -0.297515869140625, -0.24554443359375, -0.193572998046875, -0.1416015625, -0.089630126953125, -0.03765869140625, 0.014312744140625, 0.0662841796875, 0.118255615234375, 0.17022705078125, 0.222198486328125, 0.274169921875, 0.326141357421875, 0.37811279296875, 0.430084228515625, 0.4820556640625, 0.534027099609375, 0.58599853515625, 0.637969970703125, 0.68994140625, 0.741912841796875, 0.79388427734375, 0.845855712890625, 0.8978271484375, 0.949798583984375, 1.00177001953125, 1.053741455078125, 1.105712890625, 1.157684326171875, 1.20965576171875, 1.261627197265625, 1.3135986328125, 1.365570068359375, 1.41754150390625, 1.469512939453125, 1.521484375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 18.0, 21.0, 37.0, 54.0, 71.0, 126.0, 204.0, 304.0, 478.0, 794.0, 1293.0, 2252.0, 4269.0, 8160.0, 18303.0, 47086.0, 152110.0, 459404.0, 236343.0, 69653.0, 24676.0, 10687.0, 5278.0, 2790.0, 1626.0, 929.0, 572.0, 370.0, 232.0, 144.0, 89.0, 54.0, 33.0, 22.0, 22.0, 22.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.259765625, -2.175048828125, -2.09033203125, -2.005615234375, -1.9208984375, -1.836181640625, -1.75146484375, -1.666748046875, -1.58203125, -1.497314453125, -1.41259765625, -1.327880859375, -1.2431640625, -1.158447265625, -1.07373046875, -0.989013671875, -0.904296875, -0.819580078125, -0.73486328125, -0.650146484375, -0.5654296875, -0.480712890625, -0.39599609375, -0.311279296875, -0.2265625, -0.141845703125, -0.05712890625, 0.027587890625, 0.1123046875, 0.197021484375, 0.28173828125, 0.366455078125, 0.451171875, 0.535888671875, 0.62060546875, 0.705322265625, 0.7900390625, 0.874755859375, 0.95947265625, 1.044189453125, 1.12890625, 1.213623046875, 1.29833984375, 1.383056640625, 1.4677734375, 1.552490234375, 1.63720703125, 1.721923828125, 1.806640625, 1.891357421875, 1.97607421875, 2.060791015625, 2.1455078125, 2.230224609375, 2.31494140625, 2.399658203125, 2.484375, 2.569091796875, 2.65380859375, 2.738525390625, 2.8232421875, 2.907958984375, 2.99267578125, 3.077392578125, 3.162109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 13.0, 12.0, 11.0, 19.0, 17.0, 24.0, 21.0, 31.0, 37.0, 40.0, 28.0, 41.0, 71.0, 112.0, 145.0, 276.0, 1375.0, 217.0, 132.0, 61.0, 59.0, 42.0, 39.0, 33.0, 28.0, 27.0, 17.0, 27.0, 16.0, 14.0, 9.0, 4.0, 7.0, 7.0, 9.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.15234375, -5.9727783203125, -5.793212890625, -5.6136474609375, -5.43408203125, -5.2545166015625, -5.074951171875, -4.8953857421875, -4.7158203125, -4.5362548828125, -4.356689453125, -4.1771240234375, -3.99755859375, -3.8179931640625, -3.638427734375, -3.4588623046875, -3.279296875, -3.0997314453125, -2.920166015625, -2.7406005859375, -2.56103515625, -2.3814697265625, -2.201904296875, -2.0223388671875, -1.8427734375, -1.6632080078125, -1.483642578125, -1.3040771484375, -1.12451171875, -0.9449462890625, -0.765380859375, -0.5858154296875, -0.40625, -0.2266845703125, -0.047119140625, 0.1324462890625, 0.31201171875, 0.4915771484375, 0.671142578125, 0.8507080078125, 1.0302734375, 1.2098388671875, 1.389404296875, 1.5689697265625, 1.74853515625, 1.9281005859375, 2.107666015625, 2.2872314453125, 2.466796875, 2.6463623046875, 2.825927734375, 3.0054931640625, 3.18505859375, 3.3646240234375, 3.544189453125, 3.7237548828125, 3.9033203125, 4.0828857421875, 4.262451171875, 4.4420166015625, 4.62158203125, 4.8011474609375, 4.980712890625, 5.1602783203125, 5.33984375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 19.0, 16.0, 17.0, 30.0, 30.0, 56.0, 59.0, 61.0, 99.0, 174.0, 264.0, 493.0, 1300.0, 4972.0, 32624.0, 2197296.0, 880498.0, 21539.0, 3777.0, 1061.0, 457.0, 230.0, 164.0, 97.0, 82.0, 59.0, 46.0, 37.0, 26.0, 27.0, 22.0, 10.0, 9.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5625, -12.1920166015625, -11.821533203125, -11.4510498046875, -11.08056640625, -10.7100830078125, -10.339599609375, -9.9691162109375, -9.5986328125, -9.2281494140625, -8.857666015625, -8.4871826171875, -8.11669921875, -7.7462158203125, -7.375732421875, -7.0052490234375, -6.634765625, -6.2642822265625, -5.893798828125, -5.5233154296875, -5.15283203125, -4.7823486328125, -4.411865234375, -4.0413818359375, -3.6708984375, -3.3004150390625, -2.929931640625, -2.5594482421875, -2.18896484375, -1.8184814453125, -1.447998046875, -1.0775146484375, -0.70703125, -0.3365478515625, 0.033935546875, 0.4044189453125, 0.77490234375, 1.1453857421875, 1.515869140625, 1.8863525390625, 2.2568359375, 2.6273193359375, 2.997802734375, 3.3682861328125, 3.73876953125, 4.1092529296875, 4.479736328125, 4.8502197265625, 5.220703125, 5.5911865234375, 5.961669921875, 6.3321533203125, 6.70263671875, 7.0731201171875, 7.443603515625, 7.8140869140625, 8.1845703125, 8.5550537109375, 8.925537109375, 9.2960205078125, 9.66650390625, 10.0369873046875, 10.407470703125, 10.7779541015625, 11.1484375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 22.0, 719.0, 273.0, 4.0, 1.0, 1.0], "bins": [-201.0170440673828, -197.65365600585938, -194.29025268554688, -190.92686462402344, -187.5634765625, -184.2000732421875, -180.83668518066406, -177.47328186035156, -174.10989379882812, -170.7465057373047, -167.3831024169922, -164.01971435546875, -160.65631103515625, -157.2929229736328, -153.92953491210938, -150.56613159179688, -147.20274353027344, -143.83935546875, -140.4759521484375, -137.11256408691406, -133.74917602539062, -130.38577270507812, -127.02238464355469, -123.65898895263672, -120.29559326171875, -116.93219757080078, -113.56880187988281, -110.20541381835938, -106.8420181274414, -103.47862243652344, -100.115234375, -96.75183868408203, -93.3884506225586, -90.02505493164062, -86.66166687011719, -83.29827117919922, -79.93487548828125, -76.57147979736328, -73.20808410644531, -69.84469604492188, -66.4813003540039, -63.11790466308594, -59.754512786865234, -56.39112091064453, -53.02772521972656, -49.664329528808594, -46.30093765258789, -42.93754577636719, -39.57415008544922, -36.21075439453125, -32.84736251831055, -29.48396873474121, -26.120574951171875, -22.75718116760254, -19.393787384033203, -16.030393600463867, -12.666997909545898, -9.303604125976562, -5.940210342407227, -2.5768165588378906, 0.7865772247314453, 4.149971008300781, 7.513364791870117, 10.876758575439453, 14.240152359008789]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 10.0, 14.0, 13.0, 15.0, 22.0, 19.0, 33.0, 24.0, 42.0, 33.0, 37.0, 46.0, 53.0, 41.0, 54.0, 48.0, 46.0, 47.0, 44.0, 31.0, 31.0, 30.0, 32.0, 30.0, 39.0, 25.0, 22.0, 14.0, 11.0, 20.0, 9.0, 9.0, 9.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.38605499267578, -15.87166976928711, -15.357284545898438, -14.842899322509766, -14.328514099121094, -13.814128875732422, -13.29974365234375, -12.785358428955078, -12.270973205566406, -11.756587982177734, -11.242202758789062, -10.72781753540039, -10.213432312011719, -9.699047088623047, -9.184661865234375, -8.670276641845703, -8.155890464782715, -7.641505241394043, -7.127120018005371, -6.612734794616699, -6.098349571228027, -5.5839643478393555, -5.069578647613525, -4.5551934242248535, -4.040808200836182, -3.5264229774475098, -3.012037754058838, -2.497652292251587, -1.983267068862915, -1.4688818454742432, -0.9544963836669922, -0.4401111602783203, 0.07427406311035156, 0.5886593461036682, 1.1030446290969849, 1.6174299716949463, 2.131815195083618, 2.64620041847229, 3.160585880279541, 3.674971103668213, 4.189356327056885, 4.703741550445557, 5.2181267738342285, 5.732512474060059, 6.2468976974487305, 6.761282920837402, 7.275668144226074, 7.790053367614746, 8.304438591003418, 8.81882381439209, 9.333209037780762, 9.847594261169434, 10.361979484558105, 10.876364707946777, 11.390750885009766, 11.905136108398438, 12.41952133178711, 12.933906555175781, 13.448291778564453, 13.962677001953125, 14.477062225341797, 14.991447448730469, 15.50583267211914, 16.020217895507812, 16.534603118896484]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 0.0, 4.0, 6.0, 9.0, 11.0, 17.0, 13.0, 18.0, 24.0, 18.0, 22.0, 38.0, 38.0, 40.0, 48.0, 38.0, 48.0, 42.0, 38.0, 44.0, 45.0, 30.0, 37.0, 43.0, 38.0, 38.0, 35.0, 30.0, 30.0, 21.0, 24.0, 18.0, 17.0, 15.0, 13.0, 13.0, 6.0, 7.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.009765625, -1.9550933837890625, -1.900421142578125, -1.8457489013671875, -1.79107666015625, -1.7364044189453125, -1.681732177734375, -1.6270599365234375, -1.5723876953125, -1.5177154541015625, -1.463043212890625, -1.4083709716796875, -1.35369873046875, -1.2990264892578125, -1.244354248046875, -1.1896820068359375, -1.135009765625, -1.0803375244140625, -1.025665283203125, -0.9709930419921875, -0.91632080078125, -0.8616485595703125, -0.806976318359375, -0.7523040771484375, -0.6976318359375, -0.6429595947265625, -0.588287353515625, -0.5336151123046875, -0.47894287109375, -0.4242706298828125, -0.369598388671875, -0.3149261474609375, -0.26025390625, -0.2055816650390625, -0.150909423828125, -0.0962371826171875, -0.04156494140625, 0.0131072998046875, 0.067779541015625, 0.1224517822265625, 0.1771240234375, 0.2317962646484375, 0.286468505859375, 0.3411407470703125, 0.39581298828125, 0.4504852294921875, 0.505157470703125, 0.5598297119140625, 0.614501953125, 0.6691741943359375, 0.723846435546875, 0.7785186767578125, 0.83319091796875, 0.8878631591796875, 0.942535400390625, 0.9972076416015625, 1.0518798828125, 1.1065521240234375, 1.161224365234375, 1.2158966064453125, 1.27056884765625, 1.3252410888671875, 1.379913330078125, 1.4345855712890625, 1.4892578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 11.0, 7.0, 11.0, 20.0, 30.0, 32.0, 58.0, 99.0, 120.0, 220.0, 380.0, 652.0, 1329.0, 2607.0, 5914.0, 15521.0, 51388.0, 323646.0, 2481733.0, 1145833.0, 119203.0, 27867.0, 9509.0, 4128.0, 1888.0, 898.0, 473.0, 268.0, 168.0, 79.0, 46.0, 61.0, 22.0, 21.0, 18.0, 12.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0], "bins": [-5.0625, -4.931884765625, -4.80126953125, -4.670654296875, -4.5400390625, -4.409423828125, -4.27880859375, -4.148193359375, -4.017578125, -3.886962890625, -3.75634765625, -3.625732421875, -3.4951171875, -3.364501953125, -3.23388671875, -3.103271484375, -2.97265625, -2.842041015625, -2.71142578125, -2.580810546875, -2.4501953125, -2.319580078125, -2.18896484375, -2.058349609375, -1.927734375, -1.797119140625, -1.66650390625, -1.535888671875, -1.4052734375, -1.274658203125, -1.14404296875, -1.013427734375, -0.8828125, -0.752197265625, -0.62158203125, -0.490966796875, -0.3603515625, -0.229736328125, -0.09912109375, 0.031494140625, 0.162109375, 0.292724609375, 0.42333984375, 0.553955078125, 0.6845703125, 0.815185546875, 0.94580078125, 1.076416015625, 1.20703125, 1.337646484375, 1.46826171875, 1.598876953125, 1.7294921875, 1.860107421875, 1.99072265625, 2.121337890625, 2.251953125, 2.382568359375, 2.51318359375, 2.643798828125, 2.7744140625, 2.905029296875, 3.03564453125, 3.166259765625, 3.296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 24.0, 19.0, 40.0, 34.0, 68.0, 94.0, 117.0, 200.0, 296.0, 542.0, 782.0, 689.0, 448.0, 249.0, 160.0, 99.0, 58.0, 44.0, 40.0, 16.0, 20.0, 13.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.58050537109375, -4.4266357421875, -4.27276611328125, -4.118896484375, -3.96502685546875, -3.8111572265625, -3.65728759765625, -3.50341796875, -3.34954833984375, -3.1956787109375, -3.04180908203125, -2.887939453125, -2.73406982421875, -2.5802001953125, -2.42633056640625, -2.2724609375, -2.11859130859375, -1.9647216796875, -1.81085205078125, -1.656982421875, -1.50311279296875, -1.3492431640625, -1.19537353515625, -1.04150390625, -0.88763427734375, -0.7337646484375, -0.57989501953125, -0.426025390625, -0.27215576171875, -0.1182861328125, 0.03558349609375, 0.189453125, 0.34332275390625, 0.4971923828125, 0.65106201171875, 0.804931640625, 0.95880126953125, 1.1126708984375, 1.26654052734375, 1.42041015625, 1.57427978515625, 1.7281494140625, 1.88201904296875, 2.035888671875, 2.18975830078125, 2.3436279296875, 2.49749755859375, 2.6513671875, 2.80523681640625, 2.9591064453125, 3.11297607421875, 3.266845703125, 3.42071533203125, 3.5745849609375, 3.72845458984375, 3.88232421875, 4.03619384765625, 4.1900634765625, 4.34393310546875, 4.497802734375, 4.65167236328125, 4.8055419921875, 4.95941162109375, 5.11328125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 9.0, 19.0, 25.0, 38.0, 46.0, 96.0, 133.0, 243.0, 575.0, 2865.0, 151032.0, 3997331.0, 39347.0, 1494.0, 421.0, 217.0, 127.0, 75.0, 57.0, 41.0, 25.0, 22.0, 15.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.639404296875, -19.01318359375, -18.386962890625, -17.7607421875, -17.134521484375, -16.50830078125, -15.882080078125, -15.255859375, -14.629638671875, -14.00341796875, -13.377197265625, -12.7509765625, -12.124755859375, -11.49853515625, -10.872314453125, -10.24609375, -9.619873046875, -8.99365234375, -8.367431640625, -7.7412109375, -7.114990234375, -6.48876953125, -5.862548828125, -5.236328125, -4.610107421875, -3.98388671875, -3.357666015625, -2.7314453125, -2.105224609375, -1.47900390625, -0.852783203125, -0.2265625, 0.399658203125, 1.02587890625, 1.652099609375, 2.2783203125, 2.904541015625, 3.53076171875, 4.156982421875, 4.783203125, 5.409423828125, 6.03564453125, 6.661865234375, 7.2880859375, 7.914306640625, 8.54052734375, 9.166748046875, 9.79296875, 10.419189453125, 11.04541015625, 11.671630859375, 12.2978515625, 12.924072265625, 13.55029296875, 14.176513671875, 14.802734375, 15.428955078125, 16.05517578125, 16.681396484375, 17.3076171875, 17.933837890625, 18.56005859375, 19.186279296875, 19.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 15.0, 76.0, 250.0, 382.0, 214.0, 62.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.24877166748047, -69.34900665283203, -67.44923400878906, -65.54946899414062, -63.649696350097656, -61.74993133544922, -59.85015869140625, -57.95039367675781, -56.05062484741211, -54.150856018066406, -52.2510871887207, -50.351318359375, -48.4515495300293, -46.551780700683594, -44.652015686035156, -42.75224685668945, -40.85247802734375, -38.95270919799805, -37.052940368652344, -35.15317153930664, -33.25340270996094, -31.353635787963867, -29.453866958618164, -27.554100036621094, -25.654327392578125, -23.754558563232422, -21.85478973388672, -19.955020904541016, -18.055253982543945, -16.155485153198242, -14.255716323852539, -12.355948448181152, -10.456180572509766, -8.556411743164062, -6.656643867492676, -4.756875038146973, -2.8571066856384277, -0.9573383331298828, 0.9424304962158203, 2.842198371887207, 4.74196720123291, 6.641735553741455, 8.54150390625, 10.441272735595703, 12.341041564941406, 14.240809440612793, 16.140579223632812, 18.040346145629883, 19.940114974975586, 21.83988380432129, 23.739652633666992, 25.639419555664062, 27.539188385009766, 29.43895721435547, 31.338726043701172, 33.238494873046875, 35.13826370239258, 37.03803253173828, 38.937801361083984, 40.83757019042969, 42.73733901977539, 44.637107849121094, 46.53687286376953, 48.436641693115234, 50.33641052246094]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 19.0, 21.0, 29.0, 27.0, 35.0, 26.0, 37.0, 38.0, 50.0, 43.0, 45.0, 49.0, 52.0, 50.0, 35.0, 53.0, 34.0, 46.0, 38.0, 25.0, 22.0, 22.0, 29.0, 28.0, 11.0, 21.0, 11.0, 9.0, 10.0, 4.0, 12.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.414841651916504, -11.030830383300781, -10.646818161010742, -10.262805938720703, -9.87879467010498, -9.494783401489258, -9.110771179199219, -8.72675895690918, -8.342747688293457, -7.958735942840576, -7.574724197387695, -7.1907124519348145, -6.806700706481934, -6.422688961029053, -6.038677215576172, -5.654665470123291, -5.27065372467041, -4.886641979217529, -4.502630233764648, -4.118618488311768, -3.7346067428588867, -3.350594997406006, -2.966583251953125, -2.582571506500244, -2.1985597610473633, -1.8145480155944824, -1.4305362701416016, -1.0465245246887207, -0.6625127792358398, -0.278501033782959, 0.10551071166992188, 0.48952245712280273, 0.87353515625, 1.2575469017028809, 1.6415586471557617, 2.0255703926086426, 2.4095821380615234, 2.7935938835144043, 3.177605628967285, 3.561617374420166, 3.945629119873047, 4.329640865325928, 4.713652610778809, 5.0976643562316895, 5.48167610168457, 5.865687847137451, 6.249699592590332, 6.633711338043213, 7.017723083496094, 7.401734828948975, 7.7857465744018555, 8.169757843017578, 8.553770065307617, 8.937782287597656, 9.321793556213379, 9.705804824829102, 10.08981704711914, 10.47382926940918, 10.857840538024902, 11.241851806640625, 11.625864028930664, 12.009876251220703, 12.393887519836426, 12.777898788452148, 13.161911010742188]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 6.0, 11.0, 8.0, 12.0, 13.0, 21.0, 17.0, 24.0, 30.0, 44.0, 38.0, 35.0, 56.0, 52.0, 31.0, 48.0, 50.0, 55.0, 33.0, 46.0, 43.0, 36.0, 35.0, 38.0, 28.0, 33.0, 29.0, 14.0, 17.0, 26.0, 12.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.69378662109375, -1.6405029296875, -1.58721923828125, -1.533935546875, -1.48065185546875, -1.4273681640625, -1.37408447265625, -1.32080078125, -1.26751708984375, -1.2142333984375, -1.16094970703125, -1.107666015625, -1.05438232421875, -1.0010986328125, -0.94781494140625, -0.89453125, -0.84124755859375, -0.7879638671875, -0.73468017578125, -0.681396484375, -0.62811279296875, -0.5748291015625, -0.52154541015625, -0.46826171875, -0.41497802734375, -0.3616943359375, -0.30841064453125, -0.255126953125, -0.20184326171875, -0.1485595703125, -0.09527587890625, -0.0419921875, 0.01129150390625, 0.0645751953125, 0.11785888671875, 0.171142578125, 0.22442626953125, 0.2777099609375, 0.33099365234375, 0.38427734375, 0.43756103515625, 0.4908447265625, 0.54412841796875, 0.597412109375, 0.65069580078125, 0.7039794921875, 0.75726318359375, 0.810546875, 0.86383056640625, 0.9171142578125, 0.97039794921875, 1.023681640625, 1.07696533203125, 1.1302490234375, 1.18353271484375, 1.23681640625, 1.29010009765625, 1.3433837890625, 1.39666748046875, 1.449951171875, 1.50323486328125, 1.5565185546875, 1.60980224609375, 1.6630859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 8.0, 15.0, 22.0, 28.0, 42.0, 64.0, 83.0, 160.0, 241.0, 382.0, 570.0, 905.0, 1514.0, 2439.0, 3915.0, 6395.0, 10633.0, 17516.0, 28901.0, 48375.0, 78775.0, 122383.0, 169847.0, 179864.0, 139014.0, 92095.0, 56686.0, 34517.0, 20835.0, 12534.0, 7608.0, 4576.0, 2807.0, 1760.0, 1150.0, 671.0, 455.0, 264.0, 157.0, 106.0, 79.0, 45.0, 44.0, 27.0, 13.0, 9.0, 4.0, 7.0, 0.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.6572265625, -0.6367950439453125, -0.616363525390625, -0.5959320068359375, -0.57550048828125, -0.5550689697265625, -0.534637451171875, -0.5142059326171875, -0.4937744140625, -0.4733428955078125, -0.452911376953125, -0.4324798583984375, -0.41204833984375, -0.3916168212890625, -0.371185302734375, -0.3507537841796875, -0.330322265625, -0.3098907470703125, -0.289459228515625, -0.2690277099609375, -0.24859619140625, -0.2281646728515625, -0.207733154296875, -0.1873016357421875, -0.1668701171875, -0.1464385986328125, -0.126007080078125, -0.1055755615234375, -0.08514404296875, -0.0647125244140625, -0.044281005859375, -0.0238494873046875, -0.00341796875, 0.0170135498046875, 0.037445068359375, 0.0578765869140625, 0.07830810546875, 0.0987396240234375, 0.119171142578125, 0.1396026611328125, 0.1600341796875, 0.1804656982421875, 0.200897216796875, 0.2213287353515625, 0.24176025390625, 0.2621917724609375, 0.282623291015625, 0.3030548095703125, 0.323486328125, 0.3439178466796875, 0.364349365234375, 0.3847808837890625, 0.40521240234375, 0.4256439208984375, 0.446075439453125, 0.4665069580078125, 0.4869384765625, 0.5073699951171875, 0.527801513671875, 0.5482330322265625, 0.56866455078125, 0.5890960693359375, 0.609527587890625, 0.6299591064453125, 0.650390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 12.0, 11.0, 19.0, 24.0, 19.0, 25.0, 21.0, 40.0, 25.0, 36.0, 38.0, 42.0, 35.0, 32.0, 35.0, 47.0, 41.0, 1073.0, 44.0, 39.0, 40.0, 32.0, 29.0, 36.0, 32.0, 25.0, 24.0, 15.0, 19.0, 24.0, 10.0, 14.0, 9.0, 11.0, 8.0, 5.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.172576904296875, -1.13226318359375, -1.091949462890625, -1.0516357421875, -1.011322021484375, -0.97100830078125, -0.930694580078125, -0.890380859375, -0.850067138671875, -0.80975341796875, -0.769439697265625, -0.7291259765625, -0.688812255859375, -0.64849853515625, -0.608184814453125, -0.56787109375, -0.527557373046875, -0.48724365234375, -0.446929931640625, -0.4066162109375, -0.366302490234375, -0.32598876953125, -0.285675048828125, -0.245361328125, -0.205047607421875, -0.16473388671875, -0.124420166015625, -0.0841064453125, -0.043792724609375, -0.00347900390625, 0.036834716796875, 0.0771484375, 0.117462158203125, 0.15777587890625, 0.198089599609375, 0.2384033203125, 0.278717041015625, 0.31903076171875, 0.359344482421875, 0.399658203125, 0.439971923828125, 0.48028564453125, 0.520599365234375, 0.5609130859375, 0.601226806640625, 0.64154052734375, 0.681854248046875, 0.72216796875, 0.762481689453125, 0.80279541015625, 0.843109130859375, 0.8834228515625, 0.923736572265625, 0.96405029296875, 1.004364013671875, 1.044677734375, 1.084991455078125, 1.12530517578125, 1.165618896484375, 1.2059326171875, 1.246246337890625, 1.28656005859375, 1.326873779296875, 1.3671875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 14.0, 8.0, 14.0, 19.0, 27.0, 54.0, 76.0, 101.0, 195.0, 259.0, 380.0, 618.0, 1007.0, 1590.0, 2366.0, 3783.0, 6403.0, 10864.0, 19369.0, 42720.0, 233930.0, 1580125.0, 120505.0, 32323.0, 16314.0, 9248.0, 5610.0, 3359.0, 2130.0, 1308.0, 811.0, 579.0, 366.0, 247.0, 161.0, 87.0, 57.0, 42.0, 26.0, 19.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.962890625, -0.9311676025390625, -0.899444580078125, -0.8677215576171875, -0.83599853515625, -0.8042755126953125, -0.772552490234375, -0.7408294677734375, -0.7091064453125, -0.6773834228515625, -0.645660400390625, -0.6139373779296875, -0.58221435546875, -0.5504913330078125, -0.518768310546875, -0.4870452880859375, -0.455322265625, -0.4235992431640625, -0.391876220703125, -0.3601531982421875, -0.32843017578125, -0.2967071533203125, -0.264984130859375, -0.2332611083984375, -0.2015380859375, -0.1698150634765625, -0.138092041015625, -0.1063690185546875, -0.07464599609375, -0.0429229736328125, -0.011199951171875, 0.0205230712890625, 0.05224609375, 0.0839691162109375, 0.115692138671875, 0.1474151611328125, 0.17913818359375, 0.2108612060546875, 0.242584228515625, 0.2743072509765625, 0.3060302734375, 0.3377532958984375, 0.369476318359375, 0.4011993408203125, 0.43292236328125, 0.4646453857421875, 0.496368408203125, 0.5280914306640625, 0.559814453125, 0.5915374755859375, 0.623260498046875, 0.6549835205078125, 0.68670654296875, 0.7184295654296875, 0.750152587890625, 0.7818756103515625, 0.8135986328125, 0.8453216552734375, 0.877044677734375, 0.9087677001953125, 0.94049072265625, 0.9722137451171875, 1.003936767578125, 1.0356597900390625, 1.0673828125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 2.0, 4.0, 9.0, 18.0, 17.0, 19.0, 19.0, 19.0, 24.0, 27.0, 31.0, 28.0, 41.0, 49.0, 50.0, 57.0, 61.0, 83.0, 66.0, 52.0, 38.0, 38.0, 32.0, 35.0, 34.0, 27.0, 26.0, 26.0, 15.0, 11.0, 15.0, 8.0, 2.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11669921875, -0.11336708068847656, -0.11003494262695312, -0.10670280456542969, -0.10337066650390625, -0.10003852844238281, -0.09670639038085938, -0.09337425231933594, -0.0900421142578125, -0.08670997619628906, -0.08337783813476562, -0.08004570007324219, -0.07671356201171875, -0.07338142395019531, -0.07004928588867188, -0.06671714782714844, -0.063385009765625, -0.06005287170410156, -0.056720733642578125, -0.05338859558105469, -0.05005645751953125, -0.04672431945800781, -0.043392181396484375, -0.04006004333496094, -0.0367279052734375, -0.03339576721191406, -0.030063629150390625, -0.026731491088867188, -0.02339935302734375, -0.020067214965820312, -0.016735076904296875, -0.013402938842773438, -0.01007080078125, -0.0067386627197265625, -0.003406524658203125, -7.43865966796875e-05, 0.00325775146484375, 0.0065898895263671875, 0.009922027587890625, 0.013254165649414062, 0.0165863037109375, 0.019918441772460938, 0.023250579833984375, 0.026582717895507812, 0.02991485595703125, 0.03324699401855469, 0.036579132080078125, 0.03991127014160156, 0.043243408203125, 0.04657554626464844, 0.049907684326171875, 0.05323982238769531, 0.05657196044921875, 0.05990409851074219, 0.06323623657226562, 0.06656837463378906, 0.0699005126953125, 0.07323265075683594, 0.07656478881835938, 0.07989692687988281, 0.08322906494140625, 0.08656120300292969, 0.08989334106445312, 0.09322547912597656, 0.0965576171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 14.0, 18.0, 23.0, 44.0, 36.0, 53.0, 43.0, 98.0, 142.0, 265.0, 988.0, 48211.0, 986827.0, 10450.0, 655.0, 204.0, 128.0, 93.0, 45.0, 39.0, 25.0, 30.0, 21.0, 13.0, 22.0, 15.0, 4.0, 5.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.045074462890625, -1.97296142578125, -1.900848388671875, -1.8287353515625, -1.756622314453125, -1.68450927734375, -1.612396240234375, -1.540283203125, -1.468170166015625, -1.39605712890625, -1.323944091796875, -1.2518310546875, -1.179718017578125, -1.10760498046875, -1.035491943359375, -0.96337890625, -0.891265869140625, -0.81915283203125, -0.747039794921875, -0.6749267578125, -0.602813720703125, -0.53070068359375, -0.458587646484375, -0.386474609375, -0.314361572265625, -0.24224853515625, -0.170135498046875, -0.0980224609375, -0.025909423828125, 0.04620361328125, 0.118316650390625, 0.1904296875, 0.262542724609375, 0.33465576171875, 0.406768798828125, 0.4788818359375, 0.550994873046875, 0.62310791015625, 0.695220947265625, 0.767333984375, 0.839447021484375, 0.91156005859375, 0.983673095703125, 1.0557861328125, 1.127899169921875, 1.20001220703125, 1.272125244140625, 1.34423828125, 1.416351318359375, 1.48846435546875, 1.560577392578125, 1.6326904296875, 1.704803466796875, 1.77691650390625, 1.849029541015625, 1.921142578125, 1.993255615234375, 2.06536865234375, 2.137481689453125, 2.2095947265625, 2.281707763671875, 2.35382080078125, 2.425933837890625, 2.498046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 11.0, 59.0, 558.0, 350.0, 36.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73728346824646, -2.639051914215088, -2.540820598602295, -2.442589044570923, -2.34435772895813, -2.246126174926758, -2.147894859313965, -2.0496633052825928, -1.9514319896697998, -1.8532005548477173, -1.7549691200256348, -1.6567376852035522, -1.5585062503814697, -1.4602748155593872, -1.3620433807373047, -1.2638118267059326, -1.16558039188385, -1.0673489570617676, -0.9691175222396851, -0.8708860874176025, -0.77265465259552, -0.6744232177734375, -0.5761917233467102, -0.4779602885246277, -0.37972885370254517, -0.28149741888046265, -0.18326596915721893, -0.08503451943397522, 0.0131969153881073, 0.11142835021018982, 0.20965981483459473, 0.30789124965667725, 0.40612268447875977, 0.5043541193008423, 0.6025855541229248, 0.7008169889450073, 0.7990484237670898, 0.8972798585891724, 0.9955113530158997, 1.093742847442627, 1.19197416305542, 1.2902055978775024, 1.388437032699585, 1.4866684675216675, 1.58489990234375, 1.6831313371658325, 1.781362771987915, 1.879594326019287, 1.9778257608413696, 2.076057195663452, 2.174288749694824, 2.272520065307617, 2.3707516193389893, 2.4689829349517822, 2.5672144889831543, 2.6654458045959473, 2.7636773586273193, 2.8619089126586914, 2.9601402282714844, 3.0583717823028564, 3.1566030979156494, 3.2548346519470215, 3.3530659675598145, 3.4512975215911865, 3.5495288372039795]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 8.0, 6.0, 7.0, 9.0, 12.0, 20.0, 18.0, 25.0, 29.0, 31.0, 38.0, 59.0, 53.0, 35.0, 57.0, 51.0, 57.0, 55.0, 58.0, 47.0, 50.0, 49.0, 39.0, 29.0, 31.0, 27.0, 19.0, 25.0, 18.0, 10.0, 8.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6050333380699158, -0.5891799330711365, -0.5733264684677124, -0.5574730634689331, -0.541619598865509, -0.5257661938667297, -0.5099127292633057, -0.49405932426452637, -0.47820591926574707, -0.4623524844646454, -0.4464990496635437, -0.4306456446647644, -0.4147922098636627, -0.39893877506256104, -0.38308534026145935, -0.36723190546035767, -0.351378470659256, -0.3355250358581543, -0.3196716010570526, -0.3038181662559509, -0.28796476125717163, -0.27211132645606995, -0.25625789165496826, -0.24040445685386658, -0.2245510369539261, -0.2086976021528244, -0.1928441822528839, -0.17699074745178223, -0.16113731265068054, -0.14528389275074005, -0.12943045794963837, -0.11357703059911728, -0.09772360324859619, -0.0818701758980751, -0.06601674854755402, -0.05016331374645233, -0.034309886395931244, -0.018456459045410156, -0.0026030242443084717, 0.013250403106212616, 0.029103830456733704, 0.04495725780725479, 0.06081068888306618, 0.07666411995887756, 0.09251754730939865, 0.10837097465991974, 0.12422440946102142, 0.14007782936096191, 0.1559312641620636, 0.17178469896316528, 0.18763811886310577, 0.20349155366420746, 0.21934497356414795, 0.23519840836524963, 0.2510518431663513, 0.266905277967453, 0.2827587127685547, 0.29861214756965637, 0.31446558237075806, 0.33031898736953735, 0.34617242217063904, 0.3620258569717407, 0.3778792917728424, 0.3937327265739441, 0.4095861315727234]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 24.0, 18.0, 27.0, 30.0, 43.0, 39.0, 60.0, 49.0, 65.0, 75.0, 56.0, 70.0, 52.0, 67.0, 52.0, 50.0, 47.0, 30.0, 30.0, 28.0, 29.0, 17.0, 13.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.287506103515625, -2.21173095703125, -2.135955810546875, -2.0601806640625, -1.984405517578125, -1.90863037109375, -1.832855224609375, -1.757080078125, -1.681304931640625, -1.60552978515625, -1.529754638671875, -1.4539794921875, -1.378204345703125, -1.30242919921875, -1.226654052734375, -1.15087890625, -1.075103759765625, -0.99932861328125, -0.923553466796875, -0.8477783203125, -0.772003173828125, -0.69622802734375, -0.620452880859375, -0.544677734375, -0.468902587890625, -0.39312744140625, -0.317352294921875, -0.2415771484375, -0.165802001953125, -0.09002685546875, -0.014251708984375, 0.0615234375, 0.137298583984375, 0.21307373046875, 0.288848876953125, 0.3646240234375, 0.440399169921875, 0.51617431640625, 0.591949462890625, 0.667724609375, 0.743499755859375, 0.81927490234375, 0.895050048828125, 0.9708251953125, 1.046600341796875, 1.12237548828125, 1.198150634765625, 1.27392578125, 1.349700927734375, 1.42547607421875, 1.501251220703125, 1.5770263671875, 1.652801513671875, 1.72857666015625, 1.804351806640625, 1.880126953125, 1.955902099609375, 2.03167724609375, 2.107452392578125, 2.1832275390625, 2.259002685546875, 2.33477783203125, 2.410552978515625, 2.486328125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 10.0, 9.0, 13.0, 29.0, 54.0, 86.0, 175.0, 310.0, 619.0, 1397.0, 2983.0, 6853.0, 18012.0, 51120.0, 172640.0, 482953.0, 214090.0, 61633.0, 21241.0, 7928.0, 3341.0, 1495.0, 750.0, 348.0, 192.0, 110.0, 60.0, 36.0, 22.0, 12.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.25933837890625, -2.1710205078125, -2.08270263671875, -1.994384765625, -1.90606689453125, -1.8177490234375, -1.72943115234375, -1.64111328125, -1.55279541015625, -1.4644775390625, -1.37615966796875, -1.287841796875, -1.19952392578125, -1.1112060546875, -1.02288818359375, -0.9345703125, -0.84625244140625, -0.7579345703125, -0.66961669921875, -0.581298828125, -0.49298095703125, -0.4046630859375, -0.31634521484375, -0.22802734375, -0.13970947265625, -0.0513916015625, 0.03692626953125, 0.125244140625, 0.21356201171875, 0.3018798828125, 0.39019775390625, 0.478515625, 0.56683349609375, 0.6551513671875, 0.74346923828125, 0.831787109375, 0.92010498046875, 1.0084228515625, 1.09674072265625, 1.18505859375, 1.27337646484375, 1.3616943359375, 1.45001220703125, 1.538330078125, 1.62664794921875, 1.7149658203125, 1.80328369140625, 1.8916015625, 1.97991943359375, 2.0682373046875, 2.15655517578125, 2.244873046875, 2.33319091796875, 2.4215087890625, 2.50982666015625, 2.59814453125, 2.68646240234375, 2.7747802734375, 2.86309814453125, 2.951416015625, 3.03973388671875, 3.1280517578125, 3.21636962890625, 3.3046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 12.0, 7.0, 15.0, 12.0, 28.0, 24.0, 37.0, 39.0, 39.0, 53.0, 56.0, 68.0, 123.0, 221.0, 1519.0, 224.0, 124.0, 66.0, 56.0, 47.0, 46.0, 34.0, 34.0, 24.0, 24.0, 20.0, 15.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7176513671875, -6.517333984375, -6.3170166015625, -6.11669921875, -5.9163818359375, -5.716064453125, -5.5157470703125, -5.3154296875, -5.1151123046875, -4.914794921875, -4.7144775390625, -4.51416015625, -4.3138427734375, -4.113525390625, -3.9132080078125, -3.712890625, -3.5125732421875, -3.312255859375, -3.1119384765625, -2.91162109375, -2.7113037109375, -2.510986328125, -2.3106689453125, -2.1103515625, -1.9100341796875, -1.709716796875, -1.5093994140625, -1.30908203125, -1.1087646484375, -0.908447265625, -0.7081298828125, -0.5078125, -0.3074951171875, -0.107177734375, 0.0931396484375, 0.29345703125, 0.4937744140625, 0.694091796875, 0.8944091796875, 1.0947265625, 1.2950439453125, 1.495361328125, 1.6956787109375, 1.89599609375, 2.0963134765625, 2.296630859375, 2.4969482421875, 2.697265625, 2.8975830078125, 3.097900390625, 3.2982177734375, 3.49853515625, 3.6988525390625, 3.899169921875, 4.0994873046875, 4.2998046875, 4.5001220703125, 4.700439453125, 4.9007568359375, 5.10107421875, 5.3013916015625, 5.501708984375, 5.7020263671875, 5.90234375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 15.0, 14.0, 10.0, 21.0, 31.0, 39.0, 51.0, 61.0, 99.0, 166.0, 197.0, 398.0, 1222.0, 8865.0, 673348.0, 2441671.0, 16589.0, 1606.0, 473.0, 260.0, 144.0, 103.0, 96.0, 48.0, 38.0, 31.0, 22.0, 18.0, 16.0, 10.0, 5.0, 9.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.8668212890625, -11.444580078125, -11.0223388671875, -10.60009765625, -10.1778564453125, -9.755615234375, -9.3333740234375, -8.9111328125, -8.4888916015625, -8.066650390625, -7.6444091796875, -7.22216796875, -6.7999267578125, -6.377685546875, -5.9554443359375, -5.533203125, -5.1109619140625, -4.688720703125, -4.2664794921875, -3.84423828125, -3.4219970703125, -2.999755859375, -2.5775146484375, -2.1552734375, -1.7330322265625, -1.310791015625, -0.8885498046875, -0.46630859375, -0.0440673828125, 0.378173828125, 0.8004150390625, 1.22265625, 1.6448974609375, 2.067138671875, 2.4893798828125, 2.91162109375, 3.3338623046875, 3.756103515625, 4.1783447265625, 4.6005859375, 5.0228271484375, 5.445068359375, 5.8673095703125, 6.28955078125, 6.7117919921875, 7.134033203125, 7.5562744140625, 7.978515625, 8.4007568359375, 8.822998046875, 9.2452392578125, 9.66748046875, 10.0897216796875, 10.511962890625, 10.9342041015625, 11.3564453125, 11.7786865234375, 12.200927734375, 12.6231689453125, 13.04541015625, 13.4676513671875, 13.889892578125, 14.3121337890625, 14.734375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 528.0, 482.0, 4.0], "bins": [-254.04322814941406, -249.94281005859375, -245.84239196777344, -241.74197387695312, -237.6415557861328, -233.5411376953125, -229.4407196044922, -225.34030151367188, -221.2398681640625, -217.1394500732422, -213.03903198242188, -208.93861389160156, -204.83819580078125, -200.73777770996094, -196.63735961914062, -192.53692626953125, -188.4365234375, -184.3361053466797, -180.23568725585938, -176.13526916503906, -172.03485107421875, -167.93443298339844, -163.83401489257812, -159.73358154296875, -155.6331787109375, -151.5327606201172, -147.43234252929688, -143.33192443847656, -139.23150634765625, -135.13108825683594, -131.03067016601562, -126.93024444580078, -122.82980346679688, -118.72938537597656, -114.62896728515625, -110.52854919433594, -106.42813110351562, -102.32771301269531, -98.22728729248047, -94.12686920166016, -90.02645111083984, -85.92603302001953, -81.82561492919922, -77.7251968383789, -73.62477111816406, -69.52435302734375, -65.42393493652344, -61.323516845703125, -57.22309875488281, -53.1226806640625, -49.02226257324219, -44.92184066772461, -40.8214225769043, -36.721004486083984, -32.620582580566406, -28.520164489746094, -24.41974639892578, -20.31932830810547, -16.218908309936523, -12.118489265441895, -8.018070220947266, -3.917652130126953, 0.1827678680419922, 4.2831878662109375, 8.38360595703125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 10.0, 6.0, 14.0, 17.0, 12.0, 17.0, 22.0, 27.0, 31.0, 33.0, 39.0, 42.0, 39.0, 33.0, 52.0, 50.0, 42.0, 35.0, 31.0, 44.0, 38.0, 44.0, 30.0, 35.0, 35.0, 37.0, 24.0, 26.0, 25.0, 16.0, 22.0, 15.0, 12.0, 7.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.349242210388184, -14.865498542785645, -14.381753921508789, -13.89801025390625, -13.414265632629395, -12.930521965026855, -12.44677734375, -11.963033676147461, -11.479289054870605, -10.995545387268066, -10.511800765991211, -10.028057098388672, -9.544312477111816, -9.060568809509277, -8.576824188232422, -8.093080520629883, -7.6093363761901855, -7.125592231750488, -6.641848087310791, -6.158103942871094, -5.6743597984313965, -5.190615653991699, -4.70687198638916, -4.223127365112305, -3.7393834590911865, -3.2556393146514893, -2.771895170211792, -2.288151264190674, -1.804407000541687, -1.3206629753112793, -0.836918830871582, -0.35317468643188477, 0.1305694580078125, 0.6143136024475098, 1.098057746887207, 1.5818017721176147, 2.0655460357666016, 2.5492899417877197, 3.033034086227417, 3.5167782306671143, 4.000522613525391, 4.484266757965088, 4.968010902404785, 5.451755046844482, 5.93549919128418, 6.419242858886719, 6.902987480163574, 7.386731147766113, 7.8704752922058105, 8.354219436645508, 8.837963104248047, 9.321707725524902, 9.805451393127441, 10.289196014404297, 10.772939682006836, 11.256684303283691, 11.74042797088623, 12.22417163848877, 12.707916259765625, 13.191659927368164, 13.67540454864502, 14.159148216247559, 14.642892837524414, 15.126636505126953, 15.610381126403809]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 13.0, 12.0, 12.0, 10.0, 27.0, 19.0, 29.0, 35.0, 35.0, 39.0, 45.0, 44.0, 67.0, 53.0, 60.0, 41.0, 52.0, 51.0, 62.0, 42.0, 37.0, 38.0, 39.0, 28.0, 26.0, 14.0, 22.0, 7.0, 11.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.16497802734375, -2.0975341796875, -2.03009033203125, -1.962646484375, -1.89520263671875, -1.8277587890625, -1.76031494140625, -1.69287109375, -1.62542724609375, -1.5579833984375, -1.49053955078125, -1.423095703125, -1.35565185546875, -1.2882080078125, -1.22076416015625, -1.1533203125, -1.08587646484375, -1.0184326171875, -0.95098876953125, -0.883544921875, -0.81610107421875, -0.7486572265625, -0.68121337890625, -0.61376953125, -0.54632568359375, -0.4788818359375, -0.41143798828125, -0.343994140625, -0.27655029296875, -0.2091064453125, -0.14166259765625, -0.07421875, -0.00677490234375, 0.0606689453125, 0.12811279296875, 0.195556640625, 0.26300048828125, 0.3304443359375, 0.39788818359375, 0.46533203125, 0.53277587890625, 0.6002197265625, 0.66766357421875, 0.735107421875, 0.80255126953125, 0.8699951171875, 0.93743896484375, 1.0048828125, 1.07232666015625, 1.1397705078125, 1.20721435546875, 1.274658203125, 1.34210205078125, 1.4095458984375, 1.47698974609375, 1.54443359375, 1.61187744140625, 1.6793212890625, 1.74676513671875, 1.814208984375, 1.88165283203125, 1.9490966796875, 2.01654052734375, 2.083984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 11.0, 18.0, 10.0, 30.0, 37.0, 59.0, 86.0, 131.0, 196.0, 370.0, 614.0, 1140.0, 2390.0, 5033.0, 12120.0, 32575.0, 129362.0, 1099910.0, 2454789.0, 359602.0, 61196.0, 19613.0, 7805.0, 3534.0, 1657.0, 800.0, 468.0, 262.0, 166.0, 101.0, 70.0, 49.0, 22.0, 21.0, 13.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.70538330078125, -3.5787353515625, -3.45208740234375, -3.325439453125, -3.19879150390625, -3.0721435546875, -2.94549560546875, -2.81884765625, -2.69219970703125, -2.5655517578125, -2.43890380859375, -2.312255859375, -2.18560791015625, -2.0589599609375, -1.93231201171875, -1.8056640625, -1.67901611328125, -1.5523681640625, -1.42572021484375, -1.299072265625, -1.17242431640625, -1.0457763671875, -0.91912841796875, -0.79248046875, -0.66583251953125, -0.5391845703125, -0.41253662109375, -0.285888671875, -0.15924072265625, -0.0325927734375, 0.09405517578125, 0.220703125, 0.34735107421875, 0.4739990234375, 0.60064697265625, 0.727294921875, 0.85394287109375, 0.9805908203125, 1.10723876953125, 1.23388671875, 1.36053466796875, 1.4871826171875, 1.61383056640625, 1.740478515625, 1.86712646484375, 1.9937744140625, 2.12042236328125, 2.2470703125, 2.37371826171875, 2.5003662109375, 2.62701416015625, 2.753662109375, 2.88031005859375, 3.0069580078125, 3.13360595703125, 3.26025390625, 3.38690185546875, 3.5135498046875, 3.64019775390625, 3.766845703125, 3.89349365234375, 4.0201416015625, 4.14678955078125, 4.2734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 7.0, 6.0, 9.0, 18.0, 21.0, 37.0, 52.0, 80.0, 78.0, 119.0, 193.0, 294.0, 452.0, 685.0, 683.0, 465.0, 325.0, 200.0, 114.0, 69.0, 49.0, 38.0, 21.0, 16.0, 8.0, 9.0, 11.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.7578125, -5.620849609375, -5.48388671875, -5.346923828125, -5.2099609375, -5.072998046875, -4.93603515625, -4.799072265625, -4.662109375, -4.525146484375, -4.38818359375, -4.251220703125, -4.1142578125, -3.977294921875, -3.84033203125, -3.703369140625, -3.56640625, -3.429443359375, -3.29248046875, -3.155517578125, -3.0185546875, -2.881591796875, -2.74462890625, -2.607666015625, -2.470703125, -2.333740234375, -2.19677734375, -2.059814453125, -1.9228515625, -1.785888671875, -1.64892578125, -1.511962890625, -1.375, -1.238037109375, -1.10107421875, -0.964111328125, -0.8271484375, -0.690185546875, -0.55322265625, -0.416259765625, -0.279296875, -0.142333984375, -0.00537109375, 0.131591796875, 0.2685546875, 0.405517578125, 0.54248046875, 0.679443359375, 0.81640625, 0.953369140625, 1.09033203125, 1.227294921875, 1.3642578125, 1.501220703125, 1.63818359375, 1.775146484375, 1.912109375, 2.049072265625, 2.18603515625, 2.322998046875, 2.4599609375, 2.596923828125, 2.73388671875, 2.870849609375, 3.0078125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 12.0, 14.0, 12.0, 12.0, 37.0, 46.0, 69.0, 103.0, 225.0, 534.0, 2860.0, 66386.0, 3999605.0, 119169.0, 3887.0, 631.0, 250.0, 120.0, 89.0, 74.0, 43.0, 35.0, 15.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1640625, -12.5806884765625, -11.997314453125, -11.4139404296875, -10.83056640625, -10.2471923828125, -9.663818359375, -9.0804443359375, -8.4970703125, -7.9136962890625, -7.330322265625, -6.7469482421875, -6.16357421875, -5.5802001953125, -4.996826171875, -4.4134521484375, -3.830078125, -3.2467041015625, -2.663330078125, -2.0799560546875, -1.49658203125, -0.9132080078125, -0.329833984375, 0.2535400390625, 0.8369140625, 1.4202880859375, 2.003662109375, 2.5870361328125, 3.17041015625, 3.7537841796875, 4.337158203125, 4.9205322265625, 5.50390625, 6.0872802734375, 6.670654296875, 7.2540283203125, 7.83740234375, 8.4207763671875, 9.004150390625, 9.5875244140625, 10.1708984375, 10.7542724609375, 11.337646484375, 11.9210205078125, 12.50439453125, 13.0877685546875, 13.671142578125, 14.2545166015625, 14.837890625, 15.4212646484375, 16.004638671875, 16.5880126953125, 17.17138671875, 17.7547607421875, 18.338134765625, 18.9215087890625, 19.5048828125, 20.0882568359375, 20.671630859375, 21.2550048828125, 21.83837890625, 22.4217529296875, 23.005126953125, 23.5885009765625, 24.171875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 29.0, 54.0, 128.0, 248.0, 262.0, 144.0, 71.0, 38.0, 11.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.337215423583984, -15.11185073852539, -13.886486053466797, -12.661120414733887, -11.435755729675293, -10.2103910446167, -8.985025405883789, -7.759660720825195, -6.534296035766602, -5.308931350708008, -4.083566188812256, -2.858201265335083, -1.6328363418579102, -0.4074716567993164, 0.8178935050964355, 2.0432586669921875, 3.2686233520507812, 4.493988037109375, 5.719353199005127, 6.944718360900879, 8.170083045959473, 9.395447731018066, 10.620813369750977, 11.84617805480957, 13.071542739868164, 14.296907424926758, 15.522272109985352, 16.747636795043945, 17.973003387451172, 19.198368072509766, 20.42373275756836, 21.649097442626953, 22.874462127685547, 24.09982681274414, 25.325191497802734, 26.550556182861328, 27.775920867919922, 29.001285552978516, 30.226652145385742, 31.452016830444336, 32.67738342285156, 33.902748107910156, 35.12811279296875, 36.353477478027344, 37.57884216308594, 38.80420684814453, 40.029571533203125, 41.25493621826172, 42.48030090332031, 43.705665588378906, 44.9310302734375, 46.156394958496094, 47.38175964355469, 48.60712432861328, 49.832489013671875, 51.05785369873047, 52.28321838378906, 53.508583068847656, 54.73394775390625, 55.959312438964844, 57.18467712402344, 58.41004180908203, 59.635406494140625, 60.86077117919922, 62.08613967895508]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 6.0, 12.0, 5.0, 11.0, 15.0, 12.0, 15.0, 21.0, 22.0, 24.0, 29.0, 35.0, 36.0, 42.0, 36.0, 46.0, 32.0, 43.0, 59.0, 51.0, 34.0, 29.0, 32.0, 33.0, 44.0, 35.0, 27.0, 20.0, 25.0, 29.0, 23.0, 14.0, 13.0, 15.0, 20.0, 7.0, 6.0, 8.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-13.171545028686523, -12.812033653259277, -12.452521324157715, -12.093009948730469, -11.733498573303223, -11.373987197875977, -11.014474868774414, -10.654963493347168, -10.295452117919922, -9.935940742492676, -9.576428413391113, -9.216917037963867, -8.857405662536621, -8.497894287109375, -8.138381958007812, -7.778870582580566, -7.419358730316162, -7.059846878051758, -6.700335502624512, -6.340823650360107, -5.981312274932861, -5.621800422668457, -5.262289047241211, -4.902777194976807, -4.543265342712402, -4.183753490447998, -3.824242115020752, -3.4647302627563477, -3.1052188873291016, -2.7457070350646973, -2.386195421218872, -2.026683807373047, -1.6671724319458008, -1.3076608180999756, -0.9481491446495056, -0.5886374711990356, -0.22912585735321045, 0.13038575649261475, 0.4898974895477295, 0.8494091033935547, 1.2089207172393799, 1.568432331085205, 1.9279439449310303, 2.2874555587768555, 2.6469674110412598, 3.006478786468506, 3.36599063873291, 3.7255022525787354, 4.0850138664245605, 4.444525718688965, 4.804037094116211, 5.163548946380615, 5.523060321807861, 5.882572174072266, 6.242083549499512, 6.601595401763916, 6.96110725402832, 7.320619106292725, 7.680130481719971, 8.039642333984375, 8.399153709411621, 8.758665084838867, 9.11817741394043, 9.477688789367676, 9.837200164794922]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 8.0, 16.0, 8.0, 19.0, 33.0, 29.0, 37.0, 35.0, 55.0, 54.0, 59.0, 68.0, 62.0, 55.0, 68.0, 69.0, 53.0, 50.0, 38.0, 28.0, 33.0, 28.0, 22.0, 20.0, 12.0, 11.0, 10.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.873626708984375, -2.79803466796875, -2.722442626953125, -2.6468505859375, -2.571258544921875, -2.49566650390625, -2.420074462890625, -2.344482421875, -2.268890380859375, -2.19329833984375, -2.117706298828125, -2.0421142578125, -1.966522216796875, -1.89093017578125, -1.815338134765625, -1.73974609375, -1.664154052734375, -1.58856201171875, -1.512969970703125, -1.4373779296875, -1.361785888671875, -1.28619384765625, -1.210601806640625, -1.135009765625, -1.059417724609375, -0.98382568359375, -0.908233642578125, -0.8326416015625, -0.757049560546875, -0.68145751953125, -0.605865478515625, -0.5302734375, -0.454681396484375, -0.37908935546875, -0.303497314453125, -0.2279052734375, -0.152313232421875, -0.07672119140625, -0.001129150390625, 0.074462890625, 0.150054931640625, 0.22564697265625, 0.301239013671875, 0.3768310546875, 0.452423095703125, 0.52801513671875, 0.603607177734375, 0.67919921875, 0.754791259765625, 0.83038330078125, 0.905975341796875, 0.9815673828125, 1.057159423828125, 1.13275146484375, 1.208343505859375, 1.283935546875, 1.359527587890625, 1.43511962890625, 1.510711669921875, 1.5863037109375, 1.661895751953125, 1.73748779296875, 1.813079833984375, 1.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 12.0, 18.0, 22.0, 43.0, 43.0, 91.0, 175.0, 299.0, 618.0, 1163.0, 2252.0, 4801.0, 10004.0, 22454.0, 50934.0, 115490.0, 234311.0, 287268.0, 174021.0, 80062.0, 35054.0, 15427.0, 7091.0, 3458.0, 1629.0, 824.0, 421.0, 220.0, 132.0, 72.0, 57.0, 28.0, 15.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.0546875, -1.0229873657226562, -0.9912872314453125, -0.9595870971679688, -0.927886962890625, -0.8961868286132812, -0.8644866943359375, -0.8327865600585938, -0.80108642578125, -0.7693862915039062, -0.7376861572265625, -0.7059860229492188, -0.674285888671875, -0.6425857543945312, -0.6108856201171875, -0.5791854858398438, -0.5474853515625, -0.5157852172851562, -0.4840850830078125, -0.45238494873046875, -0.420684814453125, -0.38898468017578125, -0.3572845458984375, -0.32558441162109375, -0.29388427734375, -0.26218414306640625, -0.2304840087890625, -0.19878387451171875, -0.167083740234375, -0.13538360595703125, -0.1036834716796875, -0.07198333740234375, -0.040283203125, -0.00858306884765625, 0.0231170654296875, 0.05481719970703125, 0.086517333984375, 0.11821746826171875, 0.1499176025390625, 0.18161773681640625, 0.21331787109375, 0.24501800537109375, 0.2767181396484375, 0.30841827392578125, 0.340118408203125, 0.37181854248046875, 0.4035186767578125, 0.43521881103515625, 0.4669189453125, 0.49861907958984375, 0.5303192138671875, 0.5620193481445312, 0.593719482421875, 0.6254196166992188, 0.6571197509765625, 0.6888198852539062, 0.72052001953125, 0.7522201538085938, 0.7839202880859375, 0.8156204223632812, 0.847320556640625, 0.8790206909179688, 0.9107208251953125, 0.9424209594726562, 0.97412109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 13.0, 13.0, 9.0, 14.0, 13.0, 16.0, 28.0, 24.0, 31.0, 36.0, 43.0, 45.0, 38.0, 41.0, 38.0, 44.0, 1062.0, 47.0, 44.0, 45.0, 40.0, 36.0, 37.0, 31.0, 27.0, 22.0, 30.0, 20.0, 18.0, 15.0, 19.0, 14.0, 18.0, 11.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1650390625, -1.1261138916015625, -1.087188720703125, -1.0482635498046875, -1.00933837890625, -0.9704132080078125, -0.931488037109375, -0.8925628662109375, -0.8536376953125, -0.8147125244140625, -0.775787353515625, -0.7368621826171875, -0.69793701171875, -0.6590118408203125, -0.620086669921875, -0.5811614990234375, -0.542236328125, -0.5033111572265625, -0.464385986328125, -0.4254608154296875, -0.38653564453125, -0.3476104736328125, -0.308685302734375, -0.2697601318359375, -0.2308349609375, -0.1919097900390625, -0.152984619140625, -0.1140594482421875, -0.07513427734375, -0.0362091064453125, 0.002716064453125, 0.0416412353515625, 0.08056640625, 0.1194915771484375, 0.158416748046875, 0.1973419189453125, 0.23626708984375, 0.2751922607421875, 0.314117431640625, 0.3530426025390625, 0.3919677734375, 0.4308929443359375, 0.469818115234375, 0.5087432861328125, 0.54766845703125, 0.5865936279296875, 0.625518798828125, 0.6644439697265625, 0.703369140625, 0.7422943115234375, 0.781219482421875, 0.8201446533203125, 0.85906982421875, 0.8979949951171875, 0.936920166015625, 0.9758453369140625, 1.0147705078125, 1.0536956787109375, 1.092620849609375, 1.1315460205078125, 1.17047119140625, 1.2093963623046875, 1.248321533203125, 1.2872467041015625, 1.326171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 8.0, 9.0, 15.0, 31.0, 49.0, 97.0, 149.0, 224.0, 314.0, 577.0, 838.0, 1389.0, 2334.0, 3769.0, 6003.0, 10328.0, 18782.0, 41056.0, 255919.0, 1597340.0, 94406.0, 27646.0, 14431.0, 8284.0, 5124.0, 3082.0, 1882.0, 1186.0, 731.0, 407.0, 257.0, 176.0, 89.0, 71.0, 47.0, 32.0, 11.0, 16.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.957672119140625, -0.92706298828125, -0.896453857421875, -0.8658447265625, -0.835235595703125, -0.80462646484375, -0.774017333984375, -0.743408203125, -0.712799072265625, -0.68218994140625, -0.651580810546875, -0.6209716796875, -0.590362548828125, -0.55975341796875, -0.529144287109375, -0.49853515625, -0.467926025390625, -0.43731689453125, -0.406707763671875, -0.3760986328125, -0.345489501953125, -0.31488037109375, -0.284271240234375, -0.253662109375, -0.223052978515625, -0.19244384765625, -0.161834716796875, -0.1312255859375, -0.100616455078125, -0.07000732421875, -0.039398193359375, -0.0087890625, 0.021820068359375, 0.05242919921875, 0.083038330078125, 0.1136474609375, 0.144256591796875, 0.17486572265625, 0.205474853515625, 0.236083984375, 0.266693115234375, 0.29730224609375, 0.327911376953125, 0.3585205078125, 0.389129638671875, 0.41973876953125, 0.450347900390625, 0.48095703125, 0.511566162109375, 0.54217529296875, 0.572784423828125, 0.6033935546875, 0.634002685546875, 0.66461181640625, 0.695220947265625, 0.725830078125, 0.756439208984375, 0.78704833984375, 0.817657470703125, 0.8482666015625, 0.878875732421875, 0.90948486328125, 0.940093994140625, 0.970703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 11.0, 11.0, 13.0, 24.0, 32.0, 34.0, 37.0, 48.0, 51.0, 67.0, 87.0, 72.0, 77.0, 73.0, 60.0, 63.0, 41.0, 37.0, 30.0, 22.0, 22.0, 15.0, 11.0, 6.0, 9.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.0738062858581543, -0.0716848373413086, -0.06956338882446289, -0.06744194030761719, -0.06532049179077148, -0.06319904327392578, -0.06107759475708008, -0.058956146240234375, -0.05683469772338867, -0.05471324920654297, -0.052591800689697266, -0.05047035217285156, -0.04834890365600586, -0.046227455139160156, -0.04410600662231445, -0.04198455810546875, -0.03986310958862305, -0.037741661071777344, -0.03562021255493164, -0.03349876403808594, -0.031377315521240234, -0.02925586700439453, -0.027134418487548828, -0.025012969970703125, -0.022891521453857422, -0.02077007293701172, -0.018648624420166016, -0.016527175903320312, -0.01440572738647461, -0.012284278869628906, -0.010162830352783203, -0.0080413818359375, -0.005919933319091797, -0.0037984848022460938, -0.0016770362854003906, 0.0004444122314453125, 0.0025658607482910156, 0.004687309265136719, 0.006808757781982422, 0.008930206298828125, 0.011051654815673828, 0.013173103332519531, 0.015294551849365234, 0.017416000366210938, 0.01953744888305664, 0.021658897399902344, 0.023780345916748047, 0.02590179443359375, 0.028023242950439453, 0.030144691467285156, 0.03226613998413086, 0.03438758850097656, 0.036509037017822266, 0.03863048553466797, 0.04075193405151367, 0.042873382568359375, 0.04499483108520508, 0.04711627960205078, 0.049237728118896484, 0.05135917663574219, 0.05348062515258789, 0.055602073669433594, 0.0577235221862793, 0.059844970703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 9.0, 10.0, 14.0, 22.0, 21.0, 29.0, 45.0, 93.0, 121.0, 268.0, 810.0, 3876.0, 349814.0, 686482.0, 5339.0, 908.0, 282.0, 129.0, 77.0, 51.0, 38.0, 23.0, 18.0, 13.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.144561767578125, -1.10064697265625, -1.056732177734375, -1.0128173828125, -0.968902587890625, -0.92498779296875, -0.881072998046875, -0.837158203125, -0.793243408203125, -0.74932861328125, -0.705413818359375, -0.6614990234375, -0.617584228515625, -0.57366943359375, -0.529754638671875, -0.48583984375, -0.441925048828125, -0.39801025390625, -0.354095458984375, -0.3101806640625, -0.266265869140625, -0.22235107421875, -0.178436279296875, -0.134521484375, -0.090606689453125, -0.04669189453125, -0.002777099609375, 0.0411376953125, 0.085052490234375, 0.12896728515625, 0.172882080078125, 0.216796875, 0.260711669921875, 0.30462646484375, 0.348541259765625, 0.3924560546875, 0.436370849609375, 0.48028564453125, 0.524200439453125, 0.568115234375, 0.612030029296875, 0.65594482421875, 0.699859619140625, 0.7437744140625, 0.787689208984375, 0.83160400390625, 0.875518798828125, 0.91943359375, 0.963348388671875, 1.00726318359375, 1.051177978515625, 1.0950927734375, 1.139007568359375, 1.18292236328125, 1.226837158203125, 1.270751953125, 1.314666748046875, 1.35858154296875, 1.402496337890625, 1.4464111328125, 1.490325927734375, 1.53424072265625, 1.578155517578125, 1.6220703125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 26.0, 91.0, 381.0, 386.0, 83.0, 25.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7072547674179077, -0.6764556169509888, -0.6456565260887146, -0.6148573756217957, -0.5840582251548767, -0.5532591342926025, -0.5224599838256836, -0.49166086316108704, -0.4608617424964905, -0.4300626218318939, -0.399263471364975, -0.3684643507003784, -0.33766523003578186, -0.3068661093711853, -0.27606695890426636, -0.2452678382396698, -0.21446868777275085, -0.1836695522069931, -0.15287043154239655, -0.1220712959766388, -0.09127216786146164, -0.060473039746284485, -0.029673904180526733, 0.0011252164840698242, 0.031924352049827576, 0.06272348016500473, 0.09352260828018188, 0.12432174384593964, 0.1551208794116974, 0.18592000007629395, 0.2167191356420517, 0.24751825630664825, 0.278317391872406, 0.30911651253700256, 0.3399156630039215, 0.37071478366851807, 0.4015139043331146, 0.4323130249977112, 0.4631121754646301, 0.4939112961292267, 0.5247104167938232, 0.5555095672607422, 0.5863086581230164, 0.6171078085899353, 0.6479069590568542, 0.6787060499191284, 0.7095052003860474, 0.7403043508529663, 0.7711035013198853, 0.8019026517868042, 0.8327017426490784, 0.8635008931159973, 0.8943000435829163, 0.9250991344451904, 0.9558982849121094, 0.9866974353790283, 1.0174964666366577, 1.0482956171035767, 1.0790947675704956, 1.109893798828125, 1.140692949295044, 1.171492099761963, 1.2022912502288818, 1.2330904006958008, 1.2638895511627197]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 19.0, 26.0, 23.0, 38.0, 35.0, 48.0, 48.0, 56.0, 67.0, 84.0, 81.0, 72.0, 62.0, 62.0, 57.0, 40.0, 33.0, 30.0, 35.0, 16.0, 20.0, 12.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2954719662666321, -0.2875341475009918, -0.2795962989330292, -0.2716584801673889, -0.26372063159942627, -0.255782812833786, -0.24784497916698456, -0.2399071455001831, -0.23196931183338165, -0.2240314781665802, -0.21609364449977875, -0.2081558108329773, -0.20021799206733704, -0.1922801434993744, -0.18434232473373413, -0.17640449106693268, -0.16846665740013123, -0.16052882373332977, -0.15259099006652832, -0.14465315639972687, -0.13671532273292542, -0.12877750396728516, -0.1208396703004837, -0.11290183663368225, -0.1049640029668808, -0.09702616930007935, -0.0890883356332779, -0.08115050941705704, -0.07321267575025558, -0.06527484208345413, -0.05733701214194298, -0.049399182200431824, -0.04146134853363037, -0.03352351486682892, -0.025585684925317764, -0.01764785312116146, -0.009710021317005157, -0.0017721876502037048, 0.006165642291307449, 0.014103472232818604, 0.022041305899620056, 0.02997913770377636, 0.03791696950793266, 0.04585479944944382, 0.05379263311624527, 0.06173046678304672, 0.06966829299926758, 0.07760612666606903, 0.08554396033287048, 0.09348179399967194, 0.10141962766647339, 0.10935745388269424, 0.1172952875494957, 0.12523311376571655, 0.133170947432518, 0.14110878109931946, 0.1490466147661209, 0.15698444843292236, 0.16492228209972382, 0.17286011576652527, 0.18079793453216553, 0.18873578310012817, 0.19667360186576843, 0.20461143553256989, 0.21254926919937134]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 10.0, 3.0, 9.0, 9.0, 9.0, 12.0, 21.0, 21.0, 32.0, 35.0, 43.0, 51.0, 71.0, 72.0, 63.0, 67.0, 53.0, 65.0, 61.0, 55.0, 54.0, 41.0, 33.0, 31.0, 19.0, 27.0, 16.0, 12.0, 2.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.2890625, -3.2107391357421875, -3.132415771484375, -3.0540924072265625, -2.97576904296875, -2.8974456787109375, -2.819122314453125, -2.7407989501953125, -2.6624755859375, -2.5841522216796875, -2.505828857421875, -2.4275054931640625, -2.34918212890625, -2.2708587646484375, -2.192535400390625, -2.1142120361328125, -2.035888671875, -1.9575653076171875, -1.879241943359375, -1.8009185791015625, -1.72259521484375, -1.6442718505859375, -1.565948486328125, -1.4876251220703125, -1.4093017578125, -1.3309783935546875, -1.252655029296875, -1.1743316650390625, -1.09600830078125, -1.0176849365234375, -0.939361572265625, -0.8610382080078125, -0.78271484375, -0.7043914794921875, -0.626068115234375, -0.5477447509765625, -0.46942138671875, -0.3910980224609375, -0.312774658203125, -0.2344512939453125, -0.1561279296875, -0.0778045654296875, 0.000518798828125, 0.0788421630859375, 0.15716552734375, 0.2354888916015625, 0.313812255859375, 0.3921356201171875, 0.470458984375, 0.5487823486328125, 0.627105712890625, 0.7054290771484375, 0.78375244140625, 0.8620758056640625, 0.940399169921875, 1.0187225341796875, 1.0970458984375, 1.1753692626953125, 1.253692626953125, 1.3320159912109375, 1.41033935546875, 1.4886627197265625, 1.566986083984375, 1.6453094482421875, 1.7236328125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 20.0, 31.0, 35.0, 78.0, 139.0, 181.0, 298.0, 484.0, 829.0, 1380.0, 2692.0, 5606.0, 12208.0, 29577.0, 83819.0, 326402.0, 418860.0, 103477.0, 35188.0, 14056.0, 6204.0, 3064.0, 1639.0, 889.0, 528.0, 300.0, 201.0, 132.0, 95.0, 51.0, 35.0, 26.0, 11.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28515625, -3.18878173828125, -3.0924072265625, -2.99603271484375, -2.899658203125, -2.80328369140625, -2.7069091796875, -2.61053466796875, -2.51416015625, -2.41778564453125, -2.3214111328125, -2.22503662109375, -2.128662109375, -2.03228759765625, -1.9359130859375, -1.83953857421875, -1.7431640625, -1.64678955078125, -1.5504150390625, -1.45404052734375, -1.357666015625, -1.26129150390625, -1.1649169921875, -1.06854248046875, -0.97216796875, -0.87579345703125, -0.7794189453125, -0.68304443359375, -0.586669921875, -0.49029541015625, -0.3939208984375, -0.29754638671875, -0.201171875, -0.10479736328125, -0.0084228515625, 0.08795166015625, 0.184326171875, 0.28070068359375, 0.3770751953125, 0.47344970703125, 0.56982421875, 0.66619873046875, 0.7625732421875, 0.85894775390625, 0.955322265625, 1.05169677734375, 1.1480712890625, 1.24444580078125, 1.3408203125, 1.43719482421875, 1.5335693359375, 1.62994384765625, 1.726318359375, 1.82269287109375, 1.9190673828125, 2.01544189453125, 2.11181640625, 2.20819091796875, 2.3045654296875, 2.40093994140625, 2.497314453125, 2.59368896484375, 2.6900634765625, 2.78643798828125, 2.8828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 15.0, 12.0, 16.0, 26.0, 26.0, 31.0, 35.0, 39.0, 46.0, 57.0, 61.0, 78.0, 150.0, 904.0, 852.0, 160.0, 88.0, 73.0, 74.0, 45.0, 33.0, 27.0, 39.0, 23.0, 22.0, 12.0, 14.0, 15.0, 16.0, 12.0, 6.0, 5.0, 0.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.7216796875, -5.537109375, -5.3525390625, -5.16796875, -4.9833984375, -4.798828125, -4.6142578125, -4.4296875, -4.2451171875, -4.060546875, -3.8759765625, -3.69140625, -3.5068359375, -3.322265625, -3.1376953125, -2.953125, -2.7685546875, -2.583984375, -2.3994140625, -2.21484375, -2.0302734375, -1.845703125, -1.6611328125, -1.4765625, -1.2919921875, -1.107421875, -0.9228515625, -0.73828125, -0.5537109375, -0.369140625, -0.1845703125, 0.0, 0.1845703125, 0.369140625, 0.5537109375, 0.73828125, 0.9228515625, 1.107421875, 1.2919921875, 1.4765625, 1.6611328125, 1.845703125, 2.0302734375, 2.21484375, 2.3994140625, 2.583984375, 2.7685546875, 2.953125, 3.1376953125, 3.322265625, 3.5068359375, 3.69140625, 3.8759765625, 4.060546875, 4.2451171875, 4.4296875, 4.6142578125, 4.798828125, 4.9833984375, 5.16796875, 5.3525390625, 5.537109375, 5.7216796875, 5.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 6.0, 5.0, 13.0, 26.0, 25.0, 36.0, 58.0, 88.0, 93.0, 156.0, 246.0, 492.0, 1474.0, 10531.0, 434833.0, 2670489.0, 23226.0, 2484.0, 588.0, 246.0, 174.0, 112.0, 90.0, 54.0, 34.0, 30.0, 22.0, 22.0, 15.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.681396484375, -15.22216796875, -14.762939453125, -14.3037109375, -13.844482421875, -13.38525390625, -12.926025390625, -12.466796875, -12.007568359375, -11.54833984375, -11.089111328125, -10.6298828125, -10.170654296875, -9.71142578125, -9.252197265625, -8.79296875, -8.333740234375, -7.87451171875, -7.415283203125, -6.9560546875, -6.496826171875, -6.03759765625, -5.578369140625, -5.119140625, -4.659912109375, -4.20068359375, -3.741455078125, -3.2822265625, -2.822998046875, -2.36376953125, -1.904541015625, -1.4453125, -0.986083984375, -0.52685546875, -0.067626953125, 0.3916015625, 0.850830078125, 1.31005859375, 1.769287109375, 2.228515625, 2.687744140625, 3.14697265625, 3.606201171875, 4.0654296875, 4.524658203125, 4.98388671875, 5.443115234375, 5.90234375, 6.361572265625, 6.82080078125, 7.280029296875, 7.7392578125, 8.198486328125, 8.65771484375, 9.116943359375, 9.576171875, 10.035400390625, 10.49462890625, 10.953857421875, 11.4130859375, 11.872314453125, 12.33154296875, 12.790771484375, 13.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 63.0, 809.0, 141.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.6790008544922, -189.33090209960938, -185.98280334472656, -182.63470458984375, -179.28662109375, -175.9385223388672, -172.59042358398438, -169.24232482910156, -165.89422607421875, -162.54612731933594, -159.19802856445312, -155.8499298095703, -152.5018310546875, -149.15374755859375, -145.80564880371094, -142.45755004882812, -139.1094512939453, -135.7613525390625, -132.4132537841797, -129.06515502929688, -125.7170639038086, -122.36896514892578, -119.0208740234375, -115.67277526855469, -112.32467651367188, -108.97657775878906, -105.62847900390625, -102.28038787841797, -98.93228912353516, -95.58419036865234, -92.23609924316406, -88.88800048828125, -85.53990173339844, -82.19180297851562, -78.84370422363281, -75.49561309814453, -72.14751434326172, -68.7994155883789, -65.45132446289062, -62.10322570800781, -58.755126953125, -55.40702819824219, -52.05893325805664, -48.710838317871094, -45.36273956298828, -42.01464080810547, -38.66654586791992, -35.318450927734375, -31.970354080200195, -28.622257232666016, -25.274160385131836, -21.926063537597656, -18.577966690063477, -15.229869842529297, -11.881772994995117, -8.533676147460938, -5.185579299926758, -1.8374824523925781, 1.5106143951416016, 4.858711242675781, 8.206808090209961, 11.55490493774414, 14.90300178527832, 18.2510986328125, 21.59919548034668]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 8.0, 13.0, 16.0, 14.0, 22.0, 18.0, 25.0, 21.0, 37.0, 29.0, 35.0, 35.0, 29.0, 44.0, 31.0, 31.0, 44.0, 50.0, 46.0, 48.0, 44.0, 40.0, 35.0, 36.0, 39.0, 24.0, 29.0, 16.0, 27.0, 22.0, 18.0, 14.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.94007396697998, -15.442998886108398, -14.945924758911133, -14.44884967803955, -13.951775550842285, -13.454700469970703, -12.957626342773438, -12.460551261901855, -11.963476181030273, -11.466401100158691, -10.969326972961426, -10.472251892089844, -9.975177764892578, -9.478102684020996, -8.981027603149414, -8.483953475952148, -7.986879348754883, -7.489804744720459, -6.992730140686035, -6.495655059814453, -5.9985809326171875, -5.5015058517456055, -5.004431247711182, -4.507356643676758, -4.010282039642334, -3.51320743560791, -3.0161328315734863, -2.5190579891204834, -2.0219833850860596, -1.5249087810516357, -1.0278339385986328, -0.530759334564209, -0.03368568420410156, 0.46338897943496704, 0.9604636430740356, 1.457538366317749, 1.9546129703521729, 2.4516875743865967, 2.9487624168395996, 3.4458370208740234, 3.9429116249084473, 4.439986228942871, 4.937060832977295, 5.434135437011719, 5.931210517883301, 6.428284645080566, 6.925359725952148, 7.422434329986572, 7.919508934020996, 8.416584014892578, 8.913658142089844, 9.410733222961426, 9.907807350158691, 10.404882431030273, 10.901956558227539, 11.399031639099121, 11.896106719970703, 12.393181800842285, 12.89025592803955, 13.387331008911133, 13.884405136108398, 14.38148021697998, 14.878555297851562, 15.375629425048828, 15.872703552246094]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 9.0, 6.0, 15.0, 9.0, 16.0, 16.0, 26.0, 33.0, 43.0, 55.0, 43.0, 68.0, 52.0, 42.0, 64.0, 60.0, 66.0, 53.0, 41.0, 51.0, 48.0, 35.0, 41.0, 17.0, 16.0, 16.0, 16.0, 12.0, 13.0, 8.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0], "bins": [-3.373046875, -3.2945098876953125, -3.215972900390625, -3.1374359130859375, -3.05889892578125, -2.9803619384765625, -2.901824951171875, -2.8232879638671875, -2.7447509765625, -2.6662139892578125, -2.587677001953125, -2.5091400146484375, -2.43060302734375, -2.3520660400390625, -2.273529052734375, -2.1949920654296875, -2.116455078125, -2.0379180908203125, -1.959381103515625, -1.8808441162109375, -1.80230712890625, -1.7237701416015625, -1.645233154296875, -1.5666961669921875, -1.4881591796875, -1.4096221923828125, -1.331085205078125, -1.2525482177734375, -1.17401123046875, -1.0954742431640625, -1.016937255859375, -0.9384002685546875, -0.85986328125, -0.7813262939453125, -0.702789306640625, -0.6242523193359375, -0.54571533203125, -0.4671783447265625, -0.388641357421875, -0.3101043701171875, -0.2315673828125, -0.1530303955078125, -0.074493408203125, 0.0040435791015625, 0.08258056640625, 0.1611175537109375, 0.239654541015625, 0.3181915283203125, 0.396728515625, 0.4752655029296875, 0.553802490234375, 0.6323394775390625, 0.71087646484375, 0.7894134521484375, 0.867950439453125, 0.9464874267578125, 1.0250244140625, 1.1035614013671875, 1.182098388671875, 1.2606353759765625, 1.33917236328125, 1.4177093505859375, 1.496246337890625, 1.5747833251953125, 1.6533203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 10.0, 16.0, 25.0, 26.0, 52.0, 66.0, 123.0, 188.0, 416.0, 836.0, 1990.0, 5851.0, 20786.0, 130452.0, 2395873.0, 1526432.0, 87050.0, 16502.0, 4590.0, 1630.0, 626.0, 311.0, 159.0, 85.0, 61.0, 40.0, 25.0, 23.0, 10.0, 8.0, 1.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0], "bins": [-7.67578125, -7.49261474609375, -7.3094482421875, -7.12628173828125, -6.943115234375, -6.75994873046875, -6.5767822265625, -6.39361572265625, -6.21044921875, -6.02728271484375, -5.8441162109375, -5.66094970703125, -5.477783203125, -5.29461669921875, -5.1114501953125, -4.92828369140625, -4.7451171875, -4.56195068359375, -4.3787841796875, -4.19561767578125, -4.012451171875, -3.82928466796875, -3.6461181640625, -3.46295166015625, -3.27978515625, -3.09661865234375, -2.9134521484375, -2.73028564453125, -2.547119140625, -2.36395263671875, -2.1807861328125, -1.99761962890625, -1.814453125, -1.63128662109375, -1.4481201171875, -1.26495361328125, -1.081787109375, -0.89862060546875, -0.7154541015625, -0.53228759765625, -0.34912109375, -0.16595458984375, 0.0172119140625, 0.20037841796875, 0.383544921875, 0.56671142578125, 0.7498779296875, 0.93304443359375, 1.1162109375, 1.29937744140625, 1.4825439453125, 1.66571044921875, 1.848876953125, 2.03204345703125, 2.2152099609375, 2.39837646484375, 2.58154296875, 2.76470947265625, 2.9478759765625, 3.13104248046875, 3.314208984375, 3.49737548828125, 3.6805419921875, 3.86370849609375, 4.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 17.0, 16.0, 35.0, 51.0, 75.0, 83.0, 140.0, 197.0, 337.0, 554.0, 730.0, 646.0, 437.0, 247.0, 163.0, 96.0, 73.0, 47.0, 31.0, 27.0, 17.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27496337890625, -4.1358642578125, -3.99676513671875, -3.857666015625, -3.71856689453125, -3.5794677734375, -3.44036865234375, -3.30126953125, -3.16217041015625, -3.0230712890625, -2.88397216796875, -2.744873046875, -2.60577392578125, -2.4666748046875, -2.32757568359375, -2.1884765625, -2.04937744140625, -1.9102783203125, -1.77117919921875, -1.632080078125, -1.49298095703125, -1.3538818359375, -1.21478271484375, -1.07568359375, -0.93658447265625, -0.7974853515625, -0.65838623046875, -0.519287109375, -0.38018798828125, -0.2410888671875, -0.10198974609375, 0.037109375, 0.17620849609375, 0.3153076171875, 0.45440673828125, 0.593505859375, 0.73260498046875, 0.8717041015625, 1.01080322265625, 1.14990234375, 1.28900146484375, 1.4281005859375, 1.56719970703125, 1.706298828125, 1.84539794921875, 1.9844970703125, 2.12359619140625, 2.2626953125, 2.40179443359375, 2.5408935546875, 2.67999267578125, 2.819091796875, 2.95819091796875, 3.0972900390625, 3.23638916015625, 3.37548828125, 3.51458740234375, 3.6536865234375, 3.79278564453125, 3.931884765625, 4.07098388671875, 4.2100830078125, 4.34918212890625, 4.48828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 10.0, 12.0, 19.0, 26.0, 43.0, 51.0, 77.0, 117.0, 227.0, 595.0, 2928.0, 149001.0, 4012036.0, 26701.0, 1438.0, 436.0, 187.0, 112.0, 85.0, 46.0, 44.0, 29.0, 15.0, 9.0, 14.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.561767578125, -20.87353515625, -20.185302734375, -19.4970703125, -18.808837890625, -18.12060546875, -17.432373046875, -16.744140625, -16.055908203125, -15.36767578125, -14.679443359375, -13.9912109375, -13.302978515625, -12.61474609375, -11.926513671875, -11.23828125, -10.550048828125, -9.86181640625, -9.173583984375, -8.4853515625, -7.797119140625, -7.10888671875, -6.420654296875, -5.732421875, -5.044189453125, -4.35595703125, -3.667724609375, -2.9794921875, -2.291259765625, -1.60302734375, -0.914794921875, -0.2265625, 0.461669921875, 1.14990234375, 1.838134765625, 2.5263671875, 3.214599609375, 3.90283203125, 4.591064453125, 5.279296875, 5.967529296875, 6.65576171875, 7.343994140625, 8.0322265625, 8.720458984375, 9.40869140625, 10.096923828125, 10.78515625, 11.473388671875, 12.16162109375, 12.849853515625, 13.5380859375, 14.226318359375, 14.91455078125, 15.602783203125, 16.291015625, 16.979248046875, 17.66748046875, 18.355712890625, 19.0439453125, 19.732177734375, 20.42041015625, 21.108642578125, 21.796875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 39.0, 101.0, 211.0, 280.0, 210.0, 109.0, 35.0, 10.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.667701721191406, -13.407197952270508, -12.14669418334961, -10.886191368103027, -9.625687599182129, -8.36518383026123, -7.10468053817749, -5.84417724609375, -4.583673477172852, -3.3231699466705322, -2.062666416168213, -0.8021628856658936, 0.4583406448364258, 1.7188444137573242, 2.9793477058410645, 4.239850997924805, 5.500354766845703, 6.760858535766602, 8.0213623046875, 9.281865119934082, 10.54236888885498, 11.802872657775879, 13.063375473022461, 14.32387924194336, 15.584383010864258, 16.844886779785156, 18.105390548706055, 19.365894317626953, 20.62639617919922, 21.88690185546875, 23.147403717041016, 24.407907485961914, 25.668411254882812, 26.92891502380371, 28.18941879272461, 29.449922561645508, 30.710426330566406, 31.970928192138672, 33.2314338684082, 34.49193572998047, 35.75244140625, 37.012943267822266, 38.2734489440918, 39.53395080566406, 40.794456481933594, 42.05495834350586, 43.31546401977539, 44.575965881347656, 45.83646774291992, 47.09696960449219, 48.35747528076172, 49.617977142333984, 50.878482818603516, 52.13898468017578, 53.39949035644531, 54.65999221801758, 55.920494079589844, 57.18099594116211, 58.44150161743164, 59.702003479003906, 60.96250915527344, 62.2230110168457, 63.483516693115234, 64.7440185546875, 66.00452423095703]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 9.0, 13.0, 22.0, 14.0, 15.0, 22.0, 26.0, 22.0, 29.0, 28.0, 34.0, 41.0, 24.0, 48.0, 39.0, 43.0, 41.0, 43.0, 41.0, 61.0, 37.0, 42.0, 45.0, 30.0, 35.0, 35.0, 28.0, 22.0, 27.0, 16.0, 10.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-13.631193161010742, -13.263228416442871, -12.895262718200684, -12.527297973632812, -12.159332275390625, -11.791367530822754, -11.423402786254883, -11.055437088012695, -10.687472343444824, -10.319507598876953, -9.951541900634766, -9.583577156066895, -9.215612411499023, -8.847646713256836, -8.479681968688965, -8.111717224121094, -7.743751525878906, -7.375786304473877, -7.007821083068848, -6.639856338500977, -6.271891117095947, -5.903925895690918, -5.535961151123047, -5.167995929718018, -4.800030708312988, -4.432065486907959, -4.06410026550293, -3.6961355209350586, -3.3281702995300293, -2.960205078125, -2.59224009513855, -2.2242751121520996, -1.856308937072754, -1.4883438348770142, -1.1203787326812744, -0.7524136304855347, -0.3844485282897949, -0.016483426094055176, 0.35148167610168457, 0.7194466590881348, 1.087411880493164, 1.4553769826889038, 1.8233420848846436, 2.1913070678710938, 2.559272289276123, 2.9272375106811523, 3.2952024936676025, 3.6631674766540527, 4.031132698059082, 4.399097919464111, 4.767063140869141, 5.135027885437012, 5.502993106842041, 5.87095832824707, 6.238923072814941, 6.606888294219971, 6.974853515625, 7.342818737030029, 7.710783958435059, 8.07874870300293, 8.446714401245117, 8.814679145812988, 9.18264389038086, 9.550609588623047, 9.918574333190918]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 11.0, 11.0, 12.0, 19.0, 21.0, 24.0, 20.0, 35.0, 47.0, 49.0, 50.0, 65.0, 53.0, 57.0, 67.0, 59.0, 46.0, 50.0, 53.0, 43.0, 31.0, 34.0, 34.0, 16.0, 20.0, 21.0, 13.0, 5.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.36773681640625, -2.2960205078125, -2.22430419921875, -2.152587890625, -2.08087158203125, -2.0091552734375, -1.93743896484375, -1.86572265625, -1.79400634765625, -1.7222900390625, -1.65057373046875, -1.578857421875, -1.50714111328125, -1.4354248046875, -1.36370849609375, -1.2919921875, -1.22027587890625, -1.1485595703125, -1.07684326171875, -1.005126953125, -0.93341064453125, -0.8616943359375, -0.78997802734375, -0.71826171875, -0.64654541015625, -0.5748291015625, -0.50311279296875, -0.431396484375, -0.35968017578125, -0.2879638671875, -0.21624755859375, -0.14453125, -0.07281494140625, -0.0010986328125, 0.07061767578125, 0.142333984375, 0.21405029296875, 0.2857666015625, 0.35748291015625, 0.42919921875, 0.50091552734375, 0.5726318359375, 0.64434814453125, 0.716064453125, 0.78778076171875, 0.8594970703125, 0.93121337890625, 1.0029296875, 1.07464599609375, 1.1463623046875, 1.21807861328125, 1.289794921875, 1.36151123046875, 1.4332275390625, 1.50494384765625, 1.57666015625, 1.64837646484375, 1.7200927734375, 1.79180908203125, 1.863525390625, 1.93524169921875, 2.0069580078125, 2.07867431640625, 2.150390625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 6.0, 23.0, 26.0, 25.0, 58.0, 111.0, 164.0, 349.0, 649.0, 1232.0, 2483.0, 5419.0, 12222.0, 28389.0, 68945.0, 164093.0, 300547.0, 255405.0, 120534.0, 49821.0, 21021.0, 8951.0, 4099.0, 1945.0, 937.0, 465.0, 252.0, 136.0, 82.0, 69.0, 37.0, 17.0, 15.0, 10.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9326858520507812, -0.9058990478515625, -0.8791122436523438, -0.852325439453125, -0.8255386352539062, -0.7987518310546875, -0.7719650268554688, -0.74517822265625, -0.7183914184570312, -0.6916046142578125, -0.6648178100585938, -0.638031005859375, -0.6112442016601562, -0.5844573974609375, -0.5576705932617188, -0.5308837890625, -0.5040969848632812, -0.4773101806640625, -0.45052337646484375, -0.423736572265625, -0.39694976806640625, -0.3701629638671875, -0.34337615966796875, -0.31658935546875, -0.28980255126953125, -0.2630157470703125, -0.23622894287109375, -0.209442138671875, -0.18265533447265625, -0.1558685302734375, -0.12908172607421875, -0.102294921875, -0.07550811767578125, -0.0487213134765625, -0.02193450927734375, 0.004852294921875, 0.03163909912109375, 0.0584259033203125, 0.08521270751953125, 0.11199951171875, 0.13878631591796875, 0.1655731201171875, 0.19235992431640625, 0.219146728515625, 0.24593353271484375, 0.2727203369140625, 0.29950714111328125, 0.3262939453125, 0.35308074951171875, 0.3798675537109375, 0.40665435791015625, 0.433441162109375, 0.46022796630859375, 0.4870147705078125, 0.5138015747070312, 0.54058837890625, 0.5673751831054688, 0.5941619873046875, 0.6209487915039062, 0.647735595703125, 0.6745223999023438, 0.7013092041015625, 0.7280960083007812, 0.7548828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 14.0, 9.0, 26.0, 7.0, 18.0, 27.0, 32.0, 16.0, 31.0, 37.0, 29.0, 38.0, 56.0, 49.0, 42.0, 39.0, 1064.0, 30.0, 59.0, 41.0, 48.0, 35.0, 30.0, 24.0, 32.0, 24.0, 29.0, 15.0, 23.0, 15.0, 20.0, 8.0, 13.0, 7.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.482421875, -1.4412689208984375, -1.400115966796875, -1.3589630126953125, -1.31781005859375, -1.2766571044921875, -1.235504150390625, -1.1943511962890625, -1.1531982421875, -1.1120452880859375, -1.070892333984375, -1.0297393798828125, -0.98858642578125, -0.9474334716796875, -0.906280517578125, -0.8651275634765625, -0.823974609375, -0.7828216552734375, -0.741668701171875, -0.7005157470703125, -0.65936279296875, -0.6182098388671875, -0.577056884765625, -0.5359039306640625, -0.4947509765625, -0.4535980224609375, -0.412445068359375, -0.3712921142578125, -0.33013916015625, -0.2889862060546875, -0.247833251953125, -0.2066802978515625, -0.16552734375, -0.1243743896484375, -0.083221435546875, -0.0420684814453125, -0.00091552734375, 0.0402374267578125, 0.081390380859375, 0.1225433349609375, 0.1636962890625, 0.2048492431640625, 0.246002197265625, 0.2871551513671875, 0.32830810546875, 0.3694610595703125, 0.410614013671875, 0.4517669677734375, 0.492919921875, 0.5340728759765625, 0.575225830078125, 0.6163787841796875, 0.65753173828125, 0.6986846923828125, 0.739837646484375, 0.7809906005859375, 0.8221435546875, 0.8632965087890625, 0.904449462890625, 0.9456024169921875, 0.98675537109375, 1.0279083251953125, 1.069061279296875, 1.1102142333984375, 1.1513671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 18.0, 23.0, 36.0, 43.0, 100.0, 166.0, 264.0, 433.0, 678.0, 1120.0, 1904.0, 3414.0, 6090.0, 11368.0, 21745.0, 61803.0, 1515956.0, 388402.0, 43175.0, 18367.0, 9453.0, 5318.0, 2954.0, 1758.0, 988.0, 620.0, 399.0, 208.0, 129.0, 64.0, 58.0, 28.0, 16.0, 14.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7846145629882812, -0.7542877197265625, -0.7239608764648438, -0.693634033203125, -0.6633071899414062, -0.6329803466796875, -0.6026535034179688, -0.57232666015625, -0.5419998168945312, -0.5116729736328125, -0.48134613037109375, -0.451019287109375, -0.42069244384765625, -0.3903656005859375, -0.36003875732421875, -0.3297119140625, -0.29938507080078125, -0.2690582275390625, -0.23873138427734375, -0.208404541015625, -0.17807769775390625, -0.1477508544921875, -0.11742401123046875, -0.08709716796875, -0.05677032470703125, -0.0264434814453125, 0.00388336181640625, 0.034210205078125, 0.06453704833984375, 0.0948638916015625, 0.12519073486328125, 0.155517578125, 0.18584442138671875, 0.2161712646484375, 0.24649810791015625, 0.276824951171875, 0.30715179443359375, 0.3374786376953125, 0.36780548095703125, 0.39813232421875, 0.42845916748046875, 0.4587860107421875, 0.48911285400390625, 0.519439697265625, 0.5497665405273438, 0.5800933837890625, 0.6104202270507812, 0.6407470703125, 0.6710739135742188, 0.7014007568359375, 0.7317276000976562, 0.762054443359375, 0.7923812866210938, 0.8227081298828125, 0.8530349731445312, 0.88336181640625, 0.9136886596679688, 0.9440155029296875, 0.9743423461914062, 1.004669189453125, 1.0349960327148438, 1.0653228759765625, 1.0956497192382812, 1.1259765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 4.0, 16.0, 23.0, 30.0, 25.0, 39.0, 38.0, 43.0, 53.0, 74.0, 82.0, 84.0, 50.0, 56.0, 70.0, 49.0, 62.0, 36.0, 35.0, 30.0, 23.0, 16.0, 10.0, 7.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034423828125, -0.03293609619140625, -0.0314483642578125, -0.02996063232421875, -0.028472900390625, -0.02698516845703125, -0.0254974365234375, -0.02400970458984375, -0.02252197265625, -0.02103424072265625, -0.0195465087890625, -0.01805877685546875, -0.016571044921875, -0.01508331298828125, -0.0135955810546875, -0.01210784912109375, -0.0106201171875, -0.00913238525390625, -0.0076446533203125, -0.00615692138671875, -0.004669189453125, -0.00318145751953125, -0.0016937255859375, -0.00020599365234375, 0.00128173828125, 0.00276947021484375, 0.0042572021484375, 0.00574493408203125, 0.007232666015625, 0.00872039794921875, 0.0102081298828125, 0.01169586181640625, 0.01318359375, 0.01467132568359375, 0.0161590576171875, 0.01764678955078125, 0.019134521484375, 0.02062225341796875, 0.0221099853515625, 0.02359771728515625, 0.02508544921875, 0.02657318115234375, 0.0280609130859375, 0.02954864501953125, 0.031036376953125, 0.03252410888671875, 0.0340118408203125, 0.03549957275390625, 0.0369873046875, 0.03847503662109375, 0.0399627685546875, 0.04145050048828125, 0.042938232421875, 0.04442596435546875, 0.0459136962890625, 0.04740142822265625, 0.04888916015625, 0.05037689208984375, 0.0518646240234375, 0.05335235595703125, 0.054840087890625, 0.05632781982421875, 0.0578155517578125, 0.05930328369140625, 0.060791015625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 7.0, 5.0, 9.0, 6.0, 18.0, 20.0, 28.0, 34.0, 62.0, 79.0, 132.0, 261.0, 852.0, 34930.0, 999366.0, 11476.0, 636.0, 232.0, 119.0, 82.0, 46.0, 41.0, 27.0, 26.0, 17.0, 13.0, 9.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2457275390625, -1.214111328125, -1.1824951171875, -1.15087890625, -1.1192626953125, -1.087646484375, -1.0560302734375, -1.0244140625, -0.9927978515625, -0.961181640625, -0.9295654296875, -0.89794921875, -0.8663330078125, -0.834716796875, -0.8031005859375, -0.771484375, -0.7398681640625, -0.708251953125, -0.6766357421875, -0.64501953125, -0.6134033203125, -0.581787109375, -0.5501708984375, -0.5185546875, -0.4869384765625, -0.455322265625, -0.4237060546875, -0.39208984375, -0.3604736328125, -0.328857421875, -0.2972412109375, -0.265625, -0.2340087890625, -0.202392578125, -0.1707763671875, -0.13916015625, -0.1075439453125, -0.075927734375, -0.0443115234375, -0.0126953125, 0.0189208984375, 0.050537109375, 0.0821533203125, 0.11376953125, 0.1453857421875, 0.177001953125, 0.2086181640625, 0.240234375, 0.2718505859375, 0.303466796875, 0.3350830078125, 0.36669921875, 0.3983154296875, 0.429931640625, 0.4615478515625, 0.4931640625, 0.5247802734375, 0.556396484375, 0.5880126953125, 0.61962890625, 0.6512451171875, 0.682861328125, 0.7144775390625, 0.74609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 43.0, 125.0, 267.0, 310.0, 160.0, 61.0, 23.0, 6.0, 1.0, 0.0, 2.0], "bins": [-0.5731314420700073, -0.5629009008407593, -0.5526703000068665, -0.5424397587776184, -0.5322091579437256, -0.5219786167144775, -0.5117480754852295, -0.5015174746513367, -0.49128690361976624, -0.4810563325881958, -0.47082576155662537, -0.46059519052505493, -0.4503646492958069, -0.44013407826423645, -0.429903507232666, -0.4196729362010956, -0.40944236516952515, -0.3992117941379547, -0.3889812231063843, -0.37875068187713623, -0.3685201108455658, -0.35828953981399536, -0.3480589687824249, -0.3378283977508545, -0.32759785652160645, -0.317367285490036, -0.3071367144584656, -0.29690617322921753, -0.2866756021976471, -0.27644503116607666, -0.2662144601345062, -0.2559838891029358, -0.24575331807136536, -0.23552274703979492, -0.22529219090938568, -0.21506161987781525, -0.2048310488462448, -0.19460049271583557, -0.18436992168426514, -0.1741393506526947, -0.16390877962112427, -0.15367820858955383, -0.1434476524591446, -0.13321708142757416, -0.12298651039600372, -0.11275594681501389, -0.10252538323402405, -0.09229481220245361, -0.08206425607204437, -0.07183369249105453, -0.0616031214594841, -0.05137255787849426, -0.04114199057221413, -0.03091142326593399, -0.020680859684944153, -0.010450288653373718, -0.00021972507238388062, 0.010010841302573681, 0.020241407677531242, 0.03047197312116623, 0.040702540427446365, 0.0509331077337265, 0.06116367131471634, 0.07139424234628677, 0.08162480592727661]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 8.0, 8.0, 6.0, 8.0, 26.0, 20.0, 37.0, 45.0, 40.0, 45.0, 52.0, 59.0, 60.0, 61.0, 66.0, 86.0, 57.0, 55.0, 47.0, 46.0, 49.0, 34.0, 17.0, 24.0, 20.0, 6.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07222437858581543, -0.0683198943734169, -0.06441541016101837, -0.060510922223329544, -0.056606438010931015, -0.052701953798532486, -0.04879746586084366, -0.04489298164844513, -0.0409884974360466, -0.03708401322364807, -0.03317952901124954, -0.029275041073560715, -0.025370556861162186, -0.021466072648763657, -0.01756158657371998, -0.0136571004986763, -0.009752616286277771, -0.005848131142556667, -0.0019436459988355637, 0.00196083914488554, 0.005865324288606644, 0.009769808501005173, 0.013674294576048851, 0.01757878065109253, 0.02148326486349106, 0.025387749075889587, 0.029292235150933266, 0.033196721225976944, 0.03710120543837547, 0.041005689650774, 0.04491017758846283, 0.04881466180086136, 0.05271914601325989, 0.05662363022565842, 0.060528114438056946, 0.06443259865045547, 0.068337082862854, 0.07224157452583313, 0.07614605873823166, 0.08005054295063019, 0.08395502716302872, 0.08785951137542725, 0.09176399558782578, 0.0956684798002243, 0.09957297146320343, 0.10347744822502136, 0.10738193988800049, 0.11128642410039902, 0.11519090831279755, 0.11909539252519608, 0.1229998767375946, 0.12690436840057373, 0.13080884516239166, 0.1347133368253708, 0.13861781358718872, 0.14252230525016785, 0.14642679691314697, 0.1503312885761261, 0.15423576533794403, 0.15814025700092316, 0.1620447337627411, 0.16594922542572021, 0.16985370218753815, 0.17375819385051727, 0.1776626706123352]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 17.0, 15.0, 15.0, 26.0, 31.0, 32.0, 42.0, 51.0, 55.0, 49.0, 45.0, 68.0, 55.0, 63.0, 67.0, 42.0, 56.0, 39.0, 38.0, 39.0, 21.0, 29.0, 22.0, 23.0, 15.0, 12.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.591400146484375, -2.51678466796875, -2.442169189453125, -2.3675537109375, -2.292938232421875, -2.21832275390625, -2.143707275390625, -2.069091796875, -1.994476318359375, -1.91986083984375, -1.845245361328125, -1.7706298828125, -1.696014404296875, -1.62139892578125, -1.546783447265625, -1.47216796875, -1.397552490234375, -1.32293701171875, -1.248321533203125, -1.1737060546875, -1.099090576171875, -1.02447509765625, -0.949859619140625, -0.875244140625, -0.800628662109375, -0.72601318359375, -0.651397705078125, -0.5767822265625, -0.502166748046875, -0.42755126953125, -0.352935791015625, -0.2783203125, -0.203704833984375, -0.12908935546875, -0.054473876953125, 0.0201416015625, 0.094757080078125, 0.16937255859375, 0.243988037109375, 0.318603515625, 0.393218994140625, 0.46783447265625, 0.542449951171875, 0.6170654296875, 0.691680908203125, 0.76629638671875, 0.840911865234375, 0.91552734375, 0.990142822265625, 1.06475830078125, 1.139373779296875, 1.2139892578125, 1.288604736328125, 1.36322021484375, 1.437835693359375, 1.512451171875, 1.587066650390625, 1.66168212890625, 1.736297607421875, 1.8109130859375, 1.885528564453125, 1.96014404296875, 2.034759521484375, 2.109375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 12.0, 11.0, 23.0, 37.0, 28.0, 38.0, 60.0, 61.0, 107.0, 148.0, 221.0, 359.0, 484.0, 847.0, 1361.0, 2833.0, 6194.0, 16249.0, 54168.0, 288776.0, 537241.0, 96861.0, 24988.0, 8922.0, 3728.0, 1890.0, 1015.0, 585.0, 376.0, 266.0, 180.0, 128.0, 85.0, 72.0, 45.0, 29.0, 37.0, 14.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.525390625, -3.412384033203125, -3.29937744140625, -3.186370849609375, -3.0733642578125, -2.960357666015625, -2.84735107421875, -2.734344482421875, -2.621337890625, -2.508331298828125, -2.39532470703125, -2.282318115234375, -2.1693115234375, -2.056304931640625, -1.94329833984375, -1.830291748046875, -1.71728515625, -1.604278564453125, -1.49127197265625, -1.378265380859375, -1.2652587890625, -1.152252197265625, -1.03924560546875, -0.926239013671875, -0.813232421875, -0.700225830078125, -0.58721923828125, -0.474212646484375, -0.3612060546875, -0.248199462890625, -0.13519287109375, -0.022186279296875, 0.0908203125, 0.203826904296875, 0.31683349609375, 0.429840087890625, 0.5428466796875, 0.655853271484375, 0.76885986328125, 0.881866455078125, 0.994873046875, 1.107879638671875, 1.22088623046875, 1.333892822265625, 1.4468994140625, 1.559906005859375, 1.67291259765625, 1.785919189453125, 1.89892578125, 2.011932373046875, 2.12493896484375, 2.237945556640625, 2.3509521484375, 2.463958740234375, 2.57696533203125, 2.689971923828125, 2.802978515625, 2.915985107421875, 3.02899169921875, 3.141998291015625, 3.2550048828125, 3.368011474609375, 3.48101806640625, 3.594024658203125, 3.70703125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 6.0, 13.0, 12.0, 18.0, 17.0, 20.0, 21.0, 28.0, 29.0, 35.0, 53.0, 45.0, 48.0, 62.0, 84.0, 178.0, 1419.0, 339.0, 136.0, 98.0, 51.0, 54.0, 33.0, 43.0, 38.0, 24.0, 21.0, 23.0, 14.0, 14.0, 6.0, 12.0, 6.0, 7.0, 5.0, 10.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.90765380859375, -5.7098388671875, -5.51202392578125, -5.314208984375, -5.11639404296875, -4.9185791015625, -4.72076416015625, -4.52294921875, -4.32513427734375, -4.1273193359375, -3.92950439453125, -3.731689453125, -3.53387451171875, -3.3360595703125, -3.13824462890625, -2.9404296875, -2.74261474609375, -2.5447998046875, -2.34698486328125, -2.149169921875, -1.95135498046875, -1.7535400390625, -1.55572509765625, -1.35791015625, -1.16009521484375, -0.9622802734375, -0.76446533203125, -0.566650390625, -0.36883544921875, -0.1710205078125, 0.02679443359375, 0.224609375, 0.42242431640625, 0.6202392578125, 0.81805419921875, 1.015869140625, 1.21368408203125, 1.4114990234375, 1.60931396484375, 1.80712890625, 2.00494384765625, 2.2027587890625, 2.40057373046875, 2.598388671875, 2.79620361328125, 2.9940185546875, 3.19183349609375, 3.3896484375, 3.58746337890625, 3.7852783203125, 3.98309326171875, 4.180908203125, 4.37872314453125, 4.5765380859375, 4.77435302734375, 4.97216796875, 5.16998291015625, 5.3677978515625, 5.56561279296875, 5.763427734375, 5.96124267578125, 6.1590576171875, 6.35687255859375, 6.5546875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 8.0, 8.0, 10.0, 10.0, 6.0, 23.0, 19.0, 22.0, 30.0, 52.0, 57.0, 76.0, 140.0, 205.0, 445.0, 1194.0, 4870.0, 48421.0, 2905449.0, 172375.0, 9018.0, 1824.0, 616.0, 273.0, 162.0, 100.0, 62.0, 51.0, 34.0, 27.0, 30.0, 20.0, 19.0, 9.0, 8.0, 8.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.4453125, -14.999755859375, -14.55419921875, -14.108642578125, -13.6630859375, -13.217529296875, -12.77197265625, -12.326416015625, -11.880859375, -11.435302734375, -10.98974609375, -10.544189453125, -10.0986328125, -9.653076171875, -9.20751953125, -8.761962890625, -8.31640625, -7.870849609375, -7.42529296875, -6.979736328125, -6.5341796875, -6.088623046875, -5.64306640625, -5.197509765625, -4.751953125, -4.306396484375, -3.86083984375, -3.415283203125, -2.9697265625, -2.524169921875, -2.07861328125, -1.633056640625, -1.1875, -0.741943359375, -0.29638671875, 0.149169921875, 0.5947265625, 1.040283203125, 1.48583984375, 1.931396484375, 2.376953125, 2.822509765625, 3.26806640625, 3.713623046875, 4.1591796875, 4.604736328125, 5.05029296875, 5.495849609375, 5.94140625, 6.386962890625, 6.83251953125, 7.278076171875, 7.7236328125, 8.169189453125, 8.61474609375, 9.060302734375, 9.505859375, 9.951416015625, 10.39697265625, 10.842529296875, 11.2880859375, 11.733642578125, 12.17919921875, 12.624755859375, 13.0703125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 20.0, 588.0, 399.0, 14.0], "bins": [-184.0859832763672, -181.1138916015625, -178.1417999267578, -175.16970825195312, -172.19761657714844, -169.22552490234375, -166.25343322753906, -163.28134155273438, -160.3092498779297, -157.337158203125, -154.3650665283203, -151.39297485351562, -148.42088317871094, -145.44879150390625, -142.47669982910156, -139.50460815429688, -136.53250122070312, -133.56040954589844, -130.58831787109375, -127.61622619628906, -124.64413452148438, -121.67204284667969, -118.699951171875, -115.72785186767578, -112.75576782226562, -109.78367614746094, -106.81158447265625, -103.83949279785156, -100.86740112304688, -97.89530944824219, -94.9232177734375, -91.95111846923828, -88.9790267944336, -86.0069351196289, -83.03484344482422, -80.06275177001953, -77.09066009521484, -74.11856079101562, -71.14646911621094, -68.17437744140625, -65.20228576660156, -62.230194091796875, -59.25810241699219, -56.2860107421875, -53.31391525268555, -50.34182357788086, -47.36973190307617, -44.39763641357422, -41.4255485534668, -38.45345687866211, -35.48136520385742, -32.50926971435547, -29.53717803955078, -26.565086364746094, -23.592994689941406, -20.620901107788086, -17.6488094329834, -14.676716804504395, -11.70462417602539, -8.732532501220703, -5.760439872741699, -2.7883472442626953, 0.1837444305419922, 3.1558380126953125, 6.127929210662842]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 12.0, 2.0, 14.0, 12.0, 11.0, 12.0, 14.0, 17.0, 25.0, 34.0, 35.0, 41.0, 32.0, 23.0, 35.0, 48.0, 39.0, 44.0, 34.0, 44.0, 41.0, 38.0, 43.0, 33.0, 35.0, 34.0, 30.0, 33.0, 27.0, 19.0, 20.0, 19.0, 11.0, 14.0, 12.0, 8.0, 8.0, 8.0, 10.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.396547317504883, -17.863195419311523, -17.329843521118164, -16.796491622924805, -16.263139724731445, -15.729787826538086, -15.196435928344727, -14.663084030151367, -14.129732131958008, -13.596380233764648, -13.063028335571289, -12.52967643737793, -11.99632453918457, -11.462972640991211, -10.929620742797852, -10.396268844604492, -9.86291790008545, -9.32956600189209, -8.79621410369873, -8.262862205505371, -7.729510307312012, -7.196158409118652, -6.662806987762451, -6.129455089569092, -5.596103191375732, -5.062751293182373, -4.529399394989014, -3.9960477352142334, -3.462695837020874, -2.9293439388275146, -2.3959922790527344, -1.862640380859375, -1.3292875289916992, -0.7959356904029846, -0.26258385181427, 0.2707679271697998, 0.8041198253631592, 1.3374717235565186, 1.8708233833312988, 2.404175281524658, 2.9375271797180176, 3.470879077911377, 4.004230976104736, 4.5375823974609375, 5.070934295654297, 5.604286193847656, 6.137638092041016, 6.670989990234375, 7.204341888427734, 7.737693786621094, 8.271045684814453, 8.804397583007812, 9.337749481201172, 9.871101379394531, 10.40445327758789, 10.93780517578125, 11.47115707397461, 12.004508972167969, 12.537860870361328, 13.071212768554688, 13.604564666748047, 14.137916564941406, 14.671268463134766, 15.204620361328125, 15.737971305847168]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 4.0, 11.0, 11.0, 9.0, 14.0, 15.0, 23.0, 28.0, 28.0, 35.0, 48.0, 43.0, 43.0, 48.0, 51.0, 46.0, 39.0, 64.0, 59.0, 48.0, 47.0, 35.0, 50.0, 25.0, 38.0, 23.0, 23.0, 17.0, 18.0, 10.0, 7.0, 13.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.580078125, -2.50921630859375, -2.4383544921875, -2.36749267578125, -2.296630859375, -2.22576904296875, -2.1549072265625, -2.08404541015625, -2.01318359375, -1.94232177734375, -1.8714599609375, -1.80059814453125, -1.729736328125, -1.65887451171875, -1.5880126953125, -1.51715087890625, -1.4462890625, -1.37542724609375, -1.3045654296875, -1.23370361328125, -1.162841796875, -1.09197998046875, -1.0211181640625, -0.95025634765625, -0.87939453125, -0.80853271484375, -0.7376708984375, -0.66680908203125, -0.595947265625, -0.52508544921875, -0.4542236328125, -0.38336181640625, -0.3125, -0.24163818359375, -0.1707763671875, -0.09991455078125, -0.029052734375, 0.04180908203125, 0.1126708984375, 0.18353271484375, 0.25439453125, 0.32525634765625, 0.3961181640625, 0.46697998046875, 0.537841796875, 0.60870361328125, 0.6795654296875, 0.75042724609375, 0.8212890625, 0.89215087890625, 0.9630126953125, 1.03387451171875, 1.104736328125, 1.17559814453125, 1.2464599609375, 1.31732177734375, 1.38818359375, 1.45904541015625, 1.5299072265625, 1.60076904296875, 1.671630859375, 1.74249267578125, 1.8133544921875, 1.88421630859375, 1.955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 7.0, 24.0, 21.0, 30.0, 45.0, 60.0, 79.0, 136.0, 194.0, 392.0, 575.0, 1015.0, 1901.0, 3472.0, 6757.0, 15029.0, 38874.0, 147989.0, 880100.0, 2235993.0, 678775.0, 119492.0, 35011.0, 13941.0, 6583.0, 3398.0, 1777.0, 1027.0, 579.0, 372.0, 224.0, 117.0, 93.0, 49.0, 35.0, 32.0, 17.0, 8.0, 10.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.65625, -3.54351806640625, -3.4307861328125, -3.31805419921875, -3.205322265625, -3.09259033203125, -2.9798583984375, -2.86712646484375, -2.75439453125, -2.64166259765625, -2.5289306640625, -2.41619873046875, -2.303466796875, -2.19073486328125, -2.0780029296875, -1.96527099609375, -1.8525390625, -1.73980712890625, -1.6270751953125, -1.51434326171875, -1.401611328125, -1.28887939453125, -1.1761474609375, -1.06341552734375, -0.95068359375, -0.83795166015625, -0.7252197265625, -0.61248779296875, -0.499755859375, -0.38702392578125, -0.2742919921875, -0.16156005859375, -0.048828125, 0.06390380859375, 0.1766357421875, 0.28936767578125, 0.402099609375, 0.51483154296875, 0.6275634765625, 0.74029541015625, 0.85302734375, 0.96575927734375, 1.0784912109375, 1.19122314453125, 1.303955078125, 1.41668701171875, 1.5294189453125, 1.64215087890625, 1.7548828125, 1.86761474609375, 1.9803466796875, 2.09307861328125, 2.205810546875, 2.31854248046875, 2.4312744140625, 2.54400634765625, 2.65673828125, 2.76947021484375, 2.8822021484375, 2.99493408203125, 3.107666015625, 3.22039794921875, 3.3331298828125, 3.44586181640625, 3.55859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 6.0, 11.0, 9.0, 10.0, 20.0, 28.0, 25.0, 43.0, 52.0, 69.0, 115.0, 188.0, 280.0, 477.0, 547.0, 671.0, 466.0, 345.0, 228.0, 145.0, 110.0, 67.0, 51.0, 37.0, 18.0, 19.0, 9.0, 6.0, 8.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.09002685546875, -4.9495849609375, -4.80914306640625, -4.668701171875, -4.52825927734375, -4.3878173828125, -4.24737548828125, -4.10693359375, -3.96649169921875, -3.8260498046875, -3.68560791015625, -3.545166015625, -3.40472412109375, -3.2642822265625, -3.12384033203125, -2.9833984375, -2.84295654296875, -2.7025146484375, -2.56207275390625, -2.421630859375, -2.28118896484375, -2.1407470703125, -2.00030517578125, -1.85986328125, -1.71942138671875, -1.5789794921875, -1.43853759765625, -1.298095703125, -1.15765380859375, -1.0172119140625, -0.87677001953125, -0.736328125, -0.59588623046875, -0.4554443359375, -0.31500244140625, -0.174560546875, -0.03411865234375, 0.1063232421875, 0.24676513671875, 0.38720703125, 0.52764892578125, 0.6680908203125, 0.80853271484375, 0.948974609375, 1.08941650390625, 1.2298583984375, 1.37030029296875, 1.5107421875, 1.65118408203125, 1.7916259765625, 1.93206787109375, 2.072509765625, 2.21295166015625, 2.3533935546875, 2.49383544921875, 2.63427734375, 2.77471923828125, 2.9151611328125, 3.05560302734375, 3.196044921875, 3.33648681640625, 3.4769287109375, 3.61737060546875, 3.7578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 3.0, 7.0, 9.0, 14.0, 18.0, 35.0, 52.0, 85.0, 131.0, 243.0, 410.0, 985.0, 3506.0, 39736.0, 3447626.0, 682043.0, 15607.0, 2217.0, 713.0, 358.0, 184.0, 79.0, 62.0, 43.0, 27.0, 26.0, 15.0, 10.0, 17.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.0345458984375, -12.530029296875, -12.0255126953125, -11.52099609375, -11.0164794921875, -10.511962890625, -10.0074462890625, -9.5029296875, -8.9984130859375, -8.493896484375, -7.9893798828125, -7.48486328125, -6.9803466796875, -6.475830078125, -5.9713134765625, -5.466796875, -4.9622802734375, -4.457763671875, -3.9532470703125, -3.44873046875, -2.9442138671875, -2.439697265625, -1.9351806640625, -1.4306640625, -0.9261474609375, -0.421630859375, 0.0828857421875, 0.58740234375, 1.0919189453125, 1.596435546875, 2.1009521484375, 2.60546875, 3.1099853515625, 3.614501953125, 4.1190185546875, 4.62353515625, 5.1280517578125, 5.632568359375, 6.1370849609375, 6.6416015625, 7.1461181640625, 7.650634765625, 8.1551513671875, 8.65966796875, 9.1641845703125, 9.668701171875, 10.1732177734375, 10.677734375, 11.1822509765625, 11.686767578125, 12.1912841796875, 12.69580078125, 13.2003173828125, 13.704833984375, 14.2093505859375, 14.7138671875, 15.2183837890625, 15.722900390625, 16.2274169921875, 16.73193359375, 17.2364501953125, 17.740966796875, 18.2454833984375, 18.75]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 134.0, 505.0, 309.0, 49.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.03105926513672, -70.08778381347656, -67.1445083618164, -64.20122528076172, -61.25794982910156, -58.314674377441406, -55.37139892578125, -52.42811965942383, -49.484840393066406, -46.54156494140625, -43.59828567504883, -40.65501022338867, -37.71173095703125, -34.768455505371094, -31.825178146362305, -28.881900787353516, -25.93862533569336, -22.99534797668457, -20.05207061767578, -17.108795166015625, -14.16551685333252, -11.22223949432373, -8.278963088989258, -5.335685729980469, -2.3924083709716797, 0.5508687496185303, 3.4941458702087402, 6.437422752380371, 9.38070011138916, 12.32397747039795, 15.267253875732422, 18.21053123474121, 21.15380859375, 24.09708595275879, 27.040363311767578, 29.983638763427734, 32.926918029785156, 35.87019348144531, 38.81346893310547, 41.75674819946289, 44.70002746582031, 47.64330291748047, 50.58658218383789, 53.52985763549805, 56.47313690185547, 59.416412353515625, 62.35968780517578, 65.30296325683594, 68.24624633789062, 71.18952178955078, 74.13279724121094, 77.07608032226562, 80.01935577392578, 82.96263122558594, 85.9059066772461, 88.84918212890625, 91.7924575805664, 94.73573303222656, 97.67900848388672, 100.6222915649414, 103.56556701660156, 106.50884246826172, 109.45211791992188, 112.39540100097656, 115.33867645263672]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 11.0, 15.0, 20.0, 28.0, 24.0, 24.0, 31.0, 36.0, 36.0, 48.0, 40.0, 44.0, 56.0, 54.0, 45.0, 44.0, 50.0, 47.0, 35.0, 39.0, 28.0, 33.0, 25.0, 21.0, 22.0, 20.0, 25.0, 19.0, 14.0, 7.0, 5.0, 6.0, 9.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.346147537231445, -13.881064414978027, -13.415982246398926, -12.950899124145508, -12.485816955566406, -12.020733833312988, -11.55565071105957, -11.090568542480469, -10.62548542022705, -10.160402297973633, -9.695320129394531, -9.230237007141113, -8.765154838562012, -8.300071716308594, -7.834989070892334, -7.369906425476074, -6.9048237800598145, -6.439741134643555, -5.974658489227295, -5.509575843811035, -5.044492721557617, -4.579410076141357, -4.114327430725098, -3.649244546890259, -3.184161901473999, -2.7190792560577393, -2.2539963722229004, -1.7889137268066406, -1.3238309621810913, -0.858748197555542, -0.3936655521392822, 0.07141733169555664, 0.5364999771118164, 1.0015827417373657, 1.466665506362915, 1.9317481517791748, 2.3968310356140137, 2.8619136810302734, 3.326996326446533, 3.792079210281372, 4.257162094116211, 4.722244739532471, 5.1873273849487305, 5.652410507202148, 6.117493152618408, 6.582575798034668, 7.047658443450928, 7.5127410888671875, 7.977823734283447, 8.442906379699707, 8.907989501953125, 9.373071670532227, 9.838154792785645, 10.303237915039062, 10.768320083618164, 11.233403205871582, 11.698485374450684, 12.163568496704102, 12.628650665283203, 13.093733787536621, 13.558815956115723, 14.02389907836914, 14.488981246948242, 14.95406436920166, 15.419147491455078]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 3.0, 11.0, 10.0, 19.0, 23.0, 24.0, 28.0, 32.0, 43.0, 34.0, 31.0, 55.0, 57.0, 45.0, 45.0, 48.0, 45.0, 53.0, 52.0, 42.0, 45.0, 44.0, 38.0, 32.0, 18.0, 21.0, 20.0, 19.0, 15.0, 12.0, 3.0, 9.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.283203125, -2.2167510986328125, -2.150299072265625, -2.0838470458984375, -2.01739501953125, -1.9509429931640625, -1.884490966796875, -1.8180389404296875, -1.7515869140625, -1.6851348876953125, -1.618682861328125, -1.5522308349609375, -1.48577880859375, -1.4193267822265625, -1.352874755859375, -1.2864227294921875, -1.219970703125, -1.1535186767578125, -1.087066650390625, -1.0206146240234375, -0.95416259765625, -0.8877105712890625, -0.821258544921875, -0.7548065185546875, -0.6883544921875, -0.6219024658203125, -0.555450439453125, -0.4889984130859375, -0.42254638671875, -0.3560943603515625, -0.289642333984375, -0.2231903076171875, -0.15673828125, -0.0902862548828125, -0.023834228515625, 0.0426177978515625, 0.10906982421875, 0.1755218505859375, 0.241973876953125, 0.3084259033203125, 0.3748779296875, 0.4413299560546875, 0.507781982421875, 0.5742340087890625, 0.64068603515625, 0.7071380615234375, 0.773590087890625, 0.8400421142578125, 0.906494140625, 0.9729461669921875, 1.039398193359375, 1.1058502197265625, 1.17230224609375, 1.2387542724609375, 1.305206298828125, 1.3716583251953125, 1.4381103515625, 1.5045623779296875, 1.571014404296875, 1.6374664306640625, 1.70391845703125, 1.7703704833984375, 1.836822509765625, 1.9032745361328125, 1.9697265625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 14.0, 24.0, 20.0, 48.0, 68.0, 95.0, 164.0, 252.0, 341.0, 566.0, 1047.0, 1789.0, 3448.0, 7591.0, 18301.0, 49854.0, 140064.0, 307045.0, 300560.0, 135612.0, 48695.0, 17853.0, 7414.0, 3364.0, 1691.0, 989.0, 614.0, 362.0, 233.0, 139.0, 101.0, 74.0, 42.0, 20.0, 14.0, 14.0, 11.0, 9.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330078125, -0.806121826171875, -0.77923583984375, -0.752349853515625, -0.7254638671875, -0.698577880859375, -0.67169189453125, -0.644805908203125, -0.617919921875, -0.591033935546875, -0.56414794921875, -0.537261962890625, -0.5103759765625, -0.483489990234375, -0.45660400390625, -0.429718017578125, -0.40283203125, -0.375946044921875, -0.34906005859375, -0.322174072265625, -0.2952880859375, -0.268402099609375, -0.24151611328125, -0.214630126953125, -0.187744140625, -0.160858154296875, -0.13397216796875, -0.107086181640625, -0.0802001953125, -0.053314208984375, -0.02642822265625, 0.000457763671875, 0.02734375, 0.054229736328125, 0.08111572265625, 0.108001708984375, 0.1348876953125, 0.161773681640625, 0.18865966796875, 0.215545654296875, 0.242431640625, 0.269317626953125, 0.29620361328125, 0.323089599609375, 0.3499755859375, 0.376861572265625, 0.40374755859375, 0.430633544921875, 0.45751953125, 0.484405517578125, 0.51129150390625, 0.538177490234375, 0.5650634765625, 0.591949462890625, 0.61883544921875, 0.645721435546875, 0.672607421875, 0.699493408203125, 0.72637939453125, 0.753265380859375, 0.7801513671875, 0.807037353515625, 0.83392333984375, 0.860809326171875, 0.8876953125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 6.0, 14.0, 9.0, 12.0, 16.0, 24.0, 11.0, 22.0, 25.0, 24.0, 24.0, 35.0, 34.0, 25.0, 25.0, 35.0, 36.0, 36.0, 17.0, 1068.0, 30.0, 42.0, 32.0, 25.0, 30.0, 29.0, 32.0, 36.0, 34.0, 27.0, 24.0, 13.0, 20.0, 22.0, 11.0, 12.0, 9.0, 7.0, 14.0, 10.0, 12.0, 9.0, 9.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.1884765625, -1.15313720703125, -1.1177978515625, -1.08245849609375, -1.047119140625, -1.01177978515625, -0.9764404296875, -0.94110107421875, -0.90576171875, -0.87042236328125, -0.8350830078125, -0.79974365234375, -0.764404296875, -0.72906494140625, -0.6937255859375, -0.65838623046875, -0.623046875, -0.58770751953125, -0.5523681640625, -0.51702880859375, -0.481689453125, -0.44635009765625, -0.4110107421875, -0.37567138671875, -0.34033203125, -0.30499267578125, -0.2696533203125, -0.23431396484375, -0.198974609375, -0.16363525390625, -0.1282958984375, -0.09295654296875, -0.0576171875, -0.02227783203125, 0.0130615234375, 0.04840087890625, 0.083740234375, 0.11907958984375, 0.1544189453125, 0.18975830078125, 0.22509765625, 0.26043701171875, 0.2957763671875, 0.33111572265625, 0.366455078125, 0.40179443359375, 0.4371337890625, 0.47247314453125, 0.5078125, 0.54315185546875, 0.5784912109375, 0.61383056640625, 0.649169921875, 0.68450927734375, 0.7198486328125, 0.75518798828125, 0.79052734375, 0.82586669921875, 0.8612060546875, 0.89654541015625, 0.931884765625, 0.96722412109375, 1.0025634765625, 1.03790283203125, 1.0732421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 16.0, 23.0, 38.0, 63.0, 95.0, 161.0, 203.0, 404.0, 678.0, 1194.0, 2089.0, 3746.0, 7316.0, 14046.0, 29670.0, 134407.0, 1742614.0, 105161.0, 27167.0, 12794.0, 6796.0, 3613.0, 2006.0, 1138.0, 666.0, 375.0, 241.0, 157.0, 75.0, 59.0, 39.0, 17.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.99658203125, -0.9684677124023438, -0.9403533935546875, -0.9122390747070312, -0.884124755859375, -0.8560104370117188, -0.8278961181640625, -0.7997817993164062, -0.77166748046875, -0.7435531616210938, -0.7154388427734375, -0.6873245239257812, -0.659210205078125, -0.6310958862304688, -0.6029815673828125, -0.5748672485351562, -0.5467529296875, -0.5186386108398438, -0.4905242919921875, -0.46240997314453125, -0.434295654296875, -0.40618133544921875, -0.3780670166015625, -0.34995269775390625, -0.32183837890625, -0.29372406005859375, -0.2656097412109375, -0.23749542236328125, -0.209381103515625, -0.18126678466796875, -0.1531524658203125, -0.12503814697265625, -0.096923828125, -0.06880950927734375, -0.0406951904296875, -0.01258087158203125, 0.015533447265625, 0.04364776611328125, 0.0717620849609375, 0.09987640380859375, 0.12799072265625, 0.15610504150390625, 0.1842193603515625, 0.21233367919921875, 0.240447998046875, 0.26856231689453125, 0.2966766357421875, 0.32479095458984375, 0.3529052734375, 0.38101959228515625, 0.4091339111328125, 0.43724822998046875, 0.465362548828125, 0.49347686767578125, 0.5215911865234375, 0.5497055053710938, 0.57781982421875, 0.6059341430664062, 0.6340484619140625, 0.6621627807617188, 0.690277099609375, 0.7183914184570312, 0.7465057373046875, 0.7746200561523438, 0.802734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 7.0, 16.0, 13.0, 22.0, 19.0, 35.0, 37.0, 54.0, 70.0, 87.0, 108.0, 105.0, 73.0, 69.0, 53.0, 47.0, 38.0, 26.0, 12.0, 18.0, 21.0, 8.0, 14.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06060791015625, -0.058670997619628906, -0.05673408508300781, -0.05479717254638672, -0.052860260009765625, -0.05092334747314453, -0.04898643493652344, -0.047049522399902344, -0.04511260986328125, -0.043175697326660156, -0.04123878479003906, -0.03930187225341797, -0.037364959716796875, -0.03542804718017578, -0.03349113464355469, -0.031554222106933594, -0.0296173095703125, -0.027680397033691406, -0.025743484497070312, -0.02380657196044922, -0.021869659423828125, -0.01993274688720703, -0.017995834350585938, -0.016058921813964844, -0.01412200927734375, -0.012185096740722656, -0.010248184204101562, -0.008311271667480469, -0.006374359130859375, -0.004437446594238281, -0.0025005340576171875, -0.0005636215209960938, 0.001373291015625, 0.0033102035522460938, 0.0052471160888671875, 0.007184028625488281, 0.009120941162109375, 0.011057853698730469, 0.012994766235351562, 0.014931678771972656, 0.01686859130859375, 0.018805503845214844, 0.020742416381835938, 0.02267932891845703, 0.024616241455078125, 0.02655315399169922, 0.028490066528320312, 0.030426979064941406, 0.0323638916015625, 0.034300804138183594, 0.03623771667480469, 0.03817462921142578, 0.040111541748046875, 0.04204845428466797, 0.04398536682128906, 0.045922279357910156, 0.04785919189453125, 0.049796104431152344, 0.05173301696777344, 0.05366992950439453, 0.055606842041015625, 0.05754375457763672, 0.05948066711425781, 0.061417579650878906, 0.0633544921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 16.0, 10.0, 19.0, 23.0, 33.0, 35.0, 63.0, 106.0, 163.0, 329.0, 2081.0, 966864.0, 77434.0, 701.0, 247.0, 141.0, 85.0, 46.0, 36.0, 23.0, 21.0, 20.0, 17.0, 5.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3475799560546875, -1.306488037109375, -1.2653961181640625, -1.22430419921875, -1.1832122802734375, -1.142120361328125, -1.1010284423828125, -1.0599365234375, -1.0188446044921875, -0.977752685546875, -0.9366607666015625, -0.89556884765625, -0.8544769287109375, -0.813385009765625, -0.7722930908203125, -0.731201171875, -0.6901092529296875, -0.649017333984375, -0.6079254150390625, -0.56683349609375, -0.5257415771484375, -0.484649658203125, -0.4435577392578125, -0.4024658203125, -0.3613739013671875, -0.320281982421875, -0.2791900634765625, -0.23809814453125, -0.1970062255859375, -0.155914306640625, -0.1148223876953125, -0.07373046875, -0.0326385498046875, 0.008453369140625, 0.0495452880859375, 0.09063720703125, 0.1317291259765625, 0.172821044921875, 0.2139129638671875, 0.2550048828125, 0.2960968017578125, 0.337188720703125, 0.3782806396484375, 0.41937255859375, 0.4604644775390625, 0.501556396484375, 0.5426483154296875, 0.583740234375, 0.6248321533203125, 0.665924072265625, 0.7070159912109375, 0.74810791015625, 0.7891998291015625, 0.830291748046875, 0.8713836669921875, 0.9124755859375, 0.9535675048828125, 0.994659423828125, 1.0357513427734375, 1.07684326171875, 1.1179351806640625, 1.159027099609375, 1.2001190185546875, 1.2412109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 15.0, 37.0, 90.0, 247.0, 337.0, 162.0, 77.0, 25.0, 12.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5141112804412842, -0.5040780901908875, -0.49404487013816833, -0.4840116798877716, -0.4739784598350525, -0.46394526958465576, -0.45391207933425903, -0.4438788592815399, -0.4338456690311432, -0.42381247878074646, -0.41377925872802734, -0.4037460684776306, -0.3937128484249115, -0.38367965817451477, -0.37364643812179565, -0.3636132478713989, -0.3535800576210022, -0.34354686737060547, -0.33351364731788635, -0.3234804570674896, -0.3134472370147705, -0.3034140467643738, -0.29338085651397705, -0.28334763646125793, -0.2733144164085388, -0.2632812261581421, -0.253248006105423, -0.24321481585502625, -0.23318161070346832, -0.2231484055519104, -0.21311520040035248, -0.20308199524879456, -0.19304880499839783, -0.1830155998468399, -0.17298239469528198, -0.16294920444488525, -0.15291599929332733, -0.1428827941417694, -0.1328495889902115, -0.12281639128923416, -0.11278318613767624, -0.10274998098611832, -0.09271678328514099, -0.08268357813358307, -0.07265037298202515, -0.06261717528104782, -0.0525839701294899, -0.04255077242851257, -0.03251756727695465, -0.022484365850687027, -0.012451162561774254, -0.0024179592728614807, 0.007615242153406143, 0.017648443579673767, 0.02768164873123169, 0.037714846432209015, 0.04774805158376694, 0.05778125301003456, 0.06781445443630219, 0.07784765958786011, 0.08788086473941803, 0.09791406244039536, 0.10794726759195328, 0.1179804652929306, 0.12801367044448853]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 8.0, 19.0, 13.0, 20.0, 25.0, 23.0, 26.0, 27.0, 23.0, 37.0, 41.0, 40.0, 26.0, 35.0, 39.0, 39.0, 44.0, 43.0, 39.0, 32.0, 33.0, 54.0, 39.0, 35.0, 25.0, 29.0, 25.0, 19.0, 16.0, 14.0, 18.0, 15.0, 9.0, 10.0, 16.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08822470903396606, -0.08505868911743164, -0.08189266920089722, -0.0787266418337822, -0.07556062191724777, -0.07239460200071335, -0.06922857463359833, -0.0660625547170639, -0.06289653480052948, -0.059730514883995056, -0.056564491242170334, -0.05339846760034561, -0.05023244768381119, -0.047066427767276764, -0.04390040412545204, -0.04073438048362732, -0.037568360567092896, -0.03440234065055847, -0.03123631700873375, -0.028070295229554176, -0.024904273450374603, -0.02173825167119503, -0.018572229892015457, -0.015406208112835884, -0.012240186333656311, -0.009074164554476738, -0.005908142775297165, -0.002742120996117592, 0.0004239007830619812, 0.0035899225622415543, 0.006755944341421127, 0.0099219661206007, 0.013087987899780273, 0.016254009678959846, 0.01942003145813942, 0.022586053237318993, 0.025752075016498566, 0.02891809679567814, 0.03208411857485771, 0.035250142216682434, 0.03841616213321686, 0.04158218204975128, 0.044748205691576004, 0.047914229333400726, 0.05108024924993515, 0.054246269166469574, 0.057412292808294296, 0.06057831645011902, 0.06374433636665344, 0.06691035628318787, 0.07007637619972229, 0.07324240356683731, 0.07640842348337173, 0.07957444339990616, 0.08274047076702118, 0.0859064906835556, 0.08907251060009003, 0.09223853051662445, 0.09540455043315887, 0.0985705778002739, 0.10173659771680832, 0.10490261763334274, 0.10806864500045776, 0.11123466491699219, 0.11440068483352661]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 9.0, 17.0, 10.0, 21.0, 31.0, 35.0, 35.0, 34.0, 42.0, 47.0, 54.0, 44.0, 44.0, 57.0, 38.0, 34.0, 49.0, 39.0, 55.0, 49.0, 50.0, 38.0, 25.0, 20.0, 19.0, 19.0, 16.0, 11.0, 12.0, 8.0, 4.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.189453125, -2.125579833984375, -2.06170654296875, -1.997833251953125, -1.9339599609375, -1.870086669921875, -1.80621337890625, -1.742340087890625, -1.678466796875, -1.614593505859375, -1.55072021484375, -1.486846923828125, -1.4229736328125, -1.359100341796875, -1.29522705078125, -1.231353759765625, -1.16748046875, -1.103607177734375, -1.03973388671875, -0.975860595703125, -0.9119873046875, -0.848114013671875, -0.78424072265625, -0.720367431640625, -0.656494140625, -0.592620849609375, -0.52874755859375, -0.464874267578125, -0.4010009765625, -0.337127685546875, -0.27325439453125, -0.209381103515625, -0.1455078125, -0.081634521484375, -0.01776123046875, 0.046112060546875, 0.1099853515625, 0.173858642578125, 0.23773193359375, 0.301605224609375, 0.365478515625, 0.429351806640625, 0.49322509765625, 0.557098388671875, 0.6209716796875, 0.684844970703125, 0.74871826171875, 0.812591552734375, 0.87646484375, 0.940338134765625, 1.00421142578125, 1.068084716796875, 1.1319580078125, 1.195831298828125, 1.25970458984375, 1.323577880859375, 1.387451171875, 1.451324462890625, 1.51519775390625, 1.579071044921875, 1.6429443359375, 1.706817626953125, 1.77069091796875, 1.834564208984375, 1.8984375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 13.0, 16.0, 20.0, 38.0, 57.0, 68.0, 124.0, 158.0, 240.0, 370.0, 619.0, 971.0, 1536.0, 2674.0, 4809.0, 9218.0, 20206.0, 51054.0, 154082.0, 401034.0, 259309.0, 83534.0, 30287.0, 12912.0, 6345.0, 3508.0, 1998.0, 1174.0, 790.0, 467.0, 299.0, 204.0, 125.0, 91.0, 61.0, 43.0, 23.0, 15.0, 15.0, 9.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6328125, -2.549835205078125, -2.46685791015625, -2.383880615234375, -2.3009033203125, -2.217926025390625, -2.13494873046875, -2.051971435546875, -1.968994140625, -1.886016845703125, -1.80303955078125, -1.720062255859375, -1.6370849609375, -1.554107666015625, -1.47113037109375, -1.388153076171875, -1.30517578125, -1.222198486328125, -1.13922119140625, -1.056243896484375, -0.9732666015625, -0.890289306640625, -0.80731201171875, -0.724334716796875, -0.641357421875, -0.558380126953125, -0.47540283203125, -0.392425537109375, -0.3094482421875, -0.226470947265625, -0.14349365234375, -0.060516357421875, 0.0224609375, 0.105438232421875, 0.18841552734375, 0.271392822265625, 0.3543701171875, 0.437347412109375, 0.52032470703125, 0.603302001953125, 0.686279296875, 0.769256591796875, 0.85223388671875, 0.935211181640625, 1.0181884765625, 1.101165771484375, 1.18414306640625, 1.267120361328125, 1.35009765625, 1.433074951171875, 1.51605224609375, 1.599029541015625, 1.6820068359375, 1.764984130859375, 1.84796142578125, 1.930938720703125, 2.013916015625, 2.096893310546875, 2.17987060546875, 2.262847900390625, 2.3458251953125, 2.428802490234375, 2.51177978515625, 2.594757080078125, 2.677734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 10.0, 9.0, 7.0, 17.0, 16.0, 15.0, 20.0, 24.0, 12.0, 24.0, 21.0, 32.0, 39.0, 42.0, 42.0, 56.0, 91.0, 178.0, 875.0, 840.0, 152.0, 87.0, 47.0, 47.0, 34.0, 36.0, 35.0, 40.0, 17.0, 34.0, 26.0, 19.0, 20.0, 14.0, 17.0, 12.0, 4.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.927734375, -4.7578125, -4.587890625, -4.41796875, -4.248046875, -4.078125, -3.908203125, -3.73828125, -3.568359375, -3.3984375, -3.228515625, -3.05859375, -2.888671875, -2.71875, -2.548828125, -2.37890625, -2.208984375, -2.0390625, -1.869140625, -1.69921875, -1.529296875, -1.359375, -1.189453125, -1.01953125, -0.849609375, -0.6796875, -0.509765625, -0.33984375, -0.169921875, 0.0, 0.169921875, 0.33984375, 0.509765625, 0.6796875, 0.849609375, 1.01953125, 1.189453125, 1.359375, 1.529296875, 1.69921875, 1.869140625, 2.0390625, 2.208984375, 2.37890625, 2.548828125, 2.71875, 2.888671875, 3.05859375, 3.228515625, 3.3984375, 3.568359375, 3.73828125, 3.908203125, 4.078125, 4.248046875, 4.41796875, 4.587890625, 4.7578125, 4.927734375, 5.09765625, 5.267578125, 5.4375, 5.607421875, 5.77734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 5.0, 11.0, 15.0, 14.0, 26.0, 38.0, 32.0, 50.0, 67.0, 94.0, 125.0, 264.0, 567.0, 1641.0, 5423.0, 25714.0, 535481.0, 2501181.0, 61390.0, 9334.0, 2476.0, 842.0, 369.0, 164.0, 92.0, 67.0, 39.0, 40.0, 28.0, 20.0, 16.0, 19.0, 18.0, 13.0, 3.0, 8.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3560791015625, -8.079345703125, -7.8026123046875, -7.52587890625, -7.2491455078125, -6.972412109375, -6.6956787109375, -6.4189453125, -6.1422119140625, -5.865478515625, -5.5887451171875, -5.31201171875, -5.0352783203125, -4.758544921875, -4.4818115234375, -4.205078125, -3.9283447265625, -3.651611328125, -3.3748779296875, -3.09814453125, -2.8214111328125, -2.544677734375, -2.2679443359375, -1.9912109375, -1.7144775390625, -1.437744140625, -1.1610107421875, -0.88427734375, -0.6075439453125, -0.330810546875, -0.0540771484375, 0.22265625, 0.4993896484375, 0.776123046875, 1.0528564453125, 1.32958984375, 1.6063232421875, 1.883056640625, 2.1597900390625, 2.4365234375, 2.7132568359375, 2.989990234375, 3.2667236328125, 3.54345703125, 3.8201904296875, 4.096923828125, 4.3736572265625, 4.650390625, 4.9271240234375, 5.203857421875, 5.4805908203125, 5.75732421875, 6.0340576171875, 6.310791015625, 6.5875244140625, 6.8642578125, 7.1409912109375, 7.417724609375, 7.6944580078125, 7.97119140625, 8.2479248046875, 8.524658203125, 8.8013916015625, 9.078125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 43.0, 935.0, 38.0, 2.0], "bins": [-259.7878112792969, -255.5616455078125, -251.33547973632812, -247.10931396484375, -242.88314819335938, -238.65699768066406, -234.4308319091797, -230.2046661376953, -225.97850036621094, -221.75233459472656, -217.5261688232422, -213.3000030517578, -209.0738525390625, -204.84768676757812, -200.62152099609375, -196.39535522460938, -192.169189453125, -187.94302368164062, -183.71685791015625, -179.49069213867188, -175.2645263671875, -171.0383758544922, -166.8122100830078, -162.58604431152344, -158.35987854003906, -154.1337127685547, -149.9075469970703, -145.68138122558594, -141.45523071289062, -137.22906494140625, -133.00289916992188, -128.7767333984375, -124.55058288574219, -120.32441711425781, -116.09825134277344, -111.8720932006836, -107.64592742919922, -103.41976165771484, -99.193603515625, -94.96743774414062, -90.74127197265625, -86.51510620117188, -82.2889404296875, -78.06278228759766, -73.83661651611328, -69.6104507446289, -65.38429260253906, -61.15812683105469, -56.93195724487305, -52.70579528808594, -48.47962951660156, -44.25346374511719, -40.02730178833008, -35.80113983154297, -31.574974060058594, -27.34881019592285, -23.12264633178711, -18.896482467651367, -14.670318603515625, -10.444154739379883, -6.217990875244141, -1.9918270111083984, 2.2343368530273438, 6.460500717163086, 10.686663627624512]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 10.0, 10.0, 13.0, 9.0, 15.0, 19.0, 16.0, 25.0, 19.0, 36.0, 28.0, 34.0, 28.0, 39.0, 37.0, 35.0, 40.0, 30.0, 29.0, 31.0, 43.0, 38.0, 35.0, 39.0, 26.0, 27.0, 30.0, 26.0, 25.0, 27.0, 24.0, 13.0, 23.0, 19.0, 15.0, 11.0, 9.0, 3.0, 15.0, 6.0, 8.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.471179962158203, -13.046581268310547, -12.621981620788574, -12.197382926940918, -11.772784233093262, -11.348184585571289, -10.923585891723633, -10.498987197875977, -10.07438850402832, -9.649789810180664, -9.225190162658691, -8.800591468811035, -8.375992774963379, -7.9513936042785645, -7.52679443359375, -7.102195739746094, -6.677596092224121, -6.252996921539307, -5.82839822769165, -5.403799057006836, -4.97920036315918, -4.554601192474365, -4.130002021789551, -3.7054030895233154, -3.28080415725708, -2.8562052249908447, -2.4316062927246094, -2.007007122039795, -1.5824081897735596, -1.1578092575073242, -0.7332100868225098, -0.3086111545562744, 0.11598682403564453, 0.5405858159065247, 0.9651848077774048, 1.3897838592529297, 1.814382791519165, 2.2389817237854004, 2.663580894470215, 3.08817982673645, 3.5127787590026855, 3.937377691268921, 4.361976623535156, 4.786575794219971, 5.211174964904785, 5.635773658752441, 6.060372829437256, 6.48497200012207, 6.909570693969727, 7.334169864654541, 7.758768558502197, 8.183367729187012, 8.607966423034668, 9.03256607055664, 9.457164764404297, 9.881763458251953, 10.30636215209961, 10.730960845947266, 11.155560493469238, 11.580159187316895, 12.00475788116455, 12.429357528686523, 12.85395622253418, 13.278554916381836, 13.703154563903809]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 8.0, 4.0, 18.0, 18.0, 18.0, 29.0, 40.0, 38.0, 40.0, 44.0, 49.0, 51.0, 50.0, 46.0, 44.0, 50.0, 52.0, 48.0, 40.0, 39.0, 38.0, 47.0, 35.0, 33.0, 26.0, 13.0, 16.0, 10.0, 13.0, 5.0, 5.0, 5.0, 8.0, 3.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.5384674072265625, -2.467559814453125, -2.3966522216796875, -2.32574462890625, -2.2548370361328125, -2.183929443359375, -2.1130218505859375, -2.0421142578125, -1.9712066650390625, -1.900299072265625, -1.8293914794921875, -1.75848388671875, -1.6875762939453125, -1.616668701171875, -1.5457611083984375, -1.474853515625, -1.4039459228515625, -1.333038330078125, -1.2621307373046875, -1.19122314453125, -1.1203155517578125, -1.049407958984375, -0.9785003662109375, -0.9075927734375, -0.8366851806640625, -0.765777587890625, -0.6948699951171875, -0.62396240234375, -0.5530548095703125, -0.482147216796875, -0.4112396240234375, -0.34033203125, -0.2694244384765625, -0.198516845703125, -0.1276092529296875, -0.05670166015625, 0.0142059326171875, 0.085113525390625, 0.1560211181640625, 0.2269287109375, 0.2978363037109375, 0.368743896484375, 0.4396514892578125, 0.51055908203125, 0.5814666748046875, 0.652374267578125, 0.7232818603515625, 0.794189453125, 0.8650970458984375, 0.936004638671875, 1.0069122314453125, 1.07781982421875, 1.1487274169921875, 1.219635009765625, 1.2905426025390625, 1.3614501953125, 1.4323577880859375, 1.503265380859375, 1.5741729736328125, 1.64508056640625, 1.7159881591796875, 1.786895751953125, 1.8578033447265625, 1.9287109375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 12.0, 24.0, 33.0, 39.0, 54.0, 111.0, 177.0, 303.0, 481.0, 947.0, 1885.0, 4012.0, 9456.0, 26780.0, 122000.0, 1294368.0, 2421550.0, 247331.0, 41499.0, 13088.0, 5182.0, 2339.0, 1156.0, 594.0, 331.0, 198.0, 104.0, 63.0, 45.0, 32.0, 22.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.9415283203125, -4.801025390625, -4.6605224609375, -4.52001953125, -4.3795166015625, -4.239013671875, -4.0985107421875, -3.9580078125, -3.8175048828125, -3.677001953125, -3.5364990234375, -3.39599609375, -3.2554931640625, -3.114990234375, -2.9744873046875, -2.833984375, -2.6934814453125, -2.552978515625, -2.4124755859375, -2.27197265625, -2.1314697265625, -1.990966796875, -1.8504638671875, -1.7099609375, -1.5694580078125, -1.428955078125, -1.2884521484375, -1.14794921875, -1.0074462890625, -0.866943359375, -0.7264404296875, -0.5859375, -0.4454345703125, -0.304931640625, -0.1644287109375, -0.02392578125, 0.1165771484375, 0.257080078125, 0.3975830078125, 0.5380859375, 0.6785888671875, 0.819091796875, 0.9595947265625, 1.10009765625, 1.2406005859375, 1.381103515625, 1.5216064453125, 1.662109375, 1.8026123046875, 1.943115234375, 2.0836181640625, 2.22412109375, 2.3646240234375, 2.505126953125, 2.6456298828125, 2.7861328125, 2.9266357421875, 3.067138671875, 3.2076416015625, 3.34814453125, 3.4886474609375, 3.629150390625, 3.7696533203125, 3.91015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 20.0, 22.0, 25.0, 30.0, 35.0, 46.0, 64.0, 82.0, 105.0, 150.0, 215.0, 311.0, 373.0, 505.0, 463.0, 390.0, 318.0, 212.0, 164.0, 114.0, 95.0, 49.0, 46.0, 29.0, 32.0, 32.0, 18.0, 19.0, 13.0, 11.0, 8.0, 10.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.307342529296875, -2.21820068359375, -2.129058837890625, -2.0399169921875, -1.950775146484375, -1.86163330078125, -1.772491455078125, -1.683349609375, -1.594207763671875, -1.50506591796875, -1.415924072265625, -1.3267822265625, -1.237640380859375, -1.14849853515625, -1.059356689453125, -0.97021484375, -0.881072998046875, -0.79193115234375, -0.702789306640625, -0.6136474609375, -0.524505615234375, -0.43536376953125, -0.346221923828125, -0.257080078125, -0.167938232421875, -0.07879638671875, 0.010345458984375, 0.0994873046875, 0.188629150390625, 0.27777099609375, 0.366912841796875, 0.4560546875, 0.545196533203125, 0.63433837890625, 0.723480224609375, 0.8126220703125, 0.901763916015625, 0.99090576171875, 1.080047607421875, 1.169189453125, 1.258331298828125, 1.34747314453125, 1.436614990234375, 1.5257568359375, 1.614898681640625, 1.70404052734375, 1.793182373046875, 1.88232421875, 1.971466064453125, 2.06060791015625, 2.149749755859375, 2.2388916015625, 2.328033447265625, 2.41717529296875, 2.506317138671875, 2.595458984375, 2.684600830078125, 2.77374267578125, 2.862884521484375, 2.9520263671875, 3.041168212890625, 3.13031005859375, 3.219451904296875, 3.30859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 11.0, 9.0, 14.0, 10.0, 17.0, 22.0, 27.0, 37.0, 49.0, 56.0, 97.0, 145.0, 214.0, 413.0, 1068.0, 3922.0, 21481.0, 261723.0, 3660902.0, 219109.0, 19495.0, 3491.0, 933.0, 391.0, 196.0, 117.0, 83.0, 71.0, 31.0, 39.0, 28.0, 18.0, 11.0, 6.0, 7.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0], "bins": [-12.3046875, -11.976318359375, -11.64794921875, -11.319580078125, -10.9912109375, -10.662841796875, -10.33447265625, -10.006103515625, -9.677734375, -9.349365234375, -9.02099609375, -8.692626953125, -8.3642578125, -8.035888671875, -7.70751953125, -7.379150390625, -7.05078125, -6.722412109375, -6.39404296875, -6.065673828125, -5.7373046875, -5.408935546875, -5.08056640625, -4.752197265625, -4.423828125, -4.095458984375, -3.76708984375, -3.438720703125, -3.1103515625, -2.781982421875, -2.45361328125, -2.125244140625, -1.796875, -1.468505859375, -1.14013671875, -0.811767578125, -0.4833984375, -0.155029296875, 0.17333984375, 0.501708984375, 0.830078125, 1.158447265625, 1.48681640625, 1.815185546875, 2.1435546875, 2.471923828125, 2.80029296875, 3.128662109375, 3.45703125, 3.785400390625, 4.11376953125, 4.442138671875, 4.7705078125, 5.098876953125, 5.42724609375, 5.755615234375, 6.083984375, 6.412353515625, 6.74072265625, 7.069091796875, 7.3974609375, 7.725830078125, 8.05419921875, 8.382568359375, 8.7109375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 39.0, 230.0, 435.0, 257.0, 40.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.31867218017578, -74.43461608886719, -72.5505599975586, -70.66650390625, -68.78244018554688, -66.89838409423828, -65.01432800292969, -63.130271911621094, -61.2462158203125, -59.362159729003906, -57.47809982299805, -55.59404373168945, -53.70998764038086, -51.825927734375, -49.941871643066406, -48.05781555175781, -46.17375946044922, -44.289703369140625, -42.405643463134766, -40.52158737182617, -38.63753128051758, -36.75347137451172, -34.869415283203125, -32.98535919189453, -31.101299285888672, -29.217241287231445, -27.33318519592285, -25.449127197265625, -23.56507110595703, -21.681013107299805, -19.796955108642578, -17.912899017333984, -16.02884292602539, -14.14478588104248, -12.26072883605957, -10.376670837402344, -8.49261474609375, -6.608556747436523, -4.724499702453613, -2.840442657470703, -0.956385612487793, 0.9276715517044067, 2.8117287158966064, 4.695785999298096, 6.579843044281006, 8.463900566101074, 10.347957611083984, 12.232014656066895, 14.116071701049805, 16.00012969970703, 17.884185791015625, 19.76824378967285, 21.652299880981445, 23.536357879638672, 25.420413970947266, 27.304471969604492, 29.18852996826172, 31.072587966918945, 32.95664596557617, 34.840702056884766, 36.72475814819336, 38.60881805419922, 40.49287414550781, 42.376930236816406, 44.260986328125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 14.0, 21.0, 14.0, 12.0, 20.0, 22.0, 27.0, 26.0, 26.0, 27.0, 40.0, 36.0, 27.0, 38.0, 38.0, 38.0, 43.0, 29.0, 36.0, 28.0, 33.0, 42.0, 37.0, 26.0, 30.0, 24.0, 29.0, 21.0, 26.0, 13.0, 26.0, 12.0, 15.0, 12.0, 13.0, 5.0, 12.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.702871322631836, -9.389101028442383, -9.07533073425293, -8.76155948638916, -8.447789192199707, -8.134018898010254, -7.820248603820801, -7.5064778327941895, -7.192707061767578, -6.878936767578125, -6.565165996551514, -6.2513957023620605, -5.937624931335449, -5.623854637145996, -5.310084342956543, -4.996313571929932, -4.6825432777404785, -4.368772983551025, -4.055002212524414, -3.741231918334961, -3.4274611473083496, -3.1136908531188965, -2.7999203205108643, -2.486149787902832, -2.1723792552948, -1.8586087226867676, -1.5448381900787354, -1.2310677766799927, -0.9172972440719604, -0.6035267114639282, -0.28975629806518555, 0.02401423454284668, 0.3377847671508789, 0.6515552997589111, 0.9653257727622986, 1.279096245765686, 1.5928667783737183, 1.9066373109817505, 2.220407724380493, 2.5341782569885254, 2.8479487895965576, 3.16171932220459, 3.475489854812622, 3.7892603874206543, 4.103030681610107, 4.416801452636719, 4.730571746826172, 5.044342041015625, 5.358112812042236, 5.6718831062316895, 5.985653877258301, 6.299424171447754, 6.613194942474365, 6.926965236663818, 7.24073600769043, 7.554506301879883, 7.868276596069336, 8.182046890258789, 8.495817184448242, 8.809588432312012, 9.123358726501465, 9.437129020690918, 9.750899314880371, 10.06467056274414, 10.378440856933594]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 14.0, 19.0, 13.0, 18.0, 25.0, 17.0, 31.0, 30.0, 38.0, 30.0, 34.0, 52.0, 50.0, 45.0, 44.0, 35.0, 43.0, 55.0, 46.0, 35.0, 47.0, 39.0, 35.0, 34.0, 31.0, 23.0, 17.0, 11.0, 15.0, 10.0, 13.0, 11.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.9836273193359375, -1.922332763671875, -1.8610382080078125, -1.79974365234375, -1.7384490966796875, -1.677154541015625, -1.6158599853515625, -1.5545654296875, -1.4932708740234375, -1.431976318359375, -1.3706817626953125, -1.30938720703125, -1.2480926513671875, -1.186798095703125, -1.1255035400390625, -1.064208984375, -1.0029144287109375, -0.941619873046875, -0.8803253173828125, -0.81903076171875, -0.7577362060546875, -0.696441650390625, -0.6351470947265625, -0.5738525390625, -0.5125579833984375, -0.451263427734375, -0.3899688720703125, -0.32867431640625, -0.2673797607421875, -0.206085205078125, -0.1447906494140625, -0.08349609375, -0.0222015380859375, 0.039093017578125, 0.1003875732421875, 0.16168212890625, 0.2229766845703125, 0.284271240234375, 0.3455657958984375, 0.4068603515625, 0.4681549072265625, 0.529449462890625, 0.5907440185546875, 0.65203857421875, 0.7133331298828125, 0.774627685546875, 0.8359222412109375, 0.897216796875, 0.9585113525390625, 1.019805908203125, 1.0811004638671875, 1.14239501953125, 1.2036895751953125, 1.264984130859375, 1.3262786865234375, 1.3875732421875, 1.4488677978515625, 1.510162353515625, 1.5714569091796875, 1.63275146484375, 1.6940460205078125, 1.755340576171875, 1.8166351318359375, 1.8779296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 13.0, 16.0, 32.0, 37.0, 63.0, 78.0, 133.0, 195.0, 301.0, 501.0, 780.0, 1288.0, 2031.0, 3287.0, 5304.0, 8825.0, 14365.0, 23304.0, 36963.0, 57630.0, 87477.0, 122450.0, 150784.0, 151746.0, 126280.0, 91144.0, 60698.0, 38935.0, 24491.0, 15214.0, 9322.0, 5675.0, 3462.0, 2200.0, 1324.0, 785.0, 516.0, 319.0, 197.0, 131.0, 87.0, 66.0, 36.0, 24.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.293212890625, -0.28406524658203125, -0.2749176025390625, -0.26576995849609375, -0.256622314453125, -0.24747467041015625, -0.2383270263671875, -0.22917938232421875, -0.22003173828125, -0.21088409423828125, -0.2017364501953125, -0.19258880615234375, -0.183441162109375, -0.17429351806640625, -0.1651458740234375, -0.15599822998046875, -0.1468505859375, -0.13770294189453125, -0.1285552978515625, -0.11940765380859375, -0.110260009765625, -0.10111236572265625, -0.0919647216796875, -0.08281707763671875, -0.07366943359375, -0.06452178955078125, -0.0553741455078125, -0.04622650146484375, -0.037078857421875, -0.02793121337890625, -0.0187835693359375, -0.00963592529296875, -0.00048828125, 0.00865936279296875, 0.0178070068359375, 0.02695465087890625, 0.036102294921875, 0.04524993896484375, 0.0543975830078125, 0.06354522705078125, 0.07269287109375, 0.08184051513671875, 0.0909881591796875, 0.10013580322265625, 0.109283447265625, 0.11843109130859375, 0.1275787353515625, 0.13672637939453125, 0.1458740234375, 0.15502166748046875, 0.1641693115234375, 0.17331695556640625, 0.182464599609375, 0.19161224365234375, 0.2007598876953125, 0.20990753173828125, 0.21905517578125, 0.22820281982421875, 0.2373504638671875, 0.24649810791015625, 0.255645751953125, 0.26479339599609375, 0.2739410400390625, 0.28308868408203125, 0.292236328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 8.0, 5.0, 9.0, 11.0, 19.0, 8.0, 20.0, 25.0, 22.0, 29.0, 25.0, 32.0, 28.0, 38.0, 43.0, 48.0, 46.0, 42.0, 1066.0, 30.0, 40.0, 38.0, 46.0, 40.0, 28.0, 41.0, 33.0, 28.0, 29.0, 15.0, 26.0, 9.0, 11.0, 9.0, 13.0, 11.0, 8.0, 5.0, 5.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2763671875, -1.2359466552734375, -1.195526123046875, -1.1551055908203125, -1.11468505859375, -1.0742645263671875, -1.033843994140625, -0.9934234619140625, -0.9530029296875, -0.9125823974609375, -0.872161865234375, -0.8317413330078125, -0.79132080078125, -0.7509002685546875, -0.710479736328125, -0.6700592041015625, -0.629638671875, -0.5892181396484375, -0.548797607421875, -0.5083770751953125, -0.46795654296875, -0.4275360107421875, -0.387115478515625, -0.3466949462890625, -0.3062744140625, -0.2658538818359375, -0.225433349609375, -0.1850128173828125, -0.14459228515625, -0.1041717529296875, -0.063751220703125, -0.0233306884765625, 0.01708984375, 0.0575103759765625, 0.097930908203125, 0.1383514404296875, 0.17877197265625, 0.2191925048828125, 0.259613037109375, 0.3000335693359375, 0.3404541015625, 0.3808746337890625, 0.421295166015625, 0.4617156982421875, 0.50213623046875, 0.5425567626953125, 0.582977294921875, 0.6233978271484375, 0.663818359375, 0.7042388916015625, 0.744659423828125, 0.7850799560546875, 0.82550048828125, 0.8659210205078125, 0.906341552734375, 0.9467620849609375, 0.9871826171875, 1.0276031494140625, 1.068023681640625, 1.1084442138671875, 1.14886474609375, 1.1892852783203125, 1.229705810546875, 1.2701263427734375, 1.310546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 17.0, 8.0, 13.0, 26.0, 43.0, 63.0, 121.0, 189.0, 291.0, 541.0, 914.0, 1548.0, 2754.0, 4841.0, 8723.0, 15564.0, 32896.0, 207312.0, 1693730.0, 75538.0, 23621.0, 12585.0, 6692.0, 3908.0, 2218.0, 1249.0, 680.0, 431.0, 249.0, 134.0, 91.0, 50.0, 35.0, 26.0, 12.0, 13.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.77978515625, -0.7599449157714844, -0.7401046752929688, -0.7202644348144531, -0.7004241943359375, -0.6805839538574219, -0.6607437133789062, -0.6409034729003906, -0.621063232421875, -0.6012229919433594, -0.5813827514648438, -0.5615425109863281, -0.5417022705078125, -0.5218620300292969, -0.5020217895507812, -0.4821815490722656, -0.46234130859375, -0.4425010681152344, -0.42266082763671875, -0.4028205871582031, -0.3829803466796875, -0.3631401062011719, -0.34329986572265625, -0.3234596252441406, -0.303619384765625, -0.2837791442871094, -0.26393890380859375, -0.24409866333007812, -0.2242584228515625, -0.20441818237304688, -0.18457794189453125, -0.16473770141601562, -0.1448974609375, -0.12505722045898438, -0.10521697998046875, -0.08537673950195312, -0.0655364990234375, -0.045696258544921875, -0.02585601806640625, -0.006015777587890625, 0.013824462890625, 0.033664703369140625, 0.05350494384765625, 0.07334518432617188, 0.0931854248046875, 0.11302566528320312, 0.13286590576171875, 0.15270614624023438, 0.17254638671875, 0.19238662719726562, 0.21222686767578125, 0.23206710815429688, 0.2519073486328125, 0.2717475891113281, 0.29158782958984375, 0.3114280700683594, 0.331268310546875, 0.3511085510253906, 0.37094879150390625, 0.3907890319824219, 0.4106292724609375, 0.4304695129394531, 0.45030975341796875, 0.4701499938964844, 0.489990234375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 15.0, 15.0, 18.0, 18.0, 26.0, 36.0, 38.0, 53.0, 72.0, 62.0, 89.0, 74.0, 78.0, 82.0, 61.0, 40.0, 55.0, 29.0, 24.0, 19.0, 20.0, 16.0, 9.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050048828125, -0.04844999313354492, -0.046851158142089844, -0.045252323150634766, -0.04365348815917969, -0.04205465316772461, -0.04045581817626953, -0.03885698318481445, -0.037258148193359375, -0.0356593132019043, -0.03406047821044922, -0.03246164321899414, -0.030862808227539062, -0.029263973236083984, -0.027665138244628906, -0.026066303253173828, -0.02446746826171875, -0.022868633270263672, -0.021269798278808594, -0.019670963287353516, -0.018072128295898438, -0.01647329330444336, -0.014874458312988281, -0.013275623321533203, -0.011676788330078125, -0.010077953338623047, -0.008479118347167969, -0.006880283355712891, -0.0052814483642578125, -0.0036826133728027344, -0.0020837783813476562, -0.0004849433898925781, 0.0011138916015625, 0.002712726593017578, 0.004311561584472656, 0.005910396575927734, 0.0075092315673828125, 0.00910806655883789, 0.010706901550292969, 0.012305736541748047, 0.013904571533203125, 0.015503406524658203, 0.01710224151611328, 0.01870107650756836, 0.020299911499023438, 0.021898746490478516, 0.023497581481933594, 0.025096416473388672, 0.02669525146484375, 0.028294086456298828, 0.029892921447753906, 0.031491756439208984, 0.03309059143066406, 0.03468942642211914, 0.03628826141357422, 0.0378870964050293, 0.039485931396484375, 0.04108476638793945, 0.04268360137939453, 0.04428243637084961, 0.04588127136230469, 0.047480106353759766, 0.049078941345214844, 0.05067777633666992, 0.052276611328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 3.0, 7.0, 12.0, 11.0, 21.0, 28.0, 38.0, 41.0, 64.0, 110.0, 159.0, 317.0, 1799.0, 585239.0, 458295.0, 1549.0, 325.0, 183.0, 91.0, 65.0, 34.0, 36.0, 22.0, 29.0, 14.0, 14.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.1123046875, -1.078582763671875, -1.04486083984375, -1.011138916015625, -0.9774169921875, -0.943695068359375, -0.90997314453125, -0.876251220703125, -0.842529296875, -0.808807373046875, -0.77508544921875, -0.741363525390625, -0.7076416015625, -0.673919677734375, -0.64019775390625, -0.606475830078125, -0.57275390625, -0.539031982421875, -0.50531005859375, -0.471588134765625, -0.4378662109375, -0.404144287109375, -0.37042236328125, -0.336700439453125, -0.302978515625, -0.269256591796875, -0.23553466796875, -0.201812744140625, -0.1680908203125, -0.134368896484375, -0.10064697265625, -0.066925048828125, -0.033203125, 0.000518798828125, 0.03424072265625, 0.067962646484375, 0.1016845703125, 0.135406494140625, 0.16912841796875, 0.202850341796875, 0.236572265625, 0.270294189453125, 0.30401611328125, 0.337738037109375, 0.3714599609375, 0.405181884765625, 0.43890380859375, 0.472625732421875, 0.50634765625, 0.540069580078125, 0.57379150390625, 0.607513427734375, 0.6412353515625, 0.674957275390625, 0.70867919921875, 0.742401123046875, 0.776123046875, 0.809844970703125, 0.84356689453125, 0.877288818359375, 0.9110107421875, 0.944732666015625, 0.97845458984375, 1.012176513671875, 1.0458984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 28.0, 172.0, 457.0, 269.0, 62.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820741593837738, -0.17327998578548431, -0.16448581218719482, -0.15569162368774414, -0.14689745008945465, -0.13810327649116516, -0.12930908799171448, -0.12051491439342499, -0.1117207407951355, -0.10292656719684601, -0.09413238614797592, -0.08533820509910583, -0.07654403150081635, -0.06774985790252686, -0.05895567685365677, -0.05016149953007698, -0.04136732220649719, -0.032573144882917404, -0.023778967559337616, -0.014984790235757828, -0.0061906129121780396, 0.0026035644114017487, 0.011397741734981537, 0.020191919058561325, 0.028986096382141113, 0.0377802737057209, 0.04657445102930069, 0.05536862835288048, 0.06416280567646027, 0.07295697927474976, 0.08175116032361984, 0.09054534137248993, 0.09933948516845703, 0.10813365876674652, 0.11692783981561661, 0.1257220208644867, 0.13451619446277618, 0.14331036806106567, 0.15210455656051636, 0.16089873015880585, 0.16969290375709534, 0.17848707735538483, 0.18728125095367432, 0.196075439453125, 0.2048696130514145, 0.21366378664970398, 0.22245797514915466, 0.23125214874744415, 0.24004632234573364, 0.24884049594402313, 0.2576346695423126, 0.2664288580417633, 0.2752230167388916, 0.2840172052383423, 0.29281139373779297, 0.30160555243492126, 0.31039974093437195, 0.31919392943382263, 0.3279880881309509, 0.3367822766304016, 0.3455764651298523, 0.3543706238269806, 0.3631648123264313, 0.37195897102355957, 0.38075315952301025]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 8.0, 10.0, 14.0, 12.0, 18.0, 38.0, 35.0, 36.0, 32.0, 35.0, 54.0, 50.0, 47.0, 54.0, 62.0, 55.0, 52.0, 52.0, 44.0, 41.0, 44.0, 38.0, 29.0, 36.0, 16.0, 20.0, 12.0, 15.0, 6.0, 8.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06160688400268555, -0.059279914945364, -0.05695294588804245, -0.0546259768307209, -0.05229900777339935, -0.049972038716077805, -0.047645069658756256, -0.04531810060143471, -0.04299113154411316, -0.04066416248679161, -0.03833719342947006, -0.036010224372148514, -0.033683255314826965, -0.03135628625750542, -0.02902931720018387, -0.02670234814286232, -0.02437537908554077, -0.022048410028219223, -0.019721440970897675, -0.017394471913576126, -0.015067502856254578, -0.01274053379893303, -0.01041356474161148, -0.008086595684289932, -0.005759626626968384, -0.0034326575696468353, -0.0011056885123252869, 0.0012212805449962616, 0.00354824960231781, 0.0058752186596393585, 0.008202187716960907, 0.010529156774282455, 0.012856125831604004, 0.015183094888925552, 0.0175100639462471, 0.01983703300356865, 0.022164002060890198, 0.024490971118211746, 0.026817940175533295, 0.029144909232854843, 0.03147187829017639, 0.03379884734749794, 0.03612581640481949, 0.03845278546214104, 0.040779754519462585, 0.043106723576784134, 0.04543369263410568, 0.04776066169142723, 0.05008763074874878, 0.05241459980607033, 0.054741568863391876, 0.057068537920713425, 0.05939550697803497, 0.06172247603535652, 0.06404944509267807, 0.06637641787528992, 0.06870338320732117, 0.07103034853935242, 0.07335732132196426, 0.07568429410457611, 0.07801125943660736, 0.08033822476863861, 0.08266519755125046, 0.0849921703338623, 0.08731913566589355]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 9.0, 6.0, 13.0, 22.0, 21.0, 17.0, 28.0, 29.0, 37.0, 37.0, 42.0, 46.0, 42.0, 43.0, 43.0, 47.0, 52.0, 45.0, 56.0, 43.0, 38.0, 32.0, 31.0, 40.0, 22.0, 26.0, 30.0, 15.0, 21.0, 14.0, 10.0, 11.0, 12.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.20703125, -2.144195556640625, -2.08135986328125, -2.018524169921875, -1.9556884765625, -1.892852783203125, -1.83001708984375, -1.767181396484375, -1.704345703125, -1.641510009765625, -1.57867431640625, -1.515838623046875, -1.4530029296875, -1.390167236328125, -1.32733154296875, -1.264495849609375, -1.20166015625, -1.138824462890625, -1.07598876953125, -1.013153076171875, -0.9503173828125, -0.887481689453125, -0.82464599609375, -0.761810302734375, -0.698974609375, -0.636138916015625, -0.57330322265625, -0.510467529296875, -0.4476318359375, -0.384796142578125, -0.32196044921875, -0.259124755859375, -0.1962890625, -0.133453369140625, -0.07061767578125, -0.007781982421875, 0.0550537109375, 0.117889404296875, 0.18072509765625, 0.243560791015625, 0.306396484375, 0.369232177734375, 0.43206787109375, 0.494903564453125, 0.5577392578125, 0.620574951171875, 0.68341064453125, 0.746246337890625, 0.80908203125, 0.871917724609375, 0.93475341796875, 0.997589111328125, 1.0604248046875, 1.123260498046875, 1.18609619140625, 1.248931884765625, 1.311767578125, 1.374603271484375, 1.43743896484375, 1.500274658203125, 1.5631103515625, 1.625946044921875, 1.68878173828125, 1.751617431640625, 1.814453125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 13.0, 9.0, 12.0, 13.0, 23.0, 41.0, 59.0, 67.0, 111.0, 134.0, 203.0, 321.0, 458.0, 736.0, 1074.0, 1819.0, 2986.0, 5339.0, 10248.0, 21837.0, 55800.0, 178040.0, 470221.0, 192442.0, 59033.0, 23084.0, 10633.0, 5455.0, 3035.0, 1865.0, 1172.0, 775.0, 486.0, 317.0, 215.0, 115.0, 107.0, 77.0, 61.0, 37.0, 27.0, 19.0, 9.0, 14.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.55078125, -2.46722412109375, -2.3836669921875, -2.30010986328125, -2.216552734375, -2.13299560546875, -2.0494384765625, -1.96588134765625, -1.88232421875, -1.79876708984375, -1.7152099609375, -1.63165283203125, -1.548095703125, -1.46453857421875, -1.3809814453125, -1.29742431640625, -1.2138671875, -1.13031005859375, -1.0467529296875, -0.96319580078125, -0.879638671875, -0.79608154296875, -0.7125244140625, -0.62896728515625, -0.54541015625, -0.46185302734375, -0.3782958984375, -0.29473876953125, -0.211181640625, -0.12762451171875, -0.0440673828125, 0.03948974609375, 0.123046875, 0.20660400390625, 0.2901611328125, 0.37371826171875, 0.457275390625, 0.54083251953125, 0.6243896484375, 0.70794677734375, 0.79150390625, 0.87506103515625, 0.9586181640625, 1.04217529296875, 1.125732421875, 1.20928955078125, 1.2928466796875, 1.37640380859375, 1.4599609375, 1.54351806640625, 1.6270751953125, 1.71063232421875, 1.794189453125, 1.87774658203125, 1.9613037109375, 2.04486083984375, 2.12841796875, 2.21197509765625, 2.2955322265625, 2.37908935546875, 2.462646484375, 2.54620361328125, 2.6297607421875, 2.71331787109375, 2.796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 11.0, 7.0, 4.0, 9.0, 13.0, 11.0, 18.0, 28.0, 30.0, 28.0, 30.0, 27.0, 34.0, 48.0, 44.0, 59.0, 110.0, 290.0, 1456.0, 257.0, 106.0, 53.0, 42.0, 50.0, 29.0, 42.0, 37.0, 28.0, 21.0, 17.0, 18.0, 14.0, 12.0, 14.0, 11.0, 9.0, 6.0, 4.0, 7.0, 1.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.1014404296875, -5.913818359375, -5.7261962890625, -5.53857421875, -5.3509521484375, -5.163330078125, -4.9757080078125, -4.7880859375, -4.6004638671875, -4.412841796875, -4.2252197265625, -4.03759765625, -3.8499755859375, -3.662353515625, -3.4747314453125, -3.287109375, -3.0994873046875, -2.911865234375, -2.7242431640625, -2.53662109375, -2.3489990234375, -2.161376953125, -1.9737548828125, -1.7861328125, -1.5985107421875, -1.410888671875, -1.2232666015625, -1.03564453125, -0.8480224609375, -0.660400390625, -0.4727783203125, -0.28515625, -0.0975341796875, 0.090087890625, 0.2777099609375, 0.46533203125, 0.6529541015625, 0.840576171875, 1.0281982421875, 1.2158203125, 1.4034423828125, 1.591064453125, 1.7786865234375, 1.96630859375, 2.1539306640625, 2.341552734375, 2.5291748046875, 2.716796875, 2.9044189453125, 3.092041015625, 3.2796630859375, 3.46728515625, 3.6549072265625, 3.842529296875, 4.0301513671875, 4.2177734375, 4.4053955078125, 4.593017578125, 4.7806396484375, 4.96826171875, 5.1558837890625, 5.343505859375, 5.5311279296875, 5.71875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 9.0, 9.0, 6.0, 5.0, 19.0, 10.0, 16.0, 18.0, 20.0, 34.0, 48.0, 37.0, 55.0, 96.0, 118.0, 178.0, 361.0, 759.0, 2081.0, 6754.0, 30124.0, 536881.0, 2478528.0, 71945.0, 11887.0, 3251.0, 1142.0, 499.0, 250.0, 125.0, 79.0, 81.0, 70.0, 42.0, 34.0, 20.0, 15.0, 15.0, 12.0, 17.0, 10.0, 11.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.15728759765625, -6.9122314453125, -6.66717529296875, -6.422119140625, -6.17706298828125, -5.9320068359375, -5.68695068359375, -5.44189453125, -5.19683837890625, -4.9517822265625, -4.70672607421875, -4.461669921875, -4.21661376953125, -3.9715576171875, -3.72650146484375, -3.4814453125, -3.23638916015625, -2.9913330078125, -2.74627685546875, -2.501220703125, -2.25616455078125, -2.0111083984375, -1.76605224609375, -1.52099609375, -1.27593994140625, -1.0308837890625, -0.78582763671875, -0.540771484375, -0.29571533203125, -0.0506591796875, 0.19439697265625, 0.439453125, 0.68450927734375, 0.9295654296875, 1.17462158203125, 1.419677734375, 1.66473388671875, 1.9097900390625, 2.15484619140625, 2.39990234375, 2.64495849609375, 2.8900146484375, 3.13507080078125, 3.380126953125, 3.62518310546875, 3.8702392578125, 4.11529541015625, 4.3603515625, 4.60540771484375, 4.8504638671875, 5.09552001953125, 5.340576171875, 5.58563232421875, 5.8306884765625, 6.07574462890625, 6.32080078125, 6.56585693359375, 6.8109130859375, 7.05596923828125, 7.301025390625, 7.54608154296875, 7.7911376953125, 8.03619384765625, 8.28125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 43.0, 496.0, 451.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.41239166259766, -105.45640563964844, -103.50041961669922, -101.54444122314453, -99.58845520019531, -97.6324691772461, -95.67648315429688, -93.72050476074219, -91.76451873779297, -89.80853271484375, -87.85254669189453, -85.89656829833984, -83.94058227539062, -81.9845962524414, -80.02861022949219, -78.0726318359375, -76.11663818359375, -74.16065216064453, -72.20466613769531, -70.24868774414062, -68.2927017211914, -66.33671569824219, -64.38072967529297, -62.424747467041016, -60.46876525878906, -58.512779235839844, -56.55679702758789, -54.60081100463867, -52.64482879638672, -50.6888427734375, -48.73285675048828, -46.77687454223633, -44.820892333984375, -42.864906311035156, -40.9089241027832, -38.952938079833984, -36.99695587158203, -35.04096984863281, -33.084983825683594, -31.12900161743164, -29.173019409179688, -27.2170352935791, -25.261051177978516, -23.305065155029297, -21.349082946777344, -19.393096923828125, -17.43711280822754, -15.481128692626953, -13.525144577026367, -11.569160461425781, -9.613176345825195, -7.657191276550293, -5.701207160949707, -3.745223045349121, -1.7892379760742188, 0.1667461395263672, 2.122730255126953, 4.078714370727539, 6.034698963165283, 7.990683555603027, 9.946667671203613, 11.9026517868042, 13.858636856079102, 15.814620971679688, 17.770605087280273]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 11.0, 16.0, 13.0, 15.0, 16.0, 16.0, 23.0, 17.0, 25.0, 31.0, 35.0, 25.0, 34.0, 45.0, 43.0, 44.0, 38.0, 39.0, 46.0, 44.0, 51.0, 44.0, 49.0, 36.0, 32.0, 28.0, 23.0, 30.0, 24.0, 24.0, 16.0, 13.0, 5.0, 13.0, 8.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.599956512451172, -15.074480056762695, -14.549003601074219, -14.023526191711426, -13.49804973602295, -12.972573280334473, -12.44709587097168, -11.921619415283203, -11.396142959594727, -10.87066650390625, -10.345190048217773, -9.81971263885498, -9.294236183166504, -8.768759727478027, -8.243282318115234, -7.717805862426758, -7.192329406738281, -6.666852951049805, -6.14137601852417, -5.615899085998535, -5.090422630310059, -4.564946174621582, -4.039469242095947, -3.5139925479888916, -2.988515853881836, -2.4630391597747803, -1.9375624656677246, -1.412085771560669, -0.8866090774536133, -0.3611323833465576, 0.16434431076049805, 0.6898210048675537, 1.2152976989746094, 1.740774393081665, 2.2662510871887207, 2.7917277812957764, 3.317204475402832, 3.8426811695098877, 4.368157863616943, 4.893634796142578, 5.419111251831055, 5.944587707519531, 6.470064640045166, 6.995541572570801, 7.521018028259277, 8.046494483947754, 8.571971893310547, 9.097448348999023, 9.6229248046875, 10.148401260375977, 10.673877716064453, 11.199355125427246, 11.724831581115723, 12.2503080368042, 12.775785446166992, 13.301261901855469, 13.826738357543945, 14.352214813232422, 14.877691268920898, 15.403168678283691, 15.928645133972168, 16.45412254333496, 16.979598999023438, 17.505075454711914, 18.03055191040039]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 11.0, 9.0, 14.0, 17.0, 16.0, 29.0, 27.0, 38.0, 42.0, 40.0, 52.0, 41.0, 36.0, 60.0, 54.0, 48.0, 46.0, 46.0, 36.0, 54.0, 49.0, 31.0, 37.0, 31.0, 23.0, 32.0, 20.0, 13.0, 16.0, 13.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.4537353515625, -2.380126953125, -2.3065185546875, -2.23291015625, -2.1593017578125, -2.085693359375, -2.0120849609375, -1.9384765625, -1.8648681640625, -1.791259765625, -1.7176513671875, -1.64404296875, -1.5704345703125, -1.496826171875, -1.4232177734375, -1.349609375, -1.2760009765625, -1.202392578125, -1.1287841796875, -1.05517578125, -0.9815673828125, -0.907958984375, -0.8343505859375, -0.7607421875, -0.6871337890625, -0.613525390625, -0.5399169921875, -0.46630859375, -0.3927001953125, -0.319091796875, -0.2454833984375, -0.171875, -0.0982666015625, -0.024658203125, 0.0489501953125, 0.12255859375, 0.1961669921875, 0.269775390625, 0.3433837890625, 0.4169921875, 0.4906005859375, 0.564208984375, 0.6378173828125, 0.71142578125, 0.7850341796875, 0.858642578125, 0.9322509765625, 1.005859375, 1.0794677734375, 1.153076171875, 1.2266845703125, 1.30029296875, 1.3739013671875, 1.447509765625, 1.5211181640625, 1.5947265625, 1.6683349609375, 1.741943359375, 1.8155517578125, 1.88916015625, 1.9627685546875, 2.036376953125, 2.1099853515625, 2.18359375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 21.0, 23.0, 31.0, 50.0, 86.0, 116.0, 174.0, 316.0, 578.0, 1001.0, 1924.0, 3775.0, 8596.0, 23391.0, 97549.0, 795864.0, 2596692.0, 554987.0, 74760.0, 20025.0, 7379.0, 3304.0, 1622.0, 877.0, 489.0, 258.0, 174.0, 70.0, 60.0, 34.0, 18.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2109375, -4.092041015625, -3.97314453125, -3.854248046875, -3.7353515625, -3.616455078125, -3.49755859375, -3.378662109375, -3.259765625, -3.140869140625, -3.02197265625, -2.903076171875, -2.7841796875, -2.665283203125, -2.54638671875, -2.427490234375, -2.30859375, -2.189697265625, -2.07080078125, -1.951904296875, -1.8330078125, -1.714111328125, -1.59521484375, -1.476318359375, -1.357421875, -1.238525390625, -1.11962890625, -1.000732421875, -0.8818359375, -0.762939453125, -0.64404296875, -0.525146484375, -0.40625, -0.287353515625, -0.16845703125, -0.049560546875, 0.0693359375, 0.188232421875, 0.30712890625, 0.426025390625, 0.544921875, 0.663818359375, 0.78271484375, 0.901611328125, 1.0205078125, 1.139404296875, 1.25830078125, 1.377197265625, 1.49609375, 1.614990234375, 1.73388671875, 1.852783203125, 1.9716796875, 2.090576171875, 2.20947265625, 2.328369140625, 2.447265625, 2.566162109375, 2.68505859375, 2.803955078125, 2.9228515625, 3.041748046875, 3.16064453125, 3.279541015625, 3.3984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 15.0, 21.0, 23.0, 33.0, 46.0, 54.0, 89.0, 133.0, 222.0, 323.0, 434.0, 615.0, 568.0, 471.0, 353.0, 198.0, 128.0, 86.0, 51.0, 53.0, 37.0, 33.0, 16.0, 17.0, 6.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.28125, -3.17218017578125, -3.0631103515625, -2.95404052734375, -2.844970703125, -2.73590087890625, -2.6268310546875, -2.51776123046875, -2.40869140625, -2.29962158203125, -2.1905517578125, -2.08148193359375, -1.972412109375, -1.86334228515625, -1.7542724609375, -1.64520263671875, -1.5361328125, -1.42706298828125, -1.3179931640625, -1.20892333984375, -1.099853515625, -0.99078369140625, -0.8817138671875, -0.77264404296875, -0.66357421875, -0.55450439453125, -0.4454345703125, -0.33636474609375, -0.227294921875, -0.11822509765625, -0.0091552734375, 0.09991455078125, 0.208984375, 0.31805419921875, 0.4271240234375, 0.53619384765625, 0.645263671875, 0.75433349609375, 0.8634033203125, 0.97247314453125, 1.08154296875, 1.19061279296875, 1.2996826171875, 1.40875244140625, 1.517822265625, 1.62689208984375, 1.7359619140625, 1.84503173828125, 1.9541015625, 2.06317138671875, 2.1722412109375, 2.28131103515625, 2.390380859375, 2.49945068359375, 2.6085205078125, 2.71759033203125, 2.82666015625, 2.93572998046875, 3.0447998046875, 3.15386962890625, 3.262939453125, 3.37200927734375, 3.4810791015625, 3.59014892578125, 3.69921875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 13.0, 10.0, 26.0, 32.0, 59.0, 73.0, 94.0, 163.0, 357.0, 686.0, 2264.0, 11299.0, 105897.0, 3402258.0, 631717.0, 32159.0, 4775.0, 1240.0, 477.0, 234.0, 135.0, 97.0, 64.0, 42.0, 32.0, 17.0, 8.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.6885986328125, -9.392822265625, -9.0970458984375, -8.80126953125, -8.5054931640625, -8.209716796875, -7.9139404296875, -7.6181640625, -7.3223876953125, -7.026611328125, -6.7308349609375, -6.43505859375, -6.1392822265625, -5.843505859375, -5.5477294921875, -5.251953125, -4.9561767578125, -4.660400390625, -4.3646240234375, -4.06884765625, -3.7730712890625, -3.477294921875, -3.1815185546875, -2.8857421875, -2.5899658203125, -2.294189453125, -1.9984130859375, -1.70263671875, -1.4068603515625, -1.111083984375, -0.8153076171875, -0.51953125, -0.2237548828125, 0.072021484375, 0.3677978515625, 0.66357421875, 0.9593505859375, 1.255126953125, 1.5509033203125, 1.8466796875, 2.1424560546875, 2.438232421875, 2.7340087890625, 3.02978515625, 3.3255615234375, 3.621337890625, 3.9171142578125, 4.212890625, 4.5086669921875, 4.804443359375, 5.1002197265625, 5.39599609375, 5.6917724609375, 5.987548828125, 6.2833251953125, 6.5791015625, 6.8748779296875, 7.170654296875, 7.4664306640625, 7.76220703125, 8.0579833984375, 8.353759765625, 8.6495361328125, 8.9453125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 57.0, 139.0, 348.0, 290.0, 136.0, 24.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.767168045043945, -22.44314956665039, -21.11913299560547, -19.795114517211914, -18.471097946166992, -17.147079467773438, -15.8230619430542, -14.499044418334961, -13.175026893615723, -11.851009368896484, -10.526991844177246, -9.202974319458008, -7.878956317901611, -6.554938793182373, -5.230920791625977, -3.9069032669067383, -2.5828857421875, -1.2588680982589722, 0.06514954566955566, 1.389167308807373, 2.7131848335266113, 4.03720235824585, 5.361220359802246, 6.685237884521484, 8.009255409240723, 9.333272933959961, 10.6572904586792, 11.981307983398438, 13.305326461791992, 14.629343032836914, 15.953361511230469, 17.27737808227539, 18.601398468017578, 19.925416946411133, 21.249433517456055, 22.57345199584961, 23.89746856689453, 25.221487045288086, 26.54550552368164, 27.869522094726562, 29.193538665771484, 30.51755714416504, 31.84157371520996, 33.165592193603516, 34.48960876464844, 35.81362533569336, 37.13764572143555, 38.46166229248047, 39.785682678222656, 41.10969924926758, 42.433719635009766, 43.75773620605469, 45.08175277709961, 46.40576934814453, 47.72978973388672, 49.05380630493164, 50.37782287597656, 51.701839447021484, 53.02585983276367, 54.349876403808594, 55.673892974853516, 56.99790954589844, 58.321929931640625, 59.64594650268555, 60.96996307373047]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 10.0, 8.0, 8.0, 4.0, 12.0, 20.0, 13.0, 22.0, 24.0, 20.0, 25.0, 27.0, 21.0, 26.0, 32.0, 18.0, 37.0, 29.0, 38.0, 46.0, 41.0, 31.0, 33.0, 39.0, 21.0, 31.0, 27.0, 26.0, 36.0, 35.0, 21.0, 27.0, 26.0, 28.0, 23.0, 20.0, 12.0, 13.0, 14.0, 10.0, 8.0, 7.0, 5.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-10.219720840454102, -9.927141189575195, -9.634560585021973, -9.341980934143066, -9.04940128326416, -8.756820678710938, -8.464241027832031, -8.171661376953125, -7.8790812492370605, -7.586501121520996, -7.29392147064209, -7.001341342926025, -6.708761215209961, -6.416181564331055, -6.12360143661499, -5.831021308898926, -5.5384416580200195, -5.245861530303955, -4.953281879425049, -4.660701751708984, -4.368122100830078, -4.075541973114014, -3.782961845397949, -3.490381956100464, -3.1978020668029785, -2.905222177505493, -2.612642288208008, -2.3200621604919434, -2.027482271194458, -1.7349023818969727, -1.4423223733901978, -1.1497423648834229, -0.8571615219116211, -0.564581573009491, -0.27200162410736084, 0.020578324794769287, 0.3131582736968994, 0.6057381629943848, 0.8983181715011597, 1.1908981800079346, 1.48347806930542, 1.7760579586029053, 2.0686378479003906, 2.361217975616455, 2.6537978649139404, 2.946377754211426, 3.2389578819274902, 3.5315377712249756, 3.824117660522461, 4.116697788238525, 4.409277439117432, 4.701857566833496, 4.994437217712402, 5.287017345428467, 5.579597473144531, 5.8721771240234375, 6.164757251739502, 6.457337379455566, 6.749917030334473, 7.042497158050537, 7.335077285766602, 7.627656936645508, 7.920237064361572, 8.212817192077637, 8.505396842956543]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 2.0, 11.0, 12.0, 14.0, 23.0, 25.0, 29.0, 29.0, 44.0, 43.0, 44.0, 49.0, 43.0, 48.0, 59.0, 51.0, 54.0, 43.0, 35.0, 43.0, 43.0, 37.0, 29.0, 28.0, 23.0, 23.0, 15.0, 20.0, 13.0, 13.0, 8.0, 11.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.072784423828125, -2.00494384765625, -1.937103271484375, -1.8692626953125, -1.801422119140625, -1.73358154296875, -1.665740966796875, -1.597900390625, -1.530059814453125, -1.46221923828125, -1.394378662109375, -1.3265380859375, -1.258697509765625, -1.19085693359375, -1.123016357421875, -1.05517578125, -0.987335205078125, -0.91949462890625, -0.851654052734375, -0.7838134765625, -0.715972900390625, -0.64813232421875, -0.580291748046875, -0.512451171875, -0.444610595703125, -0.37677001953125, -0.308929443359375, -0.2410888671875, -0.173248291015625, -0.10540771484375, -0.037567138671875, 0.0302734375, 0.098114013671875, 0.16595458984375, 0.233795166015625, 0.3016357421875, 0.369476318359375, 0.43731689453125, 0.505157470703125, 0.572998046875, 0.640838623046875, 0.70867919921875, 0.776519775390625, 0.8443603515625, 0.912200927734375, 0.98004150390625, 1.047882080078125, 1.11572265625, 1.183563232421875, 1.25140380859375, 1.319244384765625, 1.3870849609375, 1.454925537109375, 1.52276611328125, 1.590606689453125, 1.658447265625, 1.726287841796875, 1.79412841796875, 1.861968994140625, 1.9298095703125, 1.997650146484375, 2.06549072265625, 2.133331298828125, 2.201171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 9.0, 4.0, 7.0, 4.0, 14.0, 21.0, 22.0, 40.0, 60.0, 79.0, 123.0, 207.0, 305.0, 463.0, 729.0, 1056.0, 1597.0, 2487.0, 3945.0, 5743.0, 8950.0, 13489.0, 20983.0, 32343.0, 49225.0, 72627.0, 103707.0, 135156.0, 148718.0, 133144.0, 102622.0, 71553.0, 48141.0, 31759.0, 20605.0, 13390.0, 8652.0, 5657.0, 3751.0, 2402.0, 1673.0, 1042.0, 677.0, 442.0, 328.0, 204.0, 131.0, 92.0, 70.0, 42.0, 16.0, 22.0, 14.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.25927734375, -0.25077056884765625, -0.2422637939453125, -0.23375701904296875, -0.225250244140625, -0.21674346923828125, -0.2082366943359375, -0.19972991943359375, -0.19122314453125, -0.18271636962890625, -0.1742095947265625, -0.16570281982421875, -0.157196044921875, -0.14868927001953125, -0.1401824951171875, -0.13167572021484375, -0.1231689453125, -0.11466217041015625, -0.1061553955078125, -0.09764862060546875, -0.089141845703125, -0.08063507080078125, -0.0721282958984375, -0.06362152099609375, -0.05511474609375, -0.04660797119140625, -0.0381011962890625, -0.02959442138671875, -0.021087646484375, -0.01258087158203125, -0.0040740966796875, 0.00443267822265625, 0.012939453125, 0.02144622802734375, 0.0299530029296875, 0.03845977783203125, 0.046966552734375, 0.05547332763671875, 0.0639801025390625, 0.07248687744140625, 0.08099365234375, 0.08950042724609375, 0.0980072021484375, 0.10651397705078125, 0.115020751953125, 0.12352752685546875, 0.1320343017578125, 0.14054107666015625, 0.1490478515625, 0.15755462646484375, 0.1660614013671875, 0.17456817626953125, 0.183074951171875, 0.19158172607421875, 0.2000885009765625, 0.20859527587890625, 0.21710205078125, 0.22560882568359375, 0.2341156005859375, 0.24262237548828125, 0.251129150390625, 0.25963592529296875, 0.2681427001953125, 0.27664947509765625, 0.28515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 4.0, 6.0, 13.0, 14.0, 13.0, 18.0, 27.0, 24.0, 24.0, 25.0, 25.0, 39.0, 43.0, 43.0, 35.0, 37.0, 41.0, 45.0, 1068.0, 51.0, 42.0, 43.0, 44.0, 37.0, 32.0, 41.0, 34.0, 25.0, 19.0, 24.0, 13.0, 11.0, 12.0, 14.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4580078125, -1.41290283203125, -1.3677978515625, -1.32269287109375, -1.277587890625, -1.23248291015625, -1.1873779296875, -1.14227294921875, -1.09716796875, -1.05206298828125, -1.0069580078125, -0.96185302734375, -0.916748046875, -0.87164306640625, -0.8265380859375, -0.78143310546875, -0.736328125, -0.69122314453125, -0.6461181640625, -0.60101318359375, -0.555908203125, -0.51080322265625, -0.4656982421875, -0.42059326171875, -0.37548828125, -0.33038330078125, -0.2852783203125, -0.24017333984375, -0.195068359375, -0.14996337890625, -0.1048583984375, -0.05975341796875, -0.0146484375, 0.03045654296875, 0.0755615234375, 0.12066650390625, 0.165771484375, 0.21087646484375, 0.2559814453125, 0.30108642578125, 0.34619140625, 0.39129638671875, 0.4364013671875, 0.48150634765625, 0.526611328125, 0.57171630859375, 0.6168212890625, 0.66192626953125, 0.70703125, 0.75213623046875, 0.7972412109375, 0.84234619140625, 0.887451171875, 0.93255615234375, 0.9776611328125, 1.02276611328125, 1.06787109375, 1.11297607421875, 1.1580810546875, 1.20318603515625, 1.248291015625, 1.29339599609375, 1.3385009765625, 1.38360595703125, 1.4287109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 8.0, 11.0, 12.0, 17.0, 26.0, 39.0, 54.0, 71.0, 136.0, 174.0, 285.0, 440.0, 659.0, 1080.0, 1672.0, 2634.0, 4301.0, 6575.0, 10419.0, 17671.0, 37556.0, 252411.0, 1616510.0, 83028.0, 24990.0, 13523.0, 8366.0, 5249.0, 3285.0, 2108.0, 1330.0, 893.0, 559.0, 354.0, 210.0, 166.0, 104.0, 70.0, 38.0, 37.0, 23.0, 12.0, 13.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5859375, -0.5697822570800781, -0.5536270141601562, -0.5374717712402344, -0.5213165283203125, -0.5051612854003906, -0.48900604248046875, -0.4728507995605469, -0.456695556640625, -0.4405403137207031, -0.42438507080078125, -0.4082298278808594, -0.3920745849609375, -0.3759193420410156, -0.35976409912109375, -0.3436088562011719, -0.32745361328125, -0.3112983703613281, -0.29514312744140625, -0.2789878845214844, -0.2628326416015625, -0.24667739868164062, -0.23052215576171875, -0.21436691284179688, -0.198211669921875, -0.18205642700195312, -0.16590118408203125, -0.14974594116210938, -0.1335906982421875, -0.11743545532226562, -0.10128021240234375, -0.08512496948242188, -0.0689697265625, -0.052814483642578125, -0.03665924072265625, -0.020503997802734375, -0.0043487548828125, 0.011806488037109375, 0.02796173095703125, 0.044116973876953125, 0.060272216796875, 0.07642745971679688, 0.09258270263671875, 0.10873794555664062, 0.1248931884765625, 0.14104843139648438, 0.15720367431640625, 0.17335891723632812, 0.18951416015625, 0.20566940307617188, 0.22182464599609375, 0.23797988891601562, 0.2541351318359375, 0.2702903747558594, 0.28644561767578125, 0.3026008605957031, 0.318756103515625, 0.3349113464355469, 0.35106658935546875, 0.3672218322753906, 0.3833770751953125, 0.3995323181152344, 0.41568756103515625, 0.4318428039550781, 0.447998046875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 17.0, 27.0, 26.0, 31.0, 42.0, 62.0, 60.0, 79.0, 84.0, 74.0, 84.0, 81.0, 76.0, 49.0, 48.0, 31.0, 30.0, 16.0, 18.0, 10.0, 6.0, 9.0, 7.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0546875, -0.053189754486083984, -0.05169200897216797, -0.05019426345825195, -0.04869651794433594, -0.04719877243041992, -0.045701026916503906, -0.04420328140258789, -0.042705535888671875, -0.04120779037475586, -0.039710044860839844, -0.03821229934692383, -0.03671455383300781, -0.0352168083190918, -0.03371906280517578, -0.032221317291259766, -0.03072357177734375, -0.029225826263427734, -0.02772808074951172, -0.026230335235595703, -0.024732589721679688, -0.023234844207763672, -0.021737098693847656, -0.02023935317993164, -0.018741607666015625, -0.01724386215209961, -0.015746116638183594, -0.014248371124267578, -0.012750625610351562, -0.011252880096435547, -0.009755134582519531, -0.008257389068603516, -0.0067596435546875, -0.005261898040771484, -0.0037641525268554688, -0.002266407012939453, -0.0007686614990234375, 0.0007290840148925781, 0.0022268295288085938, 0.0037245750427246094, 0.005222320556640625, 0.006720066070556641, 0.008217811584472656, 0.009715557098388672, 0.011213302612304688, 0.012711048126220703, 0.014208793640136719, 0.015706539154052734, 0.01720428466796875, 0.018702030181884766, 0.02019977569580078, 0.021697521209716797, 0.023195266723632812, 0.024693012237548828, 0.026190757751464844, 0.02768850326538086, 0.029186248779296875, 0.03068399429321289, 0.032181739807128906, 0.03367948532104492, 0.03517723083496094, 0.03667497634887695, 0.03817272186279297, 0.039670467376708984, 0.041168212890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 11.0, 10.0, 8.0, 21.0, 17.0, 40.0, 38.0, 65.0, 93.0, 190.0, 379.0, 1923.0, 994101.0, 50292.0, 698.0, 229.0, 154.0, 91.0, 43.0, 41.0, 24.0, 29.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8355026245117188, -0.8043060302734375, -0.7731094360351562, -0.741912841796875, -0.7107162475585938, -0.6795196533203125, -0.6483230590820312, -0.61712646484375, -0.5859298706054688, -0.5547332763671875, -0.5235366821289062, -0.492340087890625, -0.46114349365234375, -0.4299468994140625, -0.39875030517578125, -0.3675537109375, -0.33635711669921875, -0.3051605224609375, -0.27396392822265625, -0.242767333984375, -0.21157073974609375, -0.1803741455078125, -0.14917755126953125, -0.11798095703125, -0.08678436279296875, -0.0555877685546875, -0.02439117431640625, 0.006805419921875, 0.03800201416015625, 0.0691986083984375, 0.10039520263671875, 0.131591796875, 0.16278839111328125, 0.1939849853515625, 0.22518157958984375, 0.256378173828125, 0.28757476806640625, 0.3187713623046875, 0.34996795654296875, 0.38116455078125, 0.41236114501953125, 0.4435577392578125, 0.47475433349609375, 0.505950927734375, 0.5371475219726562, 0.5683441162109375, 0.5995407104492188, 0.6307373046875, 0.6619338989257812, 0.6931304931640625, 0.7243270874023438, 0.755523681640625, 0.7867202758789062, 0.8179168701171875, 0.8491134643554688, 0.88031005859375, 0.9115066528320312, 0.9427032470703125, 0.9738998413085938, 1.005096435546875, 1.0362930297851562, 1.0674896240234375, 1.0986862182617188, 1.1298828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 19.0, 855.0, 144.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9690470695495605, -0.9509902596473694, -0.9329334497451782, -0.9148766398429871, -0.8968198299407959, -0.8787630796432495, -0.8607062101364136, -0.8426494598388672, -0.824592649936676, -0.8065358400344849, -0.7884790301322937, -0.7704222202301025, -0.7523654103279114, -0.7343086004257202, -0.7162518501281738, -0.6981950402259827, -0.6801382303237915, -0.6620814204216003, -0.6440246105194092, -0.625967800617218, -0.6079109907150269, -0.5898542404174805, -0.5717973709106445, -0.5537406206130981, -0.5356837511062622, -0.517626941204071, -0.4995701313018799, -0.4815133213996887, -0.46345654129981995, -0.4453997313976288, -0.4273429214954376, -0.40928614139556885, -0.3912293314933777, -0.3731725215911865, -0.35511571168899536, -0.3370589017868042, -0.3190021216869354, -0.30094531178474426, -0.2828885018825531, -0.2648317217826843, -0.24677488207817078, -0.22871807217597961, -0.21066127717494965, -0.19260446727275848, -0.17454767227172852, -0.15649086236953735, -0.1384340524673462, -0.12037725746631622, -0.10232044756412506, -0.0842636451125145, -0.06620684266090393, -0.04815003275871277, -0.030093230307102203, -0.012036427855491638, 0.006020382046699524, 0.024077177047729492, 0.042133986949920654, 0.06019078940153122, 0.07824759185314178, 0.09630440175533295, 0.11436120420694351, 0.13241800665855408, 0.15047481656074524, 0.1685316115617752, 0.18658842146396637]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 0.0, 2.0, 2.0, 7.0, 8.0, 10.0, 13.0, 24.0, 22.0, 32.0, 20.0, 38.0, 42.0, 59.0, 40.0, 51.0, 46.0, 53.0, 55.0, 47.0, 56.0, 55.0, 54.0, 40.0, 39.0, 36.0, 33.0, 25.0, 21.0, 17.0, 13.0, 8.0, 16.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056599974632263184, -0.054925937205553055, -0.053251899778842926, -0.0515778586268425, -0.04990382120013237, -0.04822978377342224, -0.046555742621421814, -0.044881705194711685, -0.043207667768001556, -0.04153363034129143, -0.0398595929145813, -0.03818555176258087, -0.03651151433587074, -0.034837476909160614, -0.03316343575716019, -0.03148939833045006, -0.02981536090373993, -0.0281413234770298, -0.026467284187674522, -0.024793244898319244, -0.023119207471609116, -0.021445170044898987, -0.01977113075554371, -0.01809709146618843, -0.016423054039478302, -0.014749015681445599, -0.013074977323412895, -0.011400938965380192, -0.009726900607347488, -0.008052862249314785, -0.006378823891282082, -0.004704785533249378, -0.003030747175216675, -0.0013567088171839714, 0.000317329540848732, 0.0019913678988814354, 0.003665406256914139, 0.005339444614946842, 0.007013482972979546, 0.008687521331012249, 0.010361559689044952, 0.012035598047077656, 0.01370963640511036, 0.015383674763143063, 0.017057713121175766, 0.018731750547885895, 0.020405789837241173, 0.02207982912659645, 0.02375386655330658, 0.02542790398001671, 0.027101943269371986, 0.028775982558727264, 0.030450019985437393, 0.03212405741214752, 0.03379809856414795, 0.03547213599085808, 0.03714617341756821, 0.038820210844278336, 0.040494248270988464, 0.04216828942298889, 0.04384232684969902, 0.04551636427640915, 0.047190405428409576, 0.048864442855119705, 0.050538480281829834]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 13.0, 14.0, 12.0, 13.0, 14.0, 23.0, 32.0, 44.0, 35.0, 40.0, 45.0, 43.0, 47.0, 51.0, 56.0, 52.0, 52.0, 34.0, 47.0, 50.0, 26.0, 28.0, 33.0, 25.0, 35.0, 19.0, 19.0, 14.0, 16.0, 13.0, 6.0, 9.0, 4.0, 2.0, 10.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -1.99066162109375, -1.9246826171875, -1.85870361328125, -1.792724609375, -1.72674560546875, -1.6607666015625, -1.59478759765625, -1.52880859375, -1.46282958984375, -1.3968505859375, -1.33087158203125, -1.264892578125, -1.19891357421875, -1.1329345703125, -1.06695556640625, -1.0009765625, -0.93499755859375, -0.8690185546875, -0.80303955078125, -0.737060546875, -0.67108154296875, -0.6051025390625, -0.53912353515625, -0.47314453125, -0.40716552734375, -0.3411865234375, -0.27520751953125, -0.209228515625, -0.14324951171875, -0.0772705078125, -0.01129150390625, 0.0546875, 0.12066650390625, 0.1866455078125, 0.25262451171875, 0.318603515625, 0.38458251953125, 0.4505615234375, 0.51654052734375, 0.58251953125, 0.64849853515625, 0.7144775390625, 0.78045654296875, 0.846435546875, 0.91241455078125, 0.9783935546875, 1.04437255859375, 1.1103515625, 1.17633056640625, 1.2423095703125, 1.30828857421875, 1.374267578125, 1.44024658203125, 1.5062255859375, 1.57220458984375, 1.63818359375, 1.70416259765625, 1.7701416015625, 1.83612060546875, 1.902099609375, 1.96807861328125, 2.0340576171875, 2.10003662109375, 2.166015625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 2.0, 8.0, 10.0, 11.0, 13.0, 21.0, 23.0, 37.0, 54.0, 96.0, 138.0, 248.0, 344.0, 661.0, 1137.0, 2438.0, 4732.0, 10098.0, 23275.0, 62255.0, 379513.0, 449678.0, 67501.0, 24849.0, 10899.0, 5122.0, 2452.0, 1281.0, 655.0, 363.0, 205.0, 118.0, 88.0, 59.0, 41.0, 29.0, 23.0, 21.0, 15.0, 9.0, 8.0, 5.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.293426513671875, -3.16693115234375, -3.040435791015625, -2.9139404296875, -2.787445068359375, -2.66094970703125, -2.534454345703125, -2.407958984375, -2.281463623046875, -2.15496826171875, -2.028472900390625, -1.9019775390625, -1.775482177734375, -1.64898681640625, -1.522491455078125, -1.39599609375, -1.269500732421875, -1.14300537109375, -1.016510009765625, -0.8900146484375, -0.763519287109375, -0.63702392578125, -0.510528564453125, -0.384033203125, -0.257537841796875, -0.13104248046875, -0.004547119140625, 0.1219482421875, 0.248443603515625, 0.37493896484375, 0.501434326171875, 0.6279296875, 0.754425048828125, 0.88092041015625, 1.007415771484375, 1.1339111328125, 1.260406494140625, 1.38690185546875, 1.513397216796875, 1.639892578125, 1.766387939453125, 1.89288330078125, 2.019378662109375, 2.1458740234375, 2.272369384765625, 2.39886474609375, 2.525360107421875, 2.65185546875, 2.778350830078125, 2.90484619140625, 3.031341552734375, 3.1578369140625, 3.284332275390625, 3.41082763671875, 3.537322998046875, 3.663818359375, 3.790313720703125, 3.91680908203125, 4.043304443359375, 4.1697998046875, 4.296295166015625, 4.42279052734375, 4.549285888671875, 4.67578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 5.0, 7.0, 14.0, 14.0, 26.0, 24.0, 21.0, 26.0, 26.0, 30.0, 40.0, 46.0, 39.0, 46.0, 67.0, 121.0, 348.0, 1444.0, 155.0, 85.0, 47.0, 51.0, 38.0, 46.0, 41.0, 28.0, 23.0, 18.0, 25.0, 24.0, 22.0, 20.0, 9.0, 8.0, 10.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.2982177734375, -5.127685546875, -4.9571533203125, -4.78662109375, -4.6160888671875, -4.445556640625, -4.2750244140625, -4.1044921875, -3.9339599609375, -3.763427734375, -3.5928955078125, -3.42236328125, -3.2518310546875, -3.081298828125, -2.9107666015625, -2.740234375, -2.5697021484375, -2.399169921875, -2.2286376953125, -2.05810546875, -1.8875732421875, -1.717041015625, -1.5465087890625, -1.3759765625, -1.2054443359375, -1.034912109375, -0.8643798828125, -0.69384765625, -0.5233154296875, -0.352783203125, -0.1822509765625, -0.01171875, 0.1588134765625, 0.329345703125, 0.4998779296875, 0.67041015625, 0.8409423828125, 1.011474609375, 1.1820068359375, 1.3525390625, 1.5230712890625, 1.693603515625, 1.8641357421875, 2.03466796875, 2.2052001953125, 2.375732421875, 2.5462646484375, 2.716796875, 2.8873291015625, 3.057861328125, 3.2283935546875, 3.39892578125, 3.5694580078125, 3.739990234375, 3.9105224609375, 4.0810546875, 4.2515869140625, 4.422119140625, 4.5926513671875, 4.76318359375, 4.9337158203125, 5.104248046875, 5.2747802734375, 5.4453125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 13.0, 5.0, 12.0, 23.0, 29.0, 25.0, 35.0, 60.0, 93.0, 116.0, 196.0, 413.0, 864.0, 2332.0, 9270.0, 71169.0, 2889610.0, 151773.0, 14224.0, 3195.0, 1074.0, 448.0, 241.0, 137.0, 91.0, 58.0, 45.0, 34.0, 25.0, 22.0, 15.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.625, -10.29931640625, -9.9736328125, -9.64794921875, -9.322265625, -8.99658203125, -8.6708984375, -8.34521484375, -8.01953125, -7.69384765625, -7.3681640625, -7.04248046875, -6.716796875, -6.39111328125, -6.0654296875, -5.73974609375, -5.4140625, -5.08837890625, -4.7626953125, -4.43701171875, -4.111328125, -3.78564453125, -3.4599609375, -3.13427734375, -2.80859375, -2.48291015625, -2.1572265625, -1.83154296875, -1.505859375, -1.18017578125, -0.8544921875, -0.52880859375, -0.203125, 0.12255859375, 0.4482421875, 0.77392578125, 1.099609375, 1.42529296875, 1.7509765625, 2.07666015625, 2.40234375, 2.72802734375, 3.0537109375, 3.37939453125, 3.705078125, 4.03076171875, 4.3564453125, 4.68212890625, 5.0078125, 5.33349609375, 5.6591796875, 5.98486328125, 6.310546875, 6.63623046875, 6.9619140625, 7.28759765625, 7.61328125, 7.93896484375, 8.2646484375, 8.59033203125, 8.916015625, 9.24169921875, 9.5673828125, 9.89306640625, 10.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 13.0, 26.0, 56.0, 90.0, 120.0, 185.0, 181.0, 140.0, 91.0, 60.0, 20.0, 13.0, 11.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.342370986938477, -16.93958854675293, -16.536806106567383, -16.134023666381836, -15.731240272521973, -15.328457832336426, -14.925675392150879, -14.522891998291016, -14.120109558105469, -13.717327117919922, -13.314544677734375, -12.911761283874512, -12.508978843688965, -12.106196403503418, -11.703413963317871, -11.300630569458008, -10.897848129272461, -10.495065689086914, -10.092283248901367, -9.689499855041504, -9.286717414855957, -8.88393497467041, -8.481152534484863, -8.078369140625, -7.6755876541137695, -7.272805213928223, -6.870022296905518, -6.467239856719971, -6.064456939697266, -5.661674499511719, -5.258892059326172, -4.856109142303467, -4.453326225280762, -4.050543785095215, -3.6477608680725098, -3.244978427886963, -2.842195510864258, -2.439413070678711, -2.036630392074585, -1.633847713470459, -1.231065034866333, -0.828282356262207, -0.42549973726272583, -0.02271711826324463, 0.38006556034088135, 0.7828481197357178, 1.1856307983398438, 1.5884134769439697, 1.9911961555480957, 2.3939788341522217, 2.7967615127563477, 3.1995439529418945, 3.6023268699645996, 4.0051093101501465, 4.407892227172852, 4.810674667358398, 5.213457107543945, 5.616239547729492, 6.019022464752197, 6.421804904937744, 6.824587821960449, 7.227370262145996, 7.630152702331543, 8.032936096191406, 8.435718536376953]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 1.0, 8.0, 14.0, 11.0, 10.0, 22.0, 14.0, 21.0, 22.0, 18.0, 20.0, 25.0, 28.0, 31.0, 41.0, 46.0, 33.0, 56.0, 42.0, 32.0, 37.0, 53.0, 41.0, 39.0, 36.0, 37.0, 32.0, 31.0, 34.0, 24.0, 19.0, 18.0, 17.0, 12.0, 13.0, 8.0, 5.0, 10.0, 8.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.799412727355957, -13.32646369934082, -12.853514671325684, -12.380565643310547, -11.907617568969727, -11.43466854095459, -10.961719512939453, -10.488770484924316, -10.01582145690918, -9.542872428894043, -9.069923400878906, -8.596975326538086, -8.12402629852295, -7.6510772705078125, -7.178128242492676, -6.705179214477539, -6.232231140136719, -5.759282112121582, -5.2863335609436035, -4.813384532928467, -4.340435981750488, -3.8674869537353516, -3.394537925720215, -2.9215891361236572, -2.4486403465270996, -1.975691556930542, -1.5027426481246948, -1.0297937393188477, -0.55684494972229, -0.08389616012573242, 0.3890528678894043, 0.8620016574859619, 1.3349494934082031, 1.8078982830047607, 2.2808470726013184, 2.753796100616455, 3.2267448902130127, 3.6996936798095703, 4.172642707824707, 4.645591735839844, 5.118540287017822, 5.591489315032959, 6.0644378662109375, 6.537386894226074, 7.010335922241211, 7.4832844734191895, 7.956233501434326, 8.429182052612305, 8.902131080627441, 9.375080108642578, 9.848029136657715, 10.320978164672852, 10.793926239013672, 11.266875267028809, 11.739824295043945, 12.212773323059082, 12.685722351074219, 13.158671379089355, 13.631620407104492, 14.104568481445312, 14.57751750946045, 15.050466537475586, 15.523415565490723, 15.99636459350586, 16.46931266784668]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 3.0, 12.0, 14.0, 11.0, 26.0, 15.0, 14.0, 31.0, 38.0, 36.0, 37.0, 36.0, 38.0, 56.0, 40.0, 42.0, 51.0, 30.0, 44.0, 48.0, 59.0, 46.0, 30.0, 32.0, 28.0, 24.0, 26.0, 15.0, 23.0, 10.0, 15.0, 13.0, 9.0, 9.0, 6.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.0925445556640625, -2.028839111328125, -1.9651336669921875, -1.90142822265625, -1.8377227783203125, -1.774017333984375, -1.7103118896484375, -1.6466064453125, -1.5829010009765625, -1.519195556640625, -1.4554901123046875, -1.39178466796875, -1.3280792236328125, -1.264373779296875, -1.2006683349609375, -1.136962890625, -1.0732574462890625, -1.009552001953125, -0.9458465576171875, -0.88214111328125, -0.8184356689453125, -0.754730224609375, -0.6910247802734375, -0.6273193359375, -0.5636138916015625, -0.499908447265625, -0.4362030029296875, -0.37249755859375, -0.3087921142578125, -0.245086669921875, -0.1813812255859375, -0.11767578125, -0.0539703369140625, 0.009735107421875, 0.0734405517578125, 0.13714599609375, 0.2008514404296875, 0.264556884765625, 0.3282623291015625, 0.3919677734375, 0.4556732177734375, 0.519378662109375, 0.5830841064453125, 0.64678955078125, 0.7104949951171875, 0.774200439453125, 0.8379058837890625, 0.901611328125, 0.9653167724609375, 1.029022216796875, 1.0927276611328125, 1.15643310546875, 1.2201385498046875, 1.283843994140625, 1.3475494384765625, 1.4112548828125, 1.4749603271484375, 1.538665771484375, 1.6023712158203125, 1.66607666015625, 1.7297821044921875, 1.793487548828125, 1.8571929931640625, 1.9208984375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 7.0, 10.0, 10.0, 14.0, 17.0, 25.0, 43.0, 47.0, 98.0, 111.0, 208.0, 311.0, 530.0, 825.0, 1512.0, 2720.0, 5484.0, 12120.0, 31892.0, 125431.0, 842991.0, 2412240.0, 610684.0, 97824.0, 27526.0, 10628.0, 4987.0, 2532.0, 1431.0, 775.0, 492.0, 272.0, 174.0, 106.0, 65.0, 40.0, 32.0, 21.0, 12.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.587890625, -3.48052978515625, -3.3731689453125, -3.26580810546875, -3.158447265625, -3.05108642578125, -2.9437255859375, -2.83636474609375, -2.72900390625, -2.62164306640625, -2.5142822265625, -2.40692138671875, -2.299560546875, -2.19219970703125, -2.0848388671875, -1.97747802734375, -1.8701171875, -1.76275634765625, -1.6553955078125, -1.54803466796875, -1.440673828125, -1.33331298828125, -1.2259521484375, -1.11859130859375, -1.01123046875, -0.90386962890625, -0.7965087890625, -0.68914794921875, -0.581787109375, -0.47442626953125, -0.3670654296875, -0.25970458984375, -0.15234375, -0.04498291015625, 0.0623779296875, 0.16973876953125, 0.277099609375, 0.38446044921875, 0.4918212890625, 0.59918212890625, 0.70654296875, 0.81390380859375, 0.9212646484375, 1.02862548828125, 1.135986328125, 1.24334716796875, 1.3507080078125, 1.45806884765625, 1.5654296875, 1.67279052734375, 1.7801513671875, 1.88751220703125, 1.994873046875, 2.10223388671875, 2.2095947265625, 2.31695556640625, 2.42431640625, 2.53167724609375, 2.6390380859375, 2.74639892578125, 2.853759765625, 2.96112060546875, 3.0684814453125, 3.17584228515625, 3.283203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 5.0, 4.0, 12.0, 16.0, 16.0, 21.0, 27.0, 38.0, 76.0, 78.0, 99.0, 129.0, 186.0, 294.0, 389.0, 508.0, 528.0, 459.0, 329.0, 230.0, 154.0, 113.0, 72.0, 71.0, 54.0, 32.0, 29.0, 35.0, 14.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.96484375, -2.875396728515625, -2.78594970703125, -2.696502685546875, -2.6070556640625, -2.517608642578125, -2.42816162109375, -2.338714599609375, -2.249267578125, -2.159820556640625, -2.07037353515625, -1.980926513671875, -1.8914794921875, -1.802032470703125, -1.71258544921875, -1.623138427734375, -1.53369140625, -1.444244384765625, -1.35479736328125, -1.265350341796875, -1.1759033203125, -1.086456298828125, -0.99700927734375, -0.907562255859375, -0.818115234375, -0.728668212890625, -0.63922119140625, -0.549774169921875, -0.4603271484375, -0.370880126953125, -0.28143310546875, -0.191986083984375, -0.1025390625, -0.013092041015625, 0.07635498046875, 0.165802001953125, 0.2552490234375, 0.344696044921875, 0.43414306640625, 0.523590087890625, 0.613037109375, 0.702484130859375, 0.79193115234375, 0.881378173828125, 0.9708251953125, 1.060272216796875, 1.14971923828125, 1.239166259765625, 1.32861328125, 1.418060302734375, 1.50750732421875, 1.596954345703125, 1.6864013671875, 1.775848388671875, 1.86529541015625, 1.954742431640625, 2.044189453125, 2.133636474609375, 2.22308349609375, 2.312530517578125, 2.4019775390625, 2.491424560546875, 2.58087158203125, 2.670318603515625, 2.759765625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 15.0, 30.0, 41.0, 50.0, 68.0, 119.0, 182.0, 232.0, 481.0, 914.0, 2104.0, 6826.0, 30855.0, 274431.0, 3461930.0, 366515.0, 36954.0, 7972.0, 2280.0, 953.0, 478.0, 274.0, 171.0, 122.0, 62.0, 50.0, 24.0, 18.0, 23.0, 17.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.4248046875, -7.189453125, -6.9541015625, -6.71875, -6.4833984375, -6.248046875, -6.0126953125, -5.77734375, -5.5419921875, -5.306640625, -5.0712890625, -4.8359375, -4.6005859375, -4.365234375, -4.1298828125, -3.89453125, -3.6591796875, -3.423828125, -3.1884765625, -2.953125, -2.7177734375, -2.482421875, -2.2470703125, -2.01171875, -1.7763671875, -1.541015625, -1.3056640625, -1.0703125, -0.8349609375, -0.599609375, -0.3642578125, -0.12890625, 0.1064453125, 0.341796875, 0.5771484375, 0.8125, 1.0478515625, 1.283203125, 1.5185546875, 1.75390625, 1.9892578125, 2.224609375, 2.4599609375, 2.6953125, 2.9306640625, 3.166015625, 3.4013671875, 3.63671875, 3.8720703125, 4.107421875, 4.3427734375, 4.578125, 4.8134765625, 5.048828125, 5.2841796875, 5.51953125, 5.7548828125, 5.990234375, 6.2255859375, 6.4609375, 6.6962890625, 6.931640625, 7.1669921875, 7.40234375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 43.0, 121.0, 303.0, 323.0, 152.0, 49.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.864646911621094, -43.6187744140625, -42.37290573120117, -41.127037048339844, -39.88116455078125, -38.635292053222656, -37.38942337036133, -36.1435546875, -34.897682189941406, -33.65180969238281, -32.405941009521484, -31.160070419311523, -29.914199829101562, -28.6683292388916, -27.42245864868164, -26.17658805847168, -24.93071746826172, -23.684846878051758, -22.438976287841797, -21.193105697631836, -19.947235107421875, -18.701364517211914, -17.455493927001953, -16.209623336791992, -14.963752746582031, -13.71788215637207, -12.47201156616211, -11.226140975952148, -9.980270385742188, -8.734399795532227, -7.488529205322266, -6.242658615112305, -4.996788024902344, -3.750917434692383, -2.505046844482422, -1.259176254272461, -0.0133056640625, 1.232564926147461, 2.478435516357422, 3.724306106567383, 4.970176696777344, 6.216047286987305, 7.461917877197266, 8.707788467407227, 9.953659057617188, 11.199529647827148, 12.44540023803711, 13.69127082824707, 14.937141418457031, 16.183012008666992, 17.428882598876953, 18.674753189086914, 19.920623779296875, 21.166494369506836, 22.412364959716797, 23.658235549926758, 24.90410614013672, 26.14997673034668, 27.39584732055664, 28.6417179107666, 29.887588500976562, 31.133459091186523, 32.379329681396484, 33.62519836425781, 34.871070861816406]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 6.0, 9.0, 6.0, 16.0, 15.0, 16.0, 23.0, 28.0, 21.0, 25.0, 31.0, 28.0, 34.0, 33.0, 42.0, 42.0, 45.0, 27.0, 42.0, 40.0, 36.0, 35.0, 44.0, 37.0, 35.0, 29.0, 35.0, 27.0, 24.0, 29.0, 16.0, 19.0, 19.0, 16.0, 13.0, 7.0, 13.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.684999465942383, -8.395992279052734, -8.10698413848877, -7.817976951599121, -7.5289692878723145, -7.239961624145508, -6.950954437255859, -6.661946773529053, -6.372939109802246, -6.0839314460754395, -5.794924259185791, -5.505916595458984, -5.216908931732178, -4.927901268005371, -4.638894081115723, -4.349886417388916, -4.060879230499268, -3.77187180519104, -3.4828641414642334, -3.193856716156006, -2.904849052429199, -2.6158416271209717, -2.326834201812744, -2.0378265380859375, -1.74881911277771, -1.4598115682601929, -1.1708040237426758, -0.8817965984344482, -0.5927890539169312, -0.30378150939941406, -0.014774084091186523, 0.2742335796356201, 0.5632410049438477, 0.8522485494613647, 1.1412560939788818, 1.4302635192871094, 1.7192710638046265, 2.0082786083221436, 2.297286033630371, 2.5862936973571777, 2.8753011226654053, 3.164308547973633, 3.4533162117004395, 3.742323637008667, 4.0313310623168945, 4.320338726043701, 4.609346389770508, 4.898353576660156, 5.187361240386963, 5.4763689041137695, 5.765376091003418, 6.054383754730225, 6.343391418457031, 6.63239860534668, 6.921406269073486, 7.210413932800293, 7.499421119689941, 7.788428783416748, 8.077436447143555, 8.366443634033203, 8.655450820922852, 8.944458961486816, 9.233466148376465, 9.52247428894043, 9.811481475830078]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 9.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 15.0, 15.0, 21.0, 30.0, 31.0, 30.0, 31.0, 45.0, 36.0, 35.0, 43.0, 40.0, 49.0, 53.0, 59.0, 52.0, 49.0, 31.0, 45.0, 29.0, 24.0, 28.0, 30.0, 15.0, 18.0, 14.0, 11.0, 12.0, 11.0, 14.0, 5.0, 8.0, 3.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.158203125, -2.0951690673828125, -2.032135009765625, -1.9691009521484375, -1.90606689453125, -1.8430328369140625, -1.779998779296875, -1.7169647216796875, -1.6539306640625, -1.5908966064453125, -1.527862548828125, -1.4648284912109375, -1.40179443359375, -1.3387603759765625, -1.275726318359375, -1.2126922607421875, -1.149658203125, -1.0866241455078125, -1.023590087890625, -0.9605560302734375, -0.89752197265625, -0.8344879150390625, -0.771453857421875, -0.7084197998046875, -0.6453857421875, -0.5823516845703125, -0.519317626953125, -0.4562835693359375, -0.39324951171875, -0.3302154541015625, -0.267181396484375, -0.2041473388671875, -0.14111328125, -0.0780792236328125, -0.015045166015625, 0.0479888916015625, 0.11102294921875, 0.1740570068359375, 0.237091064453125, 0.3001251220703125, 0.3631591796875, 0.4261932373046875, 0.489227294921875, 0.5522613525390625, 0.61529541015625, 0.6783294677734375, 0.741363525390625, 0.8043975830078125, 0.867431640625, 0.9304656982421875, 0.993499755859375, 1.0565338134765625, 1.11956787109375, 1.1826019287109375, 1.245635986328125, 1.3086700439453125, 1.3717041015625, 1.4347381591796875, 1.497772216796875, 1.5608062744140625, 1.62384033203125, 1.6868743896484375, 1.749908447265625, 1.8129425048828125, 1.8759765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 19.0, 16.0, 35.0, 48.0, 91.0, 154.0, 233.0, 356.0, 520.0, 870.0, 1424.0, 2172.0, 3503.0, 5448.0, 8578.0, 13411.0, 20996.0, 32253.0, 48264.0, 72016.0, 102473.0, 132454.0, 148352.0, 134352.0, 104011.0, 74081.0, 49665.0, 33284.0, 21473.0, 13749.0, 8790.0, 5554.0, 3619.0, 2264.0, 1468.0, 937.0, 631.0, 378.0, 216.0, 134.0, 96.0, 60.0, 28.0, 20.0, 22.0, 13.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2476806640625, -0.23956871032714844, -0.23145675659179688, -0.2233448028564453, -0.21523284912109375, -0.2071208953857422, -0.19900894165039062, -0.19089698791503906, -0.1827850341796875, -0.17467308044433594, -0.16656112670898438, -0.1584491729736328, -0.15033721923828125, -0.1422252655029297, -0.13411331176757812, -0.12600135803222656, -0.117889404296875, -0.10977745056152344, -0.10166549682617188, -0.09355354309082031, -0.08544158935546875, -0.07732963562011719, -0.06921768188476562, -0.06110572814941406, -0.0529937744140625, -0.04488182067871094, -0.036769866943359375, -0.028657913208007812, -0.02054595947265625, -0.012434005737304688, -0.004322052001953125, 0.0037899017333984375, 0.01190185546875, 0.020013809204101562, 0.028125762939453125, 0.03623771667480469, 0.04434967041015625, 0.05246162414550781, 0.060573577880859375, 0.06868553161621094, 0.0767974853515625, 0.08490943908691406, 0.09302139282226562, 0.10113334655761719, 0.10924530029296875, 0.11735725402832031, 0.12546920776367188, 0.13358116149902344, 0.141693115234375, 0.14980506896972656, 0.15791702270507812, 0.1660289764404297, 0.17414093017578125, 0.1822528839111328, 0.19036483764648438, 0.19847679138183594, 0.2065887451171875, 0.21470069885253906, 0.22281265258789062, 0.2309246063232422, 0.23903656005859375, 0.2471485137939453, 0.2552604675292969, 0.26337242126464844, 0.271484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 7.0, 13.0, 7.0, 16.0, 23.0, 20.0, 22.0, 18.0, 27.0, 22.0, 32.0, 27.0, 26.0, 32.0, 50.0, 29.0, 38.0, 48.0, 1064.0, 40.0, 46.0, 27.0, 45.0, 33.0, 29.0, 32.0, 31.0, 28.0, 27.0, 23.0, 21.0, 20.0, 13.0, 11.0, 7.0, 12.0, 11.0, 6.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2666015625, -1.22613525390625, -1.1856689453125, -1.14520263671875, -1.104736328125, -1.06427001953125, -1.0238037109375, -0.98333740234375, -0.94287109375, -0.90240478515625, -0.8619384765625, -0.82147216796875, -0.781005859375, -0.74053955078125, -0.7000732421875, -0.65960693359375, -0.619140625, -0.57867431640625, -0.5382080078125, -0.49774169921875, -0.457275390625, -0.41680908203125, -0.3763427734375, -0.33587646484375, -0.29541015625, -0.25494384765625, -0.2144775390625, -0.17401123046875, -0.133544921875, -0.09307861328125, -0.0526123046875, -0.01214599609375, 0.0283203125, 0.06878662109375, 0.1092529296875, 0.14971923828125, 0.190185546875, 0.23065185546875, 0.2711181640625, 0.31158447265625, 0.35205078125, 0.39251708984375, 0.4329833984375, 0.47344970703125, 0.513916015625, 0.55438232421875, 0.5948486328125, 0.63531494140625, 0.67578125, 0.71624755859375, 0.7567138671875, 0.79718017578125, 0.837646484375, 0.87811279296875, 0.9185791015625, 0.95904541015625, 0.99951171875, 1.03997802734375, 1.0804443359375, 1.12091064453125, 1.161376953125, 1.20184326171875, 1.2423095703125, 1.28277587890625, 1.3232421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 14.0, 19.0, 30.0, 47.0, 54.0, 100.0, 123.0, 180.0, 231.0, 314.0, 471.0, 712.0, 990.0, 1456.0, 2315.0, 3339.0, 4974.0, 7474.0, 11378.0, 18604.0, 41612.0, 262182.0, 1571324.0, 98122.0, 27431.0, 14745.0, 9313.0, 6198.0, 4155.0, 2946.0, 1902.0, 1355.0, 907.0, 612.0, 432.0, 297.0, 223.0, 148.0, 102.0, 72.0, 60.0, 46.0, 26.0, 28.0, 15.0, 14.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412841796875, -0.39920806884765625, -0.3855743408203125, -0.37194061279296875, -0.358306884765625, -0.34467315673828125, -0.3310394287109375, -0.31740570068359375, -0.30377197265625, -0.29013824462890625, -0.2765045166015625, -0.26287078857421875, -0.249237060546875, -0.23560333251953125, -0.2219696044921875, -0.20833587646484375, -0.1947021484375, -0.18106842041015625, -0.1674346923828125, -0.15380096435546875, -0.140167236328125, -0.12653350830078125, -0.1128997802734375, -0.09926605224609375, -0.08563232421875, -0.07199859619140625, -0.0583648681640625, -0.04473114013671875, -0.031097412109375, -0.01746368408203125, -0.0038299560546875, 0.00980377197265625, 0.0234375, 0.03707122802734375, 0.0507049560546875, 0.06433868408203125, 0.077972412109375, 0.09160614013671875, 0.1052398681640625, 0.11887359619140625, 0.13250732421875, 0.14614105224609375, 0.1597747802734375, 0.17340850830078125, 0.187042236328125, 0.20067596435546875, 0.2143096923828125, 0.22794342041015625, 0.2415771484375, 0.25521087646484375, 0.2688446044921875, 0.28247833251953125, 0.296112060546875, 0.30974578857421875, 0.3233795166015625, 0.33701324462890625, 0.35064697265625, 0.36428070068359375, 0.3779144287109375, 0.39154815673828125, 0.405181884765625, 0.41881561279296875, 0.4324493408203125, 0.44608306884765625, 0.459716796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 4.0, 6.0, 10.0, 10.0, 7.0, 12.0, 15.0, 22.0, 36.0, 27.0, 26.0, 35.0, 40.0, 43.0, 44.0, 56.0, 55.0, 48.0, 64.0, 54.0, 49.0, 60.0, 38.0, 40.0, 34.0, 20.0, 22.0, 15.0, 12.0, 14.0, 17.0, 8.0, 9.0, 10.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0222625732421875, -0.02152729034423828, -0.020792007446289062, -0.020056724548339844, -0.019321441650390625, -0.018586158752441406, -0.017850875854492188, -0.01711559295654297, -0.01638031005859375, -0.01564502716064453, -0.014909744262695312, -0.014174461364746094, -0.013439178466796875, -0.012703895568847656, -0.011968612670898438, -0.011233329772949219, -0.010498046875, -0.009762763977050781, -0.009027481079101562, -0.008292198181152344, -0.007556915283203125, -0.006821632385253906, -0.0060863494873046875, -0.005351066589355469, -0.00461578369140625, -0.0038805007934570312, -0.0031452178955078125, -0.0024099349975585938, -0.001674652099609375, -0.0009393692016601562, -0.0002040863037109375, 0.0005311965942382812, 0.0012664794921875, 0.0020017623901367188, 0.0027370452880859375, 0.0034723281860351562, 0.004207611083984375, 0.004942893981933594, 0.0056781768798828125, 0.006413459777832031, 0.00714874267578125, 0.007884025573730469, 0.008619308471679688, 0.009354591369628906, 0.010089874267578125, 0.010825157165527344, 0.011560440063476562, 0.012295722961425781, 0.013031005859375, 0.013766288757324219, 0.014501571655273438, 0.015236854553222656, 0.015972137451171875, 0.016707420349121094, 0.017442703247070312, 0.01817798614501953, 0.01891326904296875, 0.01964855194091797, 0.020383834838867188, 0.021119117736816406, 0.021854400634765625, 0.022589683532714844, 0.023324966430664062, 0.02406024932861328, 0.0247955322265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 8.0, 11.0, 11.0, 16.0, 21.0, 15.0, 27.0, 38.0, 60.0, 71.0, 102.0, 139.0, 223.0, 471.0, 2133.0, 260482.0, 778236.0, 5083.0, 571.0, 232.0, 165.0, 101.0, 61.0, 56.0, 34.0, 43.0, 30.0, 15.0, 14.0, 13.0, 7.0, 6.0, 5.0, 5.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52734375, -0.5118904113769531, -0.49643707275390625, -0.4809837341308594, -0.4655303955078125, -0.4500770568847656, -0.43462371826171875, -0.4191703796386719, -0.403717041015625, -0.3882637023925781, -0.37281036376953125, -0.3573570251464844, -0.3419036865234375, -0.3264503479003906, -0.31099700927734375, -0.2955436706542969, -0.28009033203125, -0.2646369934082031, -0.24918365478515625, -0.23373031616210938, -0.2182769775390625, -0.20282363891601562, -0.18737030029296875, -0.17191696166992188, -0.156463623046875, -0.14101028442382812, -0.12555694580078125, -0.11010360717773438, -0.0946502685546875, -0.07919692993164062, -0.06374359130859375, -0.048290252685546875, -0.0328369140625, -0.017383575439453125, -0.00193023681640625, 0.013523101806640625, 0.0289764404296875, 0.044429779052734375, 0.05988311767578125, 0.07533645629882812, 0.090789794921875, 0.10624313354492188, 0.12169647216796875, 0.13714981079101562, 0.1526031494140625, 0.16805648803710938, 0.18350982666015625, 0.19896316528320312, 0.21441650390625, 0.22986984252929688, 0.24532318115234375, 0.2607765197753906, 0.2762298583984375, 0.2916831970214844, 0.30713653564453125, 0.3225898742675781, 0.338043212890625, 0.3534965515136719, 0.36894989013671875, 0.3844032287597656, 0.3998565673828125, 0.4153099060058594, 0.43076324462890625, 0.4462165832519531, 0.461669921875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 606.0, 387.0, 13.0], "bins": [-0.7706297636032104, -0.7581807374954224, -0.7457316517829895, -0.7332825660705566, -0.7208335399627686, -0.7083845138549805, -0.6959354281425476, -0.6834863424301147, -0.6710373163223267, -0.6585882902145386, -0.6461392045021057, -0.6336901187896729, -0.6212410926818848, -0.6087920665740967, -0.5963429808616638, -0.583893895149231, -0.5714448690414429, -0.5589958429336548, -0.5465467572212219, -0.5340976715087891, -0.521648645401001, -0.5091996192932129, -0.49675053358078003, -0.48430147767066956, -0.4718524217605591, -0.4594033658504486, -0.44695430994033813, -0.43450525403022766, -0.4220561981201172, -0.4096071422100067, -0.39715808629989624, -0.38470903038978577, -0.3722599446773529, -0.35981088876724243, -0.34736183285713196, -0.3349127769470215, -0.322463721036911, -0.31001466512680054, -0.29756560921669006, -0.2851165533065796, -0.2726674973964691, -0.26021844148635864, -0.24776938557624817, -0.2353203296661377, -0.22287127375602722, -0.21042221784591675, -0.19797316193580627, -0.1855241060256958, -0.17307506501674652, -0.16062600910663605, -0.14817695319652557, -0.1357278972864151, -0.12327884137630463, -0.11082978546619415, -0.09838072955608368, -0.0859316736459732, -0.07348261028528214, -0.06103355437517166, -0.04858449846506119, -0.036135442554950714, -0.02368638664484024, -0.011237330734729767, 0.0012117251753807068, 0.01366078108549118, 0.026109835132956505]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 10.0, 5.0, 8.0, 11.0, 13.0, 12.0, 14.0, 19.0, 25.0, 31.0, 36.0, 27.0, 27.0, 33.0, 53.0, 42.0, 49.0, 42.0, 38.0, 39.0, 50.0, 39.0, 43.0, 38.0, 39.0, 37.0, 30.0, 30.0, 30.0, 22.0, 16.0, 16.0, 16.0, 7.0, 12.0, 5.0, 7.0, 7.0, 2.0, 5.0, 1.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02419590950012207, -0.02327083796262741, -0.0223457682877779, -0.02142069861292839, -0.02049562707543373, -0.01957055553793907, -0.01864548586308956, -0.01772041618824005, -0.016795344650745392, -0.015870273113250732, -0.014945203438401222, -0.014020132832229137, -0.013095062226057053, -0.012169991619884968, -0.011244921013712883, -0.010319850407540798, -0.009394779801368713, -0.008469709195196629, -0.007544638589024544, -0.006619567982852459, -0.005694497376680374, -0.004769426770508289, -0.0038443561643362045, -0.0029192855581641197, -0.001994214951992035, -0.00106914434581995, -0.0001440737396478653, 0.0007809968665242195, 0.0017060674726963043, 0.002631138078868389, 0.003556208685040474, 0.004481279291212559, 0.0054063498973846436, 0.006331420503556728, 0.007256491109728813, 0.008181561715900898, 0.009106632322072983, 0.010031702928245068, 0.010956773534417152, 0.011881844140589237, 0.012806914746761322, 0.013731985352933407, 0.014657055959105492, 0.015582126565277576, 0.01650719717144966, 0.01743226870894432, 0.01835733838379383, 0.01928240805864334, 0.020207479596138, 0.02113255113363266, 0.02205762080848217, 0.02298269048333168, 0.02390776202082634, 0.024832833558321, 0.02575790323317051, 0.02668297290802002, 0.02760804444551468, 0.02853311598300934, 0.02945818565785885, 0.03038325533270836, 0.03130832687020302, 0.03223339840769768, 0.03315846621990204, 0.0340835377573967, 0.03500860929489136]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 5.0, 8.0, 16.0, 9.0, 12.0, 9.0, 17.0, 11.0, 19.0, 39.0, 36.0, 30.0, 35.0, 36.0, 41.0, 48.0, 53.0, 39.0, 32.0, 30.0, 59.0, 60.0, 49.0, 32.0, 30.0, 37.0, 44.0, 27.0, 21.0, 14.0, 16.0, 12.0, 10.0, 15.0, 8.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.0547637939453125, -1.992340087890625, -1.9299163818359375, -1.86749267578125, -1.8050689697265625, -1.742645263671875, -1.6802215576171875, -1.6177978515625, -1.5553741455078125, -1.492950439453125, -1.4305267333984375, -1.36810302734375, -1.3056793212890625, -1.243255615234375, -1.1808319091796875, -1.118408203125, -1.0559844970703125, -0.993560791015625, -0.9311370849609375, -0.86871337890625, -0.8062896728515625, -0.743865966796875, -0.6814422607421875, -0.6190185546875, -0.5565948486328125, -0.494171142578125, -0.4317474365234375, -0.36932373046875, -0.3069000244140625, -0.244476318359375, -0.1820526123046875, -0.11962890625, -0.0572052001953125, 0.005218505859375, 0.0676422119140625, 0.13006591796875, 0.1924896240234375, 0.254913330078125, 0.3173370361328125, 0.3797607421875, 0.4421844482421875, 0.504608154296875, 0.5670318603515625, 0.62945556640625, 0.6918792724609375, 0.754302978515625, 0.8167266845703125, 0.879150390625, 0.9415740966796875, 1.003997802734375, 1.0664215087890625, 1.12884521484375, 1.1912689208984375, 1.253692626953125, 1.3161163330078125, 1.3785400390625, 1.4409637451171875, 1.503387451171875, 1.5658111572265625, 1.62823486328125, 1.6906585693359375, 1.753082275390625, 1.8155059814453125, 1.8779296875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 11.0, 19.0, 27.0, 40.0, 56.0, 100.0, 109.0, 205.0, 310.0, 496.0, 784.0, 1225.0, 2176.0, 3475.0, 6252.0, 12274.0, 25550.0, 61560.0, 166665.0, 387771.0, 231774.0, 81061.0, 32797.0, 15308.0, 7870.0, 4235.0, 2503.0, 1442.0, 923.0, 512.0, 359.0, 231.0, 142.0, 80.0, 61.0, 48.0, 28.0, 26.0, 15.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0], "bins": [-3.044921875, -2.96405029296875, -2.8831787109375, -2.80230712890625, -2.721435546875, -2.64056396484375, -2.5596923828125, -2.47882080078125, -2.39794921875, -2.31707763671875, -2.2362060546875, -2.15533447265625, -2.074462890625, -1.99359130859375, -1.9127197265625, -1.83184814453125, -1.7509765625, -1.67010498046875, -1.5892333984375, -1.50836181640625, -1.427490234375, -1.34661865234375, -1.2657470703125, -1.18487548828125, -1.10400390625, -1.02313232421875, -0.9422607421875, -0.86138916015625, -0.780517578125, -0.69964599609375, -0.6187744140625, -0.53790283203125, -0.45703125, -0.37615966796875, -0.2952880859375, -0.21441650390625, -0.133544921875, -0.05267333984375, 0.0281982421875, 0.10906982421875, 0.18994140625, 0.27081298828125, 0.3516845703125, 0.43255615234375, 0.513427734375, 0.59429931640625, 0.6751708984375, 0.75604248046875, 0.8369140625, 0.91778564453125, 0.9986572265625, 1.07952880859375, 1.160400390625, 1.24127197265625, 1.3221435546875, 1.40301513671875, 1.48388671875, 1.56475830078125, 1.6456298828125, 1.72650146484375, 1.807373046875, 1.88824462890625, 1.9691162109375, 2.04998779296875, 2.130859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 12.0, 9.0, 17.0, 21.0, 16.0, 18.0, 26.0, 25.0, 23.0, 39.0, 30.0, 50.0, 51.0, 66.0, 110.0, 231.0, 1442.0, 275.0, 130.0, 81.0, 61.0, 41.0, 41.0, 33.0, 27.0, 32.0, 25.0, 20.0, 18.0, 13.0, 16.0, 10.0, 6.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.86328125, -3.6927490234375, -3.522216796875, -3.3516845703125, -3.18115234375, -3.0106201171875, -2.840087890625, -2.6695556640625, -2.4990234375, -2.3284912109375, -2.157958984375, -1.9874267578125, -1.81689453125, -1.6463623046875, -1.475830078125, -1.3052978515625, -1.134765625, -0.9642333984375, -0.793701171875, -0.6231689453125, -0.45263671875, -0.2821044921875, -0.111572265625, 0.0589599609375, 0.2294921875, 0.4000244140625, 0.570556640625, 0.7410888671875, 0.91162109375, 1.0821533203125, 1.252685546875, 1.4232177734375, 1.59375, 1.7642822265625, 1.934814453125, 2.1053466796875, 2.27587890625, 2.4464111328125, 2.616943359375, 2.7874755859375, 2.9580078125, 3.1285400390625, 3.299072265625, 3.4696044921875, 3.64013671875, 3.8106689453125, 3.981201171875, 4.1517333984375, 4.322265625, 4.4927978515625, 4.663330078125, 4.8338623046875, 5.00439453125, 5.1749267578125, 5.345458984375, 5.5159912109375, 5.6865234375, 5.8570556640625, 6.027587890625, 6.1981201171875, 6.36865234375, 6.5391845703125, 6.709716796875, 6.8802490234375, 7.05078125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 13.0, 13.0, 13.0, 20.0, 46.0, 57.0, 77.0, 126.0, 300.0, 664.0, 1954.0, 6869.0, 37737.0, 1083012.0, 1953373.0, 49513.0, 8178.0, 2279.0, 789.0, 289.0, 144.0, 85.0, 51.0, 29.0, 16.0, 14.0, 9.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.171875, -8.92437744140625, -8.6768798828125, -8.42938232421875, -8.181884765625, -7.93438720703125, -7.6868896484375, -7.43939208984375, -7.19189453125, -6.94439697265625, -6.6968994140625, -6.44940185546875, -6.201904296875, -5.95440673828125, -5.7069091796875, -5.45941162109375, -5.2119140625, -4.96441650390625, -4.7169189453125, -4.46942138671875, -4.221923828125, -3.97442626953125, -3.7269287109375, -3.47943115234375, -3.23193359375, -2.98443603515625, -2.7369384765625, -2.48944091796875, -2.241943359375, -1.99444580078125, -1.7469482421875, -1.49945068359375, -1.251953125, -1.00445556640625, -0.7569580078125, -0.50946044921875, -0.261962890625, -0.01446533203125, 0.2330322265625, 0.48052978515625, 0.72802734375, 0.97552490234375, 1.2230224609375, 1.47052001953125, 1.718017578125, 1.96551513671875, 2.2130126953125, 2.46051025390625, 2.7080078125, 2.95550537109375, 3.2030029296875, 3.45050048828125, 3.697998046875, 3.94549560546875, 4.1929931640625, 4.44049072265625, 4.68798828125, 4.93548583984375, 5.1829833984375, 5.43048095703125, 5.677978515625, 5.92547607421875, 6.1729736328125, 6.42047119140625, 6.66796875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 444.0, 558.0, 9.0], "bins": [-203.25067138671875, -199.97491455078125, -196.69915771484375, -193.4234161376953, -190.1476593017578, -186.8719024658203, -183.5961456298828, -180.32040405273438, -177.04464721679688, -173.76889038085938, -170.49313354492188, -167.21739196777344, -163.94163513183594, -160.66587829589844, -157.39012145996094, -154.1143798828125, -150.838623046875, -147.5628662109375, -144.287109375, -141.01136779785156, -137.73561096191406, -134.45985412597656, -131.18409729003906, -127.9083480834961, -124.63258361816406, -121.35682678222656, -118.0810775756836, -114.8053207397461, -111.52957153320312, -108.25381469726562, -104.97805786132812, -101.70230865478516, -98.42655944824219, -95.15080261230469, -91.87505340576172, -88.59929656982422, -85.32354736328125, -82.04779052734375, -78.77203369140625, -75.49628448486328, -72.22053527832031, -68.94477844238281, -65.66902923583984, -62.393272399902344, -59.117523193359375, -55.841766357421875, -52.56601333618164, -49.290260314941406, -46.014503479003906, -42.73875045776367, -39.46299743652344, -36.18724060058594, -32.91149139404297, -29.6357364654541, -26.359981536865234, -23.084228515625, -19.808475494384766, -16.53272247314453, -13.25696849822998, -9.98121452331543, -6.705461502075195, -3.429708480834961, -0.15395355224609375, 3.1217994689941406, 6.397552490234375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 5.0, 10.0, 14.0, 16.0, 10.0, 20.0, 19.0, 19.0, 34.0, 31.0, 25.0, 31.0, 37.0, 27.0, 38.0, 29.0, 39.0, 50.0, 36.0, 53.0, 44.0, 49.0, 38.0, 35.0, 26.0, 28.0, 30.0, 26.0, 15.0, 25.0, 17.0, 16.0, 12.0, 12.0, 16.0, 4.0, 10.0, 4.0, 12.0, 9.0, 6.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7178955078125, -11.34408187866211, -10.970268249511719, -10.596454620361328, -10.222640037536621, -9.84882640838623, -9.47501277923584, -9.10119915008545, -8.727384567260742, -8.353570938110352, -7.979756832122803, -7.605943202972412, -7.232129096984863, -6.858315467834473, -6.484501838684082, -6.110688209533691, -5.736874580383301, -5.36306095123291, -4.989246845245361, -4.615433216094971, -4.241619110107422, -3.8678054809570312, -3.4939918518066406, -3.120177984237671, -2.746364116668701, -2.3725502490997314, -1.9987365007400513, -1.624922752380371, -1.2511088848114014, -0.8772950172424316, -0.503481388092041, -0.1296675205230713, 0.24414634704589844, 0.6179601550102234, 0.9917739629745483, 1.3655877113342285, 1.7394015789031982, 2.113215446472168, 2.4870290756225586, 2.8608429431915283, 3.234656810760498, 3.6084706783294678, 3.9822845458984375, 4.356098175048828, 4.729911804199219, 5.103725910186768, 5.477539539337158, 5.851353645324707, 6.225167274475098, 6.598980903625488, 6.972795009613037, 7.346608638763428, 7.720422744750977, 8.094236373901367, 8.468050003051758, 8.841863632202148, 9.215677261352539, 9.58949089050293, 9.96330451965332, 10.337118148803711, 10.710932731628418, 11.084746360778809, 11.4585599899292, 11.83237361907959, 12.206188201904297]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 9.0, 10.0, 10.0, 13.0, 21.0, 21.0, 19.0, 28.0, 34.0, 42.0, 38.0, 34.0, 44.0, 40.0, 46.0, 47.0, 45.0, 43.0, 39.0, 50.0, 37.0, 39.0, 38.0, 42.0, 30.0, 26.0, 29.0, 22.0, 11.0, 8.0, 11.0, 9.0, 11.0, 6.0, 7.0, 4.0, 6.0, 7.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.189453125, -2.1242218017578125, -2.058990478515625, -1.9937591552734375, -1.92852783203125, -1.8632965087890625, -1.798065185546875, -1.7328338623046875, -1.6676025390625, -1.6023712158203125, -1.537139892578125, -1.4719085693359375, -1.40667724609375, -1.3414459228515625, -1.276214599609375, -1.2109832763671875, -1.145751953125, -1.0805206298828125, -1.015289306640625, -0.9500579833984375, -0.88482666015625, -0.8195953369140625, -0.754364013671875, -0.6891326904296875, -0.6239013671875, -0.5586700439453125, -0.493438720703125, -0.4282073974609375, -0.36297607421875, -0.2977447509765625, -0.232513427734375, -0.1672821044921875, -0.10205078125, -0.0368194580078125, 0.028411865234375, 0.0936431884765625, 0.15887451171875, 0.2241058349609375, 0.289337158203125, 0.3545684814453125, 0.4197998046875, 0.4850311279296875, 0.550262451171875, 0.6154937744140625, 0.68072509765625, 0.7459564208984375, 0.811187744140625, 0.8764190673828125, 0.941650390625, 1.0068817138671875, 1.072113037109375, 1.1373443603515625, 1.20257568359375, 1.2678070068359375, 1.333038330078125, 1.3982696533203125, 1.4635009765625, 1.5287322998046875, 1.593963623046875, 1.6591949462890625, 1.72442626953125, 1.7896575927734375, 1.854888916015625, 1.9201202392578125, 1.9853515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 12.0, 7.0, 7.0, 7.0, 7.0, 18.0, 18.0, 27.0, 52.0, 67.0, 85.0, 90.0, 160.0, 239.0, 306.0, 478.0, 659.0, 1048.0, 1721.0, 2689.0, 4738.0, 8844.0, 19592.0, 58414.0, 290522.0, 1647571.0, 1747638.0, 306015.0, 60990.0, 20366.0, 9255.0, 4824.0, 2776.0, 1707.0, 1057.0, 708.0, 456.0, 326.0, 222.0, 167.0, 112.0, 85.0, 51.0, 47.0, 39.0, 22.0, 11.0, 17.0, 9.0, 5.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.033203125, -2.9354248046875, -2.837646484375, -2.7398681640625, -2.64208984375, -2.5443115234375, -2.446533203125, -2.3487548828125, -2.2509765625, -2.1531982421875, -2.055419921875, -1.9576416015625, -1.85986328125, -1.7620849609375, -1.664306640625, -1.5665283203125, -1.46875, -1.3709716796875, -1.273193359375, -1.1754150390625, -1.07763671875, -0.9798583984375, -0.882080078125, -0.7843017578125, -0.6865234375, -0.5887451171875, -0.490966796875, -0.3931884765625, -0.29541015625, -0.1976318359375, -0.099853515625, -0.0020751953125, 0.095703125, 0.1934814453125, 0.291259765625, 0.3890380859375, 0.48681640625, 0.5845947265625, 0.682373046875, 0.7801513671875, 0.8779296875, 0.9757080078125, 1.073486328125, 1.1712646484375, 1.26904296875, 1.3668212890625, 1.464599609375, 1.5623779296875, 1.66015625, 1.7579345703125, 1.855712890625, 1.9534912109375, 2.05126953125, 2.1490478515625, 2.246826171875, 2.3446044921875, 2.4423828125, 2.5401611328125, 2.637939453125, 2.7357177734375, 2.83349609375, 2.9312744140625, 3.029052734375, 3.1268310546875, 3.224609375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 7.0, 8.0, 12.0, 11.0, 21.0, 29.0, 33.0, 47.0, 84.0, 99.0, 177.0, 212.0, 327.0, 501.0, 565.0, 548.0, 454.0, 281.0, 194.0, 150.0, 87.0, 36.0, 45.0, 34.0, 22.0, 16.0, 13.0, 13.0, 13.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.743804931640625, -2.65167236328125, -2.559539794921875, -2.4674072265625, -2.375274658203125, -2.28314208984375, -2.191009521484375, -2.098876953125, -2.006744384765625, -1.91461181640625, -1.822479248046875, -1.7303466796875, -1.638214111328125, -1.54608154296875, -1.453948974609375, -1.36181640625, -1.269683837890625, -1.17755126953125, -1.085418701171875, -0.9932861328125, -0.901153564453125, -0.80902099609375, -0.716888427734375, -0.624755859375, -0.532623291015625, -0.44049072265625, -0.348358154296875, -0.2562255859375, -0.164093017578125, -0.07196044921875, 0.020172119140625, 0.1123046875, 0.204437255859375, 0.29656982421875, 0.388702392578125, 0.4808349609375, 0.572967529296875, 0.66510009765625, 0.757232666015625, 0.849365234375, 0.941497802734375, 1.03363037109375, 1.125762939453125, 1.2178955078125, 1.310028076171875, 1.40216064453125, 1.494293212890625, 1.58642578125, 1.678558349609375, 1.77069091796875, 1.862823486328125, 1.9549560546875, 2.047088623046875, 2.13922119140625, 2.231353759765625, 2.323486328125, 2.415618896484375, 2.50775146484375, 2.599884033203125, 2.6920166015625, 2.784149169921875, 2.87628173828125, 2.968414306640625, 3.060546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 11.0, 12.0, 7.0, 22.0, 24.0, 34.0, 39.0, 59.0, 90.0, 131.0, 219.0, 350.0, 618.0, 1222.0, 2482.0, 5656.0, 14776.0, 46947.0, 209281.0, 2047530.0, 1626829.0, 173670.0, 41053.0, 13158.0, 5034.0, 2364.0, 1106.0, 598.0, 323.0, 205.0, 120.0, 73.0, 63.0, 53.0, 22.0, 24.0, 17.0, 10.0, 13.0, 5.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.64093017578125, -3.5006103515625, -3.36029052734375, -3.219970703125, -3.07965087890625, -2.9393310546875, -2.79901123046875, -2.65869140625, -2.51837158203125, -2.3780517578125, -2.23773193359375, -2.097412109375, -1.95709228515625, -1.8167724609375, -1.67645263671875, -1.5361328125, -1.39581298828125, -1.2554931640625, -1.11517333984375, -0.974853515625, -0.83453369140625, -0.6942138671875, -0.55389404296875, -0.41357421875, -0.27325439453125, -0.1329345703125, 0.00738525390625, 0.147705078125, 0.28802490234375, 0.4283447265625, 0.56866455078125, 0.708984375, 0.84930419921875, 0.9896240234375, 1.12994384765625, 1.270263671875, 1.41058349609375, 1.5509033203125, 1.69122314453125, 1.83154296875, 1.97186279296875, 2.1121826171875, 2.25250244140625, 2.392822265625, 2.53314208984375, 2.6734619140625, 2.81378173828125, 2.9541015625, 3.09442138671875, 3.2347412109375, 3.37506103515625, 3.515380859375, 3.65570068359375, 3.7960205078125, 3.93634033203125, 4.07666015625, 4.21697998046875, 4.3572998046875, 4.49761962890625, 4.637939453125, 4.77825927734375, 4.9185791015625, 5.05889892578125, 5.19921875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 6.0, 33.0, 112.0, 228.0, 315.0, 191.0, 97.0, 21.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-53.51313018798828, -52.47252655029297, -51.431922912597656, -50.39132308959961, -49.3507194519043, -48.310115814208984, -47.26951217651367, -46.22890853881836, -45.18830871582031, -44.147705078125, -43.10710144042969, -42.06650161743164, -41.02589797973633, -39.985294342041016, -38.9446907043457, -37.90408706665039, -36.86348342895508, -35.822879791259766, -34.78227615356445, -33.741676330566406, -32.701072692871094, -31.66046905517578, -30.61986541748047, -29.579261779785156, -28.538660049438477, -27.498056411743164, -26.457454681396484, -25.416851043701172, -24.37624740600586, -23.33564567565918, -22.295042037963867, -21.254440307617188, -20.21384048461914, -19.173236846923828, -18.13263511657715, -17.092031478881836, -16.051429748535156, -15.010826110839844, -13.970222473144531, -12.929619789123535, -11.889016151428223, -10.848413467407227, -9.807809829711914, -8.767207145690918, -7.726604461669922, -6.686001777648926, -5.6453986167907715, -4.604795455932617, -3.564192771911621, -2.523589849472046, -1.4829869270324707, -0.4423840045928955, 0.5982189178466797, 1.6388216018676758, 2.67942476272583, 3.7200279235839844, 4.7606306076049805, 5.801233291625977, 6.841836452484131, 7.882439613342285, 8.923042297363281, 9.963644981384277, 11.004247665405273, 12.044851303100586, 13.085453987121582]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 9.0, 13.0, 23.0, 20.0, 28.0, 28.0, 27.0, 33.0, 24.0, 27.0, 28.0, 45.0, 33.0, 40.0, 47.0, 32.0, 42.0, 33.0, 29.0, 44.0, 32.0, 35.0, 38.0, 34.0, 31.0, 26.0, 21.0, 20.0, 29.0, 14.0, 15.0, 14.0, 9.0, 8.0, 8.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.486639022827148, -8.215720176696777, -7.9448018074035645, -7.673883438110352, -7.4029645919799805, -7.132046222686768, -6.861127853393555, -6.590209007263184, -6.3192901611328125, -6.0483717918396, -5.7774529457092285, -5.506534576416016, -5.2356157302856445, -4.964697360992432, -4.693778991699219, -4.422860145568848, -4.151941776275635, -3.8810231685638428, -3.610104560852051, -3.339186191558838, -3.068267345428467, -2.797348976135254, -2.526430368423462, -2.25551176071167, -1.984593152999878, -1.713674545288086, -1.442755937576294, -1.1718374490737915, -0.9009188413619995, -0.6300002336502075, -0.3590817451477051, -0.08816313743591309, 0.1827554702758789, 0.4536740481853485, 0.7245926260948181, 0.9955111742019653, 1.2664297819137573, 1.5373483896255493, 1.8082668781280518, 2.0791854858398438, 2.3501040935516357, 2.6210227012634277, 2.8919413089752197, 3.1628599166870117, 3.4337782859802246, 3.7046971321105957, 3.9756155014038086, 4.24653434753418, 4.517452716827393, 4.7883710861206055, 5.059289932250977, 5.3302083015441895, 5.6011271476745605, 5.872045516967773, 6.1429643630981445, 6.413882732391357, 6.68480110168457, 6.955719470977783, 7.226638317108154, 7.497556686401367, 7.768475532531738, 8.03939437866211, 8.310312271118164, 8.581231117248535, 8.852149963378906]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 10.0, 14.0, 27.0, 23.0, 20.0, 27.0, 25.0, 37.0, 42.0, 24.0, 30.0, 35.0, 45.0, 43.0, 44.0, 58.0, 35.0, 40.0, 47.0, 50.0, 42.0, 36.0, 39.0, 31.0, 26.0, 17.0, 14.0, 15.0, 14.0, 14.0, 18.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9453125, -1.881927490234375, -1.81854248046875, -1.755157470703125, -1.6917724609375, -1.628387451171875, -1.56500244140625, -1.501617431640625, -1.438232421875, -1.374847412109375, -1.31146240234375, -1.248077392578125, -1.1846923828125, -1.121307373046875, -1.05792236328125, -0.994537353515625, -0.93115234375, -0.867767333984375, -0.80438232421875, -0.740997314453125, -0.6776123046875, -0.614227294921875, -0.55084228515625, -0.487457275390625, -0.424072265625, -0.360687255859375, -0.29730224609375, -0.233917236328125, -0.1705322265625, -0.107147216796875, -0.04376220703125, 0.019622802734375, 0.0830078125, 0.146392822265625, 0.20977783203125, 0.273162841796875, 0.3365478515625, 0.399932861328125, 0.46331787109375, 0.526702880859375, 0.590087890625, 0.653472900390625, 0.71685791015625, 0.780242919921875, 0.8436279296875, 0.907012939453125, 0.97039794921875, 1.033782958984375, 1.09716796875, 1.160552978515625, 1.22393798828125, 1.287322998046875, 1.3507080078125, 1.414093017578125, 1.47747802734375, 1.540863037109375, 1.604248046875, 1.667633056640625, 1.73101806640625, 1.794403076171875, 1.8577880859375, 1.921173095703125, 1.98455810546875, 2.047943115234375, 2.111328125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 17.0, 42.0, 54.0, 91.0, 128.0, 194.0, 269.0, 433.0, 577.0, 954.0, 1424.0, 2141.0, 3259.0, 4668.0, 6819.0, 10029.0, 14470.0, 21230.0, 30143.0, 42377.0, 58204.0, 77067.0, 96527.0, 113979.0, 118736.0, 108615.0, 90181.0, 70549.0, 52026.0, 38076.0, 26474.0, 18547.0, 12766.0, 8815.0, 6053.0, 4155.0, 2854.0, 1846.0, 1281.0, 842.0, 553.0, 383.0, 201.0, 156.0, 136.0, 65.0, 48.0, 31.0, 18.0, 17.0, 9.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.211181640625, -0.20444107055664062, -0.19770050048828125, -0.19095993041992188, -0.1842193603515625, -0.17747879028320312, -0.17073822021484375, -0.16399765014648438, -0.157257080078125, -0.15051651000976562, -0.14377593994140625, -0.13703536987304688, -0.1302947998046875, -0.12355422973632812, -0.11681365966796875, -0.11007308959960938, -0.10333251953125, -0.09659194946289062, -0.08985137939453125, -0.08311080932617188, -0.0763702392578125, -0.06962966918945312, -0.06288909912109375, -0.056148529052734375, -0.049407958984375, -0.042667388916015625, -0.03592681884765625, -0.029186248779296875, -0.0224456787109375, -0.015705108642578125, -0.00896453857421875, -0.002223968505859375, 0.0045166015625, 0.011257171630859375, 0.01799774169921875, 0.024738311767578125, 0.0314788818359375, 0.038219451904296875, 0.04496002197265625, 0.051700592041015625, 0.058441162109375, 0.06518173217773438, 0.07192230224609375, 0.07866287231445312, 0.0854034423828125, 0.09214401245117188, 0.09888458251953125, 0.10562515258789062, 0.11236572265625, 0.11910629272460938, 0.12584686279296875, 0.13258743286132812, 0.1393280029296875, 0.14606857299804688, 0.15280914306640625, 0.15954971313476562, 0.166290283203125, 0.17303085327148438, 0.17977142333984375, 0.18651199340820312, 0.1932525634765625, 0.19999313354492188, 0.20673370361328125, 0.21347427368164062, 0.22021484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 14.0, 14.0, 14.0, 15.0, 19.0, 27.0, 28.0, 20.0, 21.0, 36.0, 28.0, 43.0, 43.0, 39.0, 32.0, 41.0, 44.0, 1056.0, 42.0, 44.0, 40.0, 39.0, 33.0, 22.0, 27.0, 24.0, 33.0, 25.0, 20.0, 19.0, 22.0, 23.0, 11.0, 13.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0819091796875, -1.042724609375, -1.0035400390625, -0.96435546875, -0.9251708984375, -0.885986328125, -0.8468017578125, -0.8076171875, -0.7684326171875, -0.729248046875, -0.6900634765625, -0.65087890625, -0.6116943359375, -0.572509765625, -0.5333251953125, -0.494140625, -0.4549560546875, -0.415771484375, -0.3765869140625, -0.33740234375, -0.2982177734375, -0.259033203125, -0.2198486328125, -0.1806640625, -0.1414794921875, -0.102294921875, -0.0631103515625, -0.02392578125, 0.0152587890625, 0.054443359375, 0.0936279296875, 0.1328125, 0.1719970703125, 0.211181640625, 0.2503662109375, 0.28955078125, 0.3287353515625, 0.367919921875, 0.4071044921875, 0.4462890625, 0.4854736328125, 0.524658203125, 0.5638427734375, 0.60302734375, 0.6422119140625, 0.681396484375, 0.7205810546875, 0.759765625, 0.7989501953125, 0.838134765625, 0.8773193359375, 0.91650390625, 0.9556884765625, 0.994873046875, 1.0340576171875, 1.0732421875, 1.1124267578125, 1.151611328125, 1.1907958984375, 1.22998046875, 1.2691650390625, 1.308349609375, 1.3475341796875, 1.38671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 9.0, 11.0, 17.0, 22.0, 32.0, 49.0, 69.0, 95.0, 121.0, 203.0, 286.0, 427.0, 724.0, 1011.0, 1546.0, 2471.0, 3748.0, 5561.0, 8788.0, 13700.0, 25266.0, 83370.0, 1569257.0, 289506.0, 40619.0, 18312.0, 11341.0, 7154.0, 4605.0, 3029.0, 1947.0, 1313.0, 842.0, 525.0, 386.0, 256.0, 156.0, 111.0, 75.0, 48.0, 39.0, 25.0, 15.0, 13.0, 7.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.456298828125, -0.44193267822265625, -0.4275665283203125, -0.41320037841796875, -0.398834228515625, -0.38446807861328125, -0.3701019287109375, -0.35573577880859375, -0.34136962890625, -0.32700347900390625, -0.3126373291015625, -0.29827117919921875, -0.283905029296875, -0.26953887939453125, -0.2551727294921875, -0.24080657958984375, -0.2264404296875, -0.21207427978515625, -0.1977081298828125, -0.18334197998046875, -0.168975830078125, -0.15460968017578125, -0.1402435302734375, -0.12587738037109375, -0.11151123046875, -0.09714508056640625, -0.0827789306640625, -0.06841278076171875, -0.054046630859375, -0.03968048095703125, -0.0253143310546875, -0.01094818115234375, 0.00341796875, 0.01778411865234375, 0.0321502685546875, 0.04651641845703125, 0.060882568359375, 0.07524871826171875, 0.0896148681640625, 0.10398101806640625, 0.11834716796875, 0.13271331787109375, 0.1470794677734375, 0.16144561767578125, 0.175811767578125, 0.19017791748046875, 0.2045440673828125, 0.21891021728515625, 0.2332763671875, 0.24764251708984375, 0.2620086669921875, 0.27637481689453125, 0.290740966796875, 0.30510711669921875, 0.3194732666015625, 0.33383941650390625, 0.34820556640625, 0.36257171630859375, 0.3769378662109375, 0.39130401611328125, 0.405670166015625, 0.42003631591796875, 0.4344024658203125, 0.44876861572265625, 0.463134765625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 5.0, 4.0, 8.0, 5.0, 13.0, 8.0, 5.0, 12.0, 23.0, 17.0, 17.0, 22.0, 19.0, 26.0, 39.0, 31.0, 41.0, 56.0, 51.0, 49.0, 50.0, 50.0, 51.0, 45.0, 42.0, 41.0, 36.0, 44.0, 35.0, 20.0, 30.0, 12.0, 17.0, 14.0, 13.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0], "bins": [-0.0213775634765625, -0.02080690860748291, -0.02023625373840332, -0.01966559886932373, -0.01909494400024414, -0.01852428913116455, -0.01795363426208496, -0.01738297939300537, -0.01681232452392578, -0.01624166965484619, -0.0156710147857666, -0.015100359916687012, -0.014529705047607422, -0.013959050178527832, -0.013388395309448242, -0.012817740440368652, -0.012247085571289062, -0.011676430702209473, -0.011105775833129883, -0.010535120964050293, -0.009964466094970703, -0.009393811225891113, -0.008823156356811523, -0.008252501487731934, -0.007681846618652344, -0.007111191749572754, -0.006540536880493164, -0.005969882011413574, -0.005399227142333984, -0.0048285722732543945, -0.004257917404174805, -0.003687262535095215, -0.003116607666015625, -0.002545952796936035, -0.0019752979278564453, -0.0014046430587768555, -0.0008339881896972656, -0.0002633333206176758, 0.00030732154846191406, 0.0008779764175415039, 0.0014486312866210938, 0.0020192861557006836, 0.0025899410247802734, 0.0031605958938598633, 0.003731250762939453, 0.004301905632019043, 0.004872560501098633, 0.005443215370178223, 0.0060138702392578125, 0.006584525108337402, 0.007155179977416992, 0.007725834846496582, 0.008296489715576172, 0.008867144584655762, 0.009437799453735352, 0.010008454322814941, 0.010579109191894531, 0.011149764060974121, 0.011720418930053711, 0.0122910737991333, 0.01286172866821289, 0.01343238353729248, 0.01400303840637207, 0.01457369327545166, 0.01514434814453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 10.0, 12.0, 13.0, 16.0, 24.0, 24.0, 32.0, 38.0, 65.0, 84.0, 98.0, 158.0, 241.0, 461.0, 1720.0, 60969.0, 954081.0, 28185.0, 1148.0, 405.0, 230.0, 133.0, 84.0, 66.0, 55.0, 34.0, 26.0, 27.0, 22.0, 15.0, 18.0, 3.0, 6.0, 5.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3455085754394531, -0.33335113525390625, -0.3211936950683594, -0.3090362548828125, -0.2968788146972656, -0.28472137451171875, -0.2725639343261719, -0.260406494140625, -0.24824905395507812, -0.23609161376953125, -0.22393417358398438, -0.2117767333984375, -0.19961929321289062, -0.18746185302734375, -0.17530441284179688, -0.16314697265625, -0.15098953247070312, -0.13883209228515625, -0.12667465209960938, -0.1145172119140625, -0.10235977172851562, -0.09020233154296875, -0.07804489135742188, -0.065887451171875, -0.053730010986328125, -0.04157257080078125, -0.029415130615234375, -0.0172576904296875, -0.005100250244140625, 0.00705718994140625, 0.019214630126953125, 0.0313720703125, 0.043529510498046875, 0.05568695068359375, 0.06784439086914062, 0.0800018310546875, 0.09215927124023438, 0.10431671142578125, 0.11647415161132812, 0.128631591796875, 0.14078903198242188, 0.15294647216796875, 0.16510391235351562, 0.1772613525390625, 0.18941879272460938, 0.20157623291015625, 0.21373367309570312, 0.22589111328125, 0.23804855346679688, 0.25020599365234375, 0.2623634338378906, 0.2745208740234375, 0.2866783142089844, 0.29883575439453125, 0.3109931945800781, 0.323150634765625, 0.3353080749511719, 0.34746551513671875, 0.3596229553222656, 0.3717803955078125, 0.3839378356933594, 0.39609527587890625, 0.4082527160644531, 0.42041015625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 23.0, 82.0, 164.0, 297.0, 271.0, 110.0, 43.0, 12.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1401641070842743, -0.13740800321102142, -0.13465189933776855, -0.13189579546451569, -0.12913969159126282, -0.12638358771800995, -0.12362748384475708, -0.12087137997150421, -0.11811527609825134, -0.11535917222499847, -0.1126030683517456, -0.10984696447849274, -0.10709086060523987, -0.104334756731987, -0.10157865285873413, -0.09882254898548126, -0.0960664451122284, -0.09331034123897552, -0.09055423736572266, -0.08779813349246979, -0.08504202961921692, -0.08228592574596405, -0.07952982187271118, -0.07677371799945831, -0.07401761412620544, -0.07126151025295258, -0.06850540637969971, -0.06574930250644684, -0.06299319863319397, -0.0602370947599411, -0.05748099088668823, -0.054724887013435364, -0.05196879059076309, -0.04921268671751022, -0.046456582844257355, -0.043700478971004486, -0.04094437509775162, -0.03818827122449875, -0.03543216735124588, -0.03267606347799301, -0.029919959604740143, -0.027163855731487274, -0.024407751858234406, -0.021651647984981537, -0.018895544111728668, -0.0161394402384758, -0.013383336365222931, -0.010627232491970062, -0.007871128618717194, -0.005115024745464325, -0.0023589208722114563, 0.00039718300104141235, 0.003153286874294281, 0.00590939074754715, 0.008665494620800018, 0.011421598494052887, 0.014177702367305756, 0.016933806240558624, 0.019689910113811493, 0.02244601398706436, 0.02520211786031723, 0.0279582217335701, 0.030714325606822968, 0.033470429480075836, 0.036226533353328705]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 13.0, 11.0, 17.0, 15.0, 12.0, 15.0, 18.0, 27.0, 18.0, 27.0, 25.0, 44.0, 28.0, 34.0, 23.0, 24.0, 28.0, 25.0, 51.0, 38.0, 47.0, 40.0, 47.0, 30.0, 42.0, 35.0, 18.0, 28.0, 21.0, 35.0, 20.0, 15.0, 18.0, 18.0, 10.0, 11.0, 8.0, 12.0, 2.0, 6.0, 9.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019772648811340332, -0.01914995163679123, -0.018527252599596977, -0.017904553562402725, -0.017281856387853622, -0.01665915921330452, -0.016036460176110268, -0.01541376207023859, -0.014791063964366913, -0.014168365858495235, -0.013545667752623558, -0.01292296964675188, -0.012300271540880203, -0.011677573435008526, -0.011054875329136848, -0.010432177223265171, -0.009809479117393494, -0.009186781011521816, -0.008564082905650139, -0.007941384799778461, -0.007318686693906784, -0.006695988588035107, -0.006073290482163429, -0.005450592376291752, -0.0048278942704200745, -0.004205196164548397, -0.0035824980586767197, -0.0029597999528050423, -0.002337101846933365, -0.0017144037410616875, -0.00109170563519001, -0.00046900752931833267, 0.00015369057655334473, 0.0007763886824250221, 0.0013990867882966995, 0.002021784894168377, 0.0026444830000400543, 0.0032671811059117317, 0.003889879211783409, 0.0045125773176550865, 0.005135275423526764, 0.005757973529398441, 0.006380671635270119, 0.007003369741141796, 0.0076260678470134735, 0.008248765952885151, 0.008871464058756828, 0.009494162164628506, 0.010116860270500183, 0.01073955837637186, 0.011362256482243538, 0.011984954588115215, 0.012607652693986893, 0.01323035079985857, 0.013853048905730247, 0.014475747011601925, 0.015098445117473602, 0.015721142292022705, 0.016343841329216957, 0.01696654036641121, 0.017589237540960312, 0.018211934715509415, 0.018834633752703667, 0.01945733278989792, 0.02008002996444702]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 4.0, 5.0, 9.0, 16.0, 19.0, 23.0, 24.0, 27.0, 17.0, 36.0, 28.0, 41.0, 52.0, 30.0, 42.0, 53.0, 61.0, 45.0, 45.0, 45.0, 46.0, 29.0, 41.0, 27.0, 29.0, 23.0, 34.0, 35.0, 24.0, 16.0, 19.0, 12.0, 11.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03826904296875, -1.9710693359375, -1.90386962890625, -1.836669921875, -1.76947021484375, -1.7022705078125, -1.63507080078125, -1.56787109375, -1.50067138671875, -1.4334716796875, -1.36627197265625, -1.299072265625, -1.23187255859375, -1.1646728515625, -1.09747314453125, -1.0302734375, -0.96307373046875, -0.8958740234375, -0.82867431640625, -0.761474609375, -0.69427490234375, -0.6270751953125, -0.55987548828125, -0.49267578125, -0.42547607421875, -0.3582763671875, -0.29107666015625, -0.223876953125, -0.15667724609375, -0.0894775390625, -0.02227783203125, 0.044921875, 0.11212158203125, 0.1793212890625, 0.24652099609375, 0.313720703125, 0.38092041015625, 0.4481201171875, 0.51531982421875, 0.58251953125, 0.64971923828125, 0.7169189453125, 0.78411865234375, 0.851318359375, 0.91851806640625, 0.9857177734375, 1.05291748046875, 1.1201171875, 1.18731689453125, 1.2545166015625, 1.32171630859375, 1.388916015625, 1.45611572265625, 1.5233154296875, 1.59051513671875, 1.65771484375, 1.72491455078125, 1.7921142578125, 1.85931396484375, 1.926513671875, 1.99371337890625, 2.0609130859375, 2.12811279296875, 2.1953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 12.0, 21.0, 27.0, 45.0, 56.0, 82.0, 137.0, 181.0, 231.0, 353.0, 500.0, 806.0, 1147.0, 1754.0, 2760.0, 4396.0, 7277.0, 12211.0, 21839.0, 41930.0, 96429.0, 272927.0, 345207.0, 124591.0, 51265.0, 25668.0, 14284.0, 8279.0, 5070.0, 3056.0, 1925.0, 1376.0, 851.0, 534.0, 419.0, 271.0, 189.0, 129.0, 82.0, 65.0, 43.0, 41.0, 18.0, 20.0, 13.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.058258056640625, -1.98760986328125, -1.916961669921875, -1.8463134765625, -1.775665283203125, -1.70501708984375, -1.634368896484375, -1.563720703125, -1.493072509765625, -1.42242431640625, -1.351776123046875, -1.2811279296875, -1.210479736328125, -1.13983154296875, -1.069183349609375, -0.99853515625, -0.927886962890625, -0.85723876953125, -0.786590576171875, -0.7159423828125, -0.645294189453125, -0.57464599609375, -0.503997802734375, -0.433349609375, -0.362701416015625, -0.29205322265625, -0.221405029296875, -0.1507568359375, -0.080108642578125, -0.00946044921875, 0.061187744140625, 0.1318359375, 0.202484130859375, 0.27313232421875, 0.343780517578125, 0.4144287109375, 0.485076904296875, 0.55572509765625, 0.626373291015625, 0.697021484375, 0.767669677734375, 0.83831787109375, 0.908966064453125, 0.9796142578125, 1.050262451171875, 1.12091064453125, 1.191558837890625, 1.26220703125, 1.332855224609375, 1.40350341796875, 1.474151611328125, 1.5447998046875, 1.615447998046875, 1.68609619140625, 1.756744384765625, 1.827392578125, 1.898040771484375, 1.96868896484375, 2.039337158203125, 2.1099853515625, 2.180633544921875, 2.25128173828125, 2.321929931640625, 2.392578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 13.0, 13.0, 10.0, 21.0, 17.0, 23.0, 21.0, 27.0, 36.0, 28.0, 41.0, 36.0, 68.0, 62.0, 135.0, 271.0, 1451.0, 221.0, 119.0, 57.0, 51.0, 19.0, 43.0, 33.0, 22.0, 32.0, 23.0, 24.0, 20.0, 10.0, 13.0, 11.0, 12.0, 4.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.9716796875, -3.826171875, -3.6806640625, -3.53515625, -3.3896484375, -3.244140625, -3.0986328125, -2.953125, -2.8076171875, -2.662109375, -2.5166015625, -2.37109375, -2.2255859375, -2.080078125, -1.9345703125, -1.7890625, -1.6435546875, -1.498046875, -1.3525390625, -1.20703125, -1.0615234375, -0.916015625, -0.7705078125, -0.625, -0.4794921875, -0.333984375, -0.1884765625, -0.04296875, 0.1025390625, 0.248046875, 0.3935546875, 0.5390625, 0.6845703125, 0.830078125, 0.9755859375, 1.12109375, 1.2666015625, 1.412109375, 1.5576171875, 1.703125, 1.8486328125, 1.994140625, 2.1396484375, 2.28515625, 2.4306640625, 2.576171875, 2.7216796875, 2.8671875, 3.0126953125, 3.158203125, 3.3037109375, 3.44921875, 3.5947265625, 3.740234375, 3.8857421875, 4.03125, 4.1767578125, 4.322265625, 4.4677734375, 4.61328125, 4.7587890625, 4.904296875, 5.0498046875, 5.1953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 20.0, 7.0, 20.0, 26.0, 37.0, 59.0, 66.0, 99.0, 150.0, 204.0, 449.0, 1076.0, 3644.0, 18637.0, 184267.0, 2775068.0, 140706.0, 15777.0, 3280.0, 971.0, 406.0, 228.0, 135.0, 97.0, 72.0, 53.0, 33.0, 29.0, 24.0, 9.0, 11.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.82684326171875, -5.6146240234375, -5.40240478515625, -5.190185546875, -4.97796630859375, -4.7657470703125, -4.55352783203125, -4.34130859375, -4.12908935546875, -3.9168701171875, -3.70465087890625, -3.492431640625, -3.28021240234375, -3.0679931640625, -2.85577392578125, -2.6435546875, -2.43133544921875, -2.2191162109375, -2.00689697265625, -1.794677734375, -1.58245849609375, -1.3702392578125, -1.15802001953125, -0.94580078125, -0.73358154296875, -0.5213623046875, -0.30914306640625, -0.096923828125, 0.11529541015625, 0.3275146484375, 0.53973388671875, 0.751953125, 0.96417236328125, 1.1763916015625, 1.38861083984375, 1.600830078125, 1.81304931640625, 2.0252685546875, 2.23748779296875, 2.44970703125, 2.66192626953125, 2.8741455078125, 3.08636474609375, 3.298583984375, 3.51080322265625, 3.7230224609375, 3.93524169921875, 4.1474609375, 4.35968017578125, 4.5718994140625, 4.78411865234375, 4.996337890625, 5.20855712890625, 5.4207763671875, 5.63299560546875, 5.84521484375, 6.05743408203125, 6.2696533203125, 6.48187255859375, 6.694091796875, 6.90631103515625, 7.1185302734375, 7.33074951171875, 7.54296875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 36.0, 72.0, 164.0, 222.0, 209.0, 150.0, 96.0, 29.0, 17.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.279764175415039, -5.797384738922119, -5.315005302429199, -4.832625865936279, -4.350246429443359, -3.8678667545318604, -3.3854873180389404, -2.9031078815460205, -2.4207284450531006, -1.9383490085601807, -1.4559695720672607, -0.9735900163650513, -0.49121057987213135, -0.008831024169921875, 0.47354841232299805, 0.955927848815918, 1.438307285308838, 1.9206867218017578, 2.4030661582946777, 2.8854455947875977, 3.3678250312805176, 3.8502047061920166, 4.332584381103516, 4.814963340759277, 5.2973432540893555, 5.779722690582275, 6.262102127075195, 6.744481563568115, 7.226861000061035, 7.709240913391113, 8.191619873046875, 8.673999786376953, 9.156378746032715, 9.638758659362793, 10.121137619018555, 10.603517532348633, 11.085896492004395, 11.568276405334473, 12.050655364990234, 12.533035278320312, 13.015414237976074, 13.497794151306152, 13.980173110961914, 14.462553024291992, 14.944931983947754, 15.427311897277832, 15.909690856933594, 16.392070770263672, 16.87445068359375, 17.356830596923828, 17.839210510253906, 18.32158851623535, 18.80396842956543, 19.286348342895508, 19.768728256225586, 20.25110626220703, 20.73348617553711, 21.215866088867188, 21.698246002197266, 22.18062400817871, 22.66300392150879, 23.145383834838867, 23.627763748168945, 24.11014175415039, 24.59252166748047]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 14.0, 18.0, 9.0, 14.0, 17.0, 20.0, 25.0, 19.0, 33.0, 24.0, 32.0, 32.0, 43.0, 30.0, 43.0, 39.0, 49.0, 51.0, 53.0, 47.0, 47.0, 53.0, 21.0, 33.0, 25.0, 42.0, 25.0, 15.0, 23.0, 16.0, 15.0, 10.0, 8.0, 18.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.374507904052734, -10.02049446105957, -9.666481018066406, -9.312467575073242, -8.958453178405762, -8.604439735412598, -8.250426292419434, -7.8964128494262695, -7.542398929595947, -7.188385486602783, -6.834371566772461, -6.480358123779297, -6.126344680786133, -5.7723307609558105, -5.4183173179626465, -5.064303398132324, -4.71028995513916, -4.356276512145996, -4.002262592315674, -3.6482491493225098, -3.2942354679107666, -2.9402217864990234, -2.5862083435058594, -2.232194662094116, -1.878180980682373, -1.5241672992706299, -1.1701537370681763, -0.8161401748657227, -0.4621264934539795, -0.10811281204223633, 0.24590063095092773, 0.5999143123626709, 0.9539289474487305, 1.3079426288604736, 1.6619561910629272, 2.015969753265381, 2.369983434677124, 2.723997116088867, 3.0780105590820312, 3.4320242404937744, 3.7860379219055176, 4.140051364898682, 4.494065284729004, 4.848078727722168, 5.202092170715332, 5.556106090545654, 5.910119533538818, 6.264133453369141, 6.618146896362305, 6.972160339355469, 7.326174259185791, 7.680187702178955, 8.034201622009277, 8.388215065002441, 8.742228507995605, 9.09624195098877, 9.45025634765625, 9.804269790649414, 10.158283233642578, 10.512296676635742, 10.866311073303223, 11.220324516296387, 11.57433795928955, 11.928351402282715, 12.282364845275879]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 9.0, 12.0, 10.0, 18.0, 14.0, 27.0, 20.0, 24.0, 23.0, 34.0, 30.0, 45.0, 45.0, 34.0, 51.0, 45.0, 42.0, 37.0, 45.0, 50.0, 41.0, 41.0, 32.0, 28.0, 36.0, 35.0, 19.0, 22.0, 18.0, 23.0, 17.0, 24.0, 10.0, 9.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7138671875, -1.6490325927734375, -1.584197998046875, -1.5193634033203125, -1.45452880859375, -1.3896942138671875, -1.324859619140625, -1.2600250244140625, -1.1951904296875, -1.1303558349609375, -1.065521240234375, -1.0006866455078125, -0.93585205078125, -0.8710174560546875, -0.806182861328125, -0.7413482666015625, -0.676513671875, -0.6116790771484375, -0.546844482421875, -0.4820098876953125, -0.41717529296875, -0.3523406982421875, -0.287506103515625, -0.2226715087890625, -0.1578369140625, -0.0930023193359375, -0.028167724609375, 0.0366668701171875, 0.10150146484375, 0.1663360595703125, 0.231170654296875, 0.2960052490234375, 0.36083984375, 0.4256744384765625, 0.490509033203125, 0.5553436279296875, 0.62017822265625, 0.6850128173828125, 0.749847412109375, 0.8146820068359375, 0.8795166015625, 0.9443511962890625, 1.009185791015625, 1.0740203857421875, 1.13885498046875, 1.2036895751953125, 1.268524169921875, 1.3333587646484375, 1.398193359375, 1.4630279541015625, 1.527862548828125, 1.5926971435546875, 1.65753173828125, 1.7223663330078125, 1.787200927734375, 1.8520355224609375, 1.9168701171875, 1.9817047119140625, 2.046539306640625, 2.1113739013671875, 2.17620849609375, 2.2410430908203125, 2.305877685546875, 2.3707122802734375, 2.435546875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 12.0, 8.0, 9.0, 9.0, 13.0, 9.0, 21.0, 39.0, 46.0, 40.0, 54.0, 82.0, 127.0, 152.0, 180.0, 323.0, 553.0, 1746.0, 19588.0, 4005665.0, 159571.0, 3911.0, 844.0, 376.0, 218.0, 157.0, 144.0, 91.0, 57.0, 50.0, 52.0, 36.0, 15.0, 15.0, 15.0, 10.0, 8.0, 9.0, 14.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.722412109375, -15.21044921875, -14.698486328125, -14.1865234375, -13.674560546875, -13.16259765625, -12.650634765625, -12.138671875, -11.626708984375, -11.11474609375, -10.602783203125, -10.0908203125, -9.578857421875, -9.06689453125, -8.554931640625, -8.04296875, -7.531005859375, -7.01904296875, -6.507080078125, -5.9951171875, -5.483154296875, -4.97119140625, -4.459228515625, -3.947265625, -3.435302734375, -2.92333984375, -2.411376953125, -1.8994140625, -1.387451171875, -0.87548828125, -0.363525390625, 0.1484375, 0.660400390625, 1.17236328125, 1.684326171875, 2.1962890625, 2.708251953125, 3.22021484375, 3.732177734375, 4.244140625, 4.756103515625, 5.26806640625, 5.780029296875, 6.2919921875, 6.803955078125, 7.31591796875, 7.827880859375, 8.33984375, 8.851806640625, 9.36376953125, 9.875732421875, 10.3876953125, 10.899658203125, 11.41162109375, 11.923583984375, 12.435546875, 12.947509765625, 13.45947265625, 13.971435546875, 14.4833984375, 14.995361328125, 15.50732421875, 16.019287109375, 16.53125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 22.0, 30.0, 36.0, 36.0, 63.0, 83.0, 118.0, 176.0, 269.0, 379.0, 515.0, 590.0, 468.0, 350.0, 241.0, 152.0, 95.0, 98.0, 80.0, 38.0, 44.0, 28.0, 22.0, 19.0, 15.0, 12.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.67578125, -2.593048095703125, -2.51031494140625, -2.427581787109375, -2.3448486328125, -2.262115478515625, -2.17938232421875, -2.096649169921875, -2.013916015625, -1.931182861328125, -1.84844970703125, -1.765716552734375, -1.6829833984375, -1.600250244140625, -1.51751708984375, -1.434783935546875, -1.35205078125, -1.269317626953125, -1.18658447265625, -1.103851318359375, -1.0211181640625, -0.938385009765625, -0.85565185546875, -0.772918701171875, -0.690185546875, -0.607452392578125, -0.52471923828125, -0.441986083984375, -0.3592529296875, -0.276519775390625, -0.19378662109375, -0.111053466796875, -0.0283203125, 0.054412841796875, 0.13714599609375, 0.219879150390625, 0.3026123046875, 0.385345458984375, 0.46807861328125, 0.550811767578125, 0.633544921875, 0.716278076171875, 0.79901123046875, 0.881744384765625, 0.9644775390625, 1.047210693359375, 1.12994384765625, 1.212677001953125, 1.29541015625, 1.378143310546875, 1.46087646484375, 1.543609619140625, 1.6263427734375, 1.709075927734375, 1.79180908203125, 1.874542236328125, 1.957275390625, 2.040008544921875, 2.12274169921875, 2.205474853515625, 2.2882080078125, 2.370941162109375, 2.45367431640625, 2.536407470703125, 2.619140625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 11.0, 8.0, 18.0, 25.0, 28.0, 44.0, 47.0, 84.0, 157.0, 303.0, 845.0, 2884.0, 17314.0, 235744.0, 3741221.0, 176995.0, 14580.0, 2565.0, 702.0, 276.0, 154.0, 81.0, 40.0, 30.0, 24.0, 17.0, 17.0, 10.0, 3.0, 10.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1875, -7.8997802734375, -7.612060546875, -7.3243408203125, -7.03662109375, -6.7489013671875, -6.461181640625, -6.1734619140625, -5.8857421875, -5.5980224609375, -5.310302734375, -5.0225830078125, -4.73486328125, -4.4471435546875, -4.159423828125, -3.8717041015625, -3.583984375, -3.2962646484375, -3.008544921875, -2.7208251953125, -2.43310546875, -2.1453857421875, -1.857666015625, -1.5699462890625, -1.2822265625, -0.9945068359375, -0.706787109375, -0.4190673828125, -0.13134765625, 0.1563720703125, 0.444091796875, 0.7318115234375, 1.01953125, 1.3072509765625, 1.594970703125, 1.8826904296875, 2.17041015625, 2.4581298828125, 2.745849609375, 3.0335693359375, 3.3212890625, 3.6090087890625, 3.896728515625, 4.1844482421875, 4.47216796875, 4.7598876953125, 5.047607421875, 5.3353271484375, 5.623046875, 5.9107666015625, 6.198486328125, 6.4862060546875, 6.77392578125, 7.0616455078125, 7.349365234375, 7.6370849609375, 7.9248046875, 8.2125244140625, 8.500244140625, 8.7879638671875, 9.07568359375, 9.3634033203125, 9.651123046875, 9.9388427734375, 10.2265625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 44.0, 168.0, 387.0, 292.0, 99.0, 19.0, 3.0, 2.0, 2.0, 1.0], "bins": [-71.2143325805664, -69.9607162475586, -68.70709991455078, -67.45347595214844, -66.19985961914062, -64.94624328613281, -63.692626953125, -62.43901062011719, -61.18539047241211, -59.9317741394043, -58.67815399169922, -57.424537658691406, -56.170921325683594, -54.917301177978516, -53.6636848449707, -52.410064697265625, -51.15644836425781, -49.90283203125, -48.64921188354492, -47.39559555053711, -46.14197540283203, -44.88835906982422, -43.634742736816406, -42.381126403808594, -41.127506256103516, -39.8738899230957, -38.620269775390625, -37.36665344238281, -36.113037109375, -34.85941696166992, -33.60580062866211, -32.35218048095703, -31.098560333251953, -29.844942092895508, -28.591323852539062, -27.33770751953125, -26.084089279174805, -24.83047103881836, -23.576854705810547, -22.3232364654541, -21.069618225097656, -19.81599998474121, -18.562381744384766, -17.308765411376953, -16.055147171020508, -14.801528930664062, -13.547911643981934, -12.294294357299805, -11.040677070617676, -9.787059783935547, -8.533441543579102, -7.2798237800598145, -6.026206016540527, -4.77258825302124, -3.518970489501953, -2.265353202819824, -1.011734962463379, 0.2418828010559082, 1.4955005645751953, 2.7491183280944824, 4.0027360916137695, 5.256353855133057, 6.509971618652344, 7.763588905334473, 9.017207145690918]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 1.0, 9.0, 10.0, 12.0, 12.0, 14.0, 20.0, 15.0, 20.0, 18.0, 16.0, 29.0, 20.0, 32.0, 38.0, 43.0, 29.0, 36.0, 34.0, 38.0, 42.0, 43.0, 39.0, 38.0, 38.0, 48.0, 39.0, 22.0, 33.0, 33.0, 18.0, 19.0, 20.0, 18.0, 16.0, 15.0, 11.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.180791854858398, -7.923776149749756, -7.666760444641113, -7.4097442626953125, -7.15272855758667, -6.895712852478027, -6.638696670532227, -6.381680965423584, -6.124665260314941, -5.867649555206299, -5.610633850097656, -5.3536176681518555, -5.096601963043213, -4.83958625793457, -4.5825700759887695, -4.325554370880127, -4.068538665771484, -3.811522960662842, -3.55450701713562, -3.2974910736083984, -3.040475368499756, -2.7834596633911133, -2.5264437198638916, -2.26942777633667, -2.0124120712280273, -1.7553962469100952, -1.498380422592163, -1.241364598274231, -0.9843487739562988, -0.7273329496383667, -0.47031712532043457, -0.21330130100250244, 0.043715476989746094, 0.3007313013076782, 0.5577471256256104, 0.8147629499435425, 1.0717787742614746, 1.3287945985794067, 1.5858104228973389, 1.842826247215271, 2.099842071533203, 2.3568577766418457, 2.6138737201690674, 2.870889663696289, 3.1279053688049316, 3.384921073913574, 3.641937017440796, 3.8989529609680176, 4.15596866607666, 4.412984371185303, 4.670000076293945, 4.927016258239746, 5.184031963348389, 5.441047668457031, 5.698063850402832, 5.955079555511475, 6.212095260620117, 6.46911096572876, 6.726126670837402, 6.983142852783203, 7.240158557891846, 7.497174263000488, 7.754190444946289, 8.011205673217773, 8.268221855163574]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 10.0, 6.0, 8.0, 8.0, 11.0, 13.0, 10.0, 17.0, 15.0, 18.0, 22.0, 27.0, 17.0, 35.0, 36.0, 40.0, 47.0, 39.0, 33.0, 42.0, 40.0, 34.0, 38.0, 40.0, 33.0, 39.0, 36.0, 26.0, 34.0, 33.0, 33.0, 21.0, 22.0, 21.0, 14.0, 15.0, 10.0, 13.0, 12.0, 5.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6953125, -1.63916015625, -1.5830078125, -1.52685546875, -1.470703125, -1.41455078125, -1.3583984375, -1.30224609375, -1.24609375, -1.18994140625, -1.1337890625, -1.07763671875, -1.021484375, -0.96533203125, -0.9091796875, -0.85302734375, -0.796875, -0.74072265625, -0.6845703125, -0.62841796875, -0.572265625, -0.51611328125, -0.4599609375, -0.40380859375, -0.34765625, -0.29150390625, -0.2353515625, -0.17919921875, -0.123046875, -0.06689453125, -0.0107421875, 0.04541015625, 0.1015625, 0.15771484375, 0.2138671875, 0.27001953125, 0.326171875, 0.38232421875, 0.4384765625, 0.49462890625, 0.55078125, 0.60693359375, 0.6630859375, 0.71923828125, 0.775390625, 0.83154296875, 0.8876953125, 0.94384765625, 1.0, 1.05615234375, 1.1123046875, 1.16845703125, 1.224609375, 1.28076171875, 1.3369140625, 1.39306640625, 1.44921875, 1.50537109375, 1.5615234375, 1.61767578125, 1.673828125, 1.72998046875, 1.7861328125, 1.84228515625, 1.8984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 15.0, 14.0, 15.0, 16.0, 37.0, 50.0, 102.0, 140.0, 239.0, 412.0, 710.0, 1226.0, 2179.0, 3872.0, 6614.0, 11598.0, 20478.0, 34676.0, 57610.0, 91483.0, 134014.0, 167119.0, 165496.0, 129514.0, 87857.0, 54776.0, 33001.0, 19265.0, 11164.0, 6359.0, 3622.0, 2032.0, 1191.0, 654.0, 408.0, 208.0, 142.0, 78.0, 62.0, 40.0, 29.0, 16.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31884765625, -0.308868408203125, -0.29888916015625, -0.288909912109375, -0.2789306640625, -0.268951416015625, -0.25897216796875, -0.248992919921875, -0.239013671875, -0.229034423828125, -0.21905517578125, -0.209075927734375, -0.1990966796875, -0.189117431640625, -0.17913818359375, -0.169158935546875, -0.1591796875, -0.149200439453125, -0.13922119140625, -0.129241943359375, -0.1192626953125, -0.109283447265625, -0.09930419921875, -0.089324951171875, -0.079345703125, -0.069366455078125, -0.05938720703125, -0.049407958984375, -0.0394287109375, -0.029449462890625, -0.01947021484375, -0.009490966796875, 0.00048828125, 0.010467529296875, 0.02044677734375, 0.030426025390625, 0.0404052734375, 0.050384521484375, 0.06036376953125, 0.070343017578125, 0.080322265625, 0.090301513671875, 0.10028076171875, 0.110260009765625, 0.1202392578125, 0.130218505859375, 0.14019775390625, 0.150177001953125, 0.16015625, 0.170135498046875, 0.18011474609375, 0.190093994140625, 0.2000732421875, 0.210052490234375, 0.22003173828125, 0.230010986328125, 0.239990234375, 0.249969482421875, 0.25994873046875, 0.269927978515625, 0.2799072265625, 0.289886474609375, 0.29986572265625, 0.309844970703125, 0.31982421875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 3.0, 12.0, 11.0, 13.0, 10.0, 26.0, 11.0, 21.0, 21.0, 23.0, 24.0, 27.0, 33.0, 37.0, 48.0, 35.0, 36.0, 29.0, 28.0, 1065.0, 40.0, 48.0, 34.0, 33.0, 48.0, 34.0, 29.0, 38.0, 22.0, 23.0, 20.0, 24.0, 21.0, 15.0, 12.0, 10.0, 8.0, 13.0, 11.0, 5.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1340789794921875, -1.092376708984375, -1.0506744384765625, -1.00897216796875, -0.9672698974609375, -0.925567626953125, -0.8838653564453125, -0.8421630859375, -0.8004608154296875, -0.758758544921875, -0.7170562744140625, -0.67535400390625, -0.6336517333984375, -0.591949462890625, -0.5502471923828125, -0.508544921875, -0.4668426513671875, -0.425140380859375, -0.3834381103515625, -0.34173583984375, -0.3000335693359375, -0.258331298828125, -0.2166290283203125, -0.1749267578125, -0.1332244873046875, -0.091522216796875, -0.0498199462890625, -0.00811767578125, 0.0335845947265625, 0.075286865234375, 0.1169891357421875, 0.15869140625, 0.2003936767578125, 0.242095947265625, 0.2837982177734375, 0.32550048828125, 0.3672027587890625, 0.408905029296875, 0.4506072998046875, 0.4923095703125, 0.5340118408203125, 0.575714111328125, 0.6174163818359375, 0.65911865234375, 0.7008209228515625, 0.742523193359375, 0.7842254638671875, 0.825927734375, 0.8676300048828125, 0.909332275390625, 0.9510345458984375, 0.99273681640625, 1.0344390869140625, 1.076141357421875, 1.1178436279296875, 1.1595458984375, 1.2012481689453125, 1.242950439453125, 1.2846527099609375, 1.32635498046875, 1.3680572509765625, 1.409759521484375, 1.4514617919921875, 1.4931640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 17.0, 35.0, 51.0, 60.0, 87.0, 154.0, 226.0, 342.0, 506.0, 838.0, 1380.0, 2147.0, 3374.0, 5335.0, 8353.0, 14008.0, 25531.0, 87401.0, 1633316.0, 232183.0, 36462.0, 17476.0, 10260.0, 6375.0, 4038.0, 2518.0, 1636.0, 1108.0, 679.0, 424.0, 285.0, 162.0, 109.0, 80.0, 46.0, 29.0, 16.0, 17.0, 13.0, 9.0, 11.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5643043518066406, -0.5480422973632812, -0.5317802429199219, -0.5155181884765625, -0.4992561340332031, -0.48299407958984375, -0.4667320251464844, -0.450469970703125, -0.4342079162597656, -0.41794586181640625, -0.4016838073730469, -0.3854217529296875, -0.3691596984863281, -0.35289764404296875, -0.3366355895996094, -0.32037353515625, -0.3041114807128906, -0.28784942626953125, -0.2715873718261719, -0.2553253173828125, -0.23906326293945312, -0.22280120849609375, -0.20653915405273438, -0.190277099609375, -0.17401504516601562, -0.15775299072265625, -0.14149093627929688, -0.1252288818359375, -0.10896682739257812, -0.09270477294921875, -0.07644271850585938, -0.0601806640625, -0.043918609619140625, -0.02765655517578125, -0.011394500732421875, 0.0048675537109375, 0.021129608154296875, 0.03739166259765625, 0.053653717041015625, 0.069915771484375, 0.08617782592773438, 0.10243988037109375, 0.11870193481445312, 0.1349639892578125, 0.15122604370117188, 0.16748809814453125, 0.18375015258789062, 0.20001220703125, 0.21627426147460938, 0.23253631591796875, 0.24879837036132812, 0.2650604248046875, 0.2813224792480469, 0.29758453369140625, 0.3138465881347656, 0.330108642578125, 0.3463706970214844, 0.36263275146484375, 0.3788948059082031, 0.3951568603515625, 0.4114189147949219, 0.42768096923828125, 0.4439430236816406, 0.460205078125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 14.0, 12.0, 34.0, 28.0, 49.0, 38.0, 47.0, 46.0, 61.0, 58.0, 65.0, 69.0, 67.0, 78.0, 39.0, 35.0, 35.0, 39.0, 32.0, 25.0, 11.0, 15.0, 11.0, 7.0, 14.0, 8.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.028961181640625, -0.028029441833496094, -0.027097702026367188, -0.02616596221923828, -0.025234222412109375, -0.02430248260498047, -0.023370742797851562, -0.022439002990722656, -0.02150726318359375, -0.020575523376464844, -0.019643783569335938, -0.01871204376220703, -0.017780303955078125, -0.01684856414794922, -0.015916824340820312, -0.014985084533691406, -0.0140533447265625, -0.013121604919433594, -0.012189865112304688, -0.011258125305175781, -0.010326385498046875, -0.009394645690917969, -0.008462905883789062, -0.007531166076660156, -0.00659942626953125, -0.005667686462402344, -0.0047359466552734375, -0.0038042068481445312, -0.002872467041015625, -0.0019407272338867188, -0.0010089874267578125, -7.724761962890625e-05, 0.0008544921875, 0.0017862319946289062, 0.0027179718017578125, 0.0036497116088867188, 0.004581451416015625, 0.005513191223144531, 0.0064449310302734375, 0.007376670837402344, 0.00830841064453125, 0.009240150451660156, 0.010171890258789062, 0.011103630065917969, 0.012035369873046875, 0.012967109680175781, 0.013898849487304688, 0.014830589294433594, 0.0157623291015625, 0.016694068908691406, 0.017625808715820312, 0.01855754852294922, 0.019489288330078125, 0.02042102813720703, 0.021352767944335938, 0.022284507751464844, 0.02321624755859375, 0.024147987365722656, 0.025079727172851562, 0.02601146697998047, 0.026943206787109375, 0.02787494659423828, 0.028806686401367188, 0.029738426208496094, 0.030670166015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 8.0, 6.0, 14.0, 16.0, 13.0, 21.0, 36.0, 59.0, 69.0, 85.0, 155.0, 290.0, 621.0, 3695.0, 975981.0, 65268.0, 1219.0, 369.0, 219.0, 118.0, 85.0, 61.0, 42.0, 25.0, 22.0, 7.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7216796875, -0.7003021240234375, -0.678924560546875, -0.6575469970703125, -0.63616943359375, -0.6147918701171875, -0.593414306640625, -0.5720367431640625, -0.5506591796875, -0.5292816162109375, -0.507904052734375, -0.4865264892578125, -0.46514892578125, -0.4437713623046875, -0.422393798828125, -0.4010162353515625, -0.379638671875, -0.3582611083984375, -0.336883544921875, -0.3155059814453125, -0.29412841796875, -0.2727508544921875, -0.251373291015625, -0.2299957275390625, -0.2086181640625, -0.1872406005859375, -0.165863037109375, -0.1444854736328125, -0.12310791015625, -0.1017303466796875, -0.080352783203125, -0.0589752197265625, -0.03759765625, -0.0162200927734375, 0.005157470703125, 0.0265350341796875, 0.04791259765625, 0.0692901611328125, 0.090667724609375, 0.1120452880859375, 0.1334228515625, 0.1548004150390625, 0.176177978515625, 0.1975555419921875, 0.21893310546875, 0.2403106689453125, 0.261688232421875, 0.2830657958984375, 0.304443359375, 0.3258209228515625, 0.347198486328125, 0.3685760498046875, 0.38995361328125, 0.4113311767578125, 0.432708740234375, 0.4540863037109375, 0.4754638671875, 0.4968414306640625, 0.518218994140625, 0.5395965576171875, 0.56097412109375, 0.5823516845703125, 0.603729248046875, 0.6251068115234375, 0.646484375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 28.0, 524.0, 450.0, 13.0, 4.0, 1.0], "bins": [-0.6063457131385803, -0.596233606338501, -0.5861214995384216, -0.5760093927383423, -0.5658973455429077, -0.5557852387428284, -0.545673131942749, -0.5355610251426697, -0.5254489183425903, -0.515336811542511, -0.5052247047424316, -0.4951126277446747, -0.48500052094459534, -0.474888414144516, -0.46477633714675903, -0.4546642303466797, -0.44455212354660034, -0.434440016746521, -0.42432790994644165, -0.4142158329486847, -0.40410372614860535, -0.393991619348526, -0.38387954235076904, -0.3737674355506897, -0.36365532875061035, -0.353543221950531, -0.34343111515045166, -0.3333190381526947, -0.32320693135261536, -0.313094824552536, -0.30298274755477905, -0.2928706407546997, -0.28275853395462036, -0.272646427154541, -0.26253432035446167, -0.2524222433567047, -0.24231013655662537, -0.23219802975654602, -0.22208593785762787, -0.21197384595870972, -0.20186173915863037, -0.19174963235855103, -0.18163754045963287, -0.17152544856071472, -0.16141334176063538, -0.15130123496055603, -0.14118914306163788, -0.13107705116271973, -0.12096494436264038, -0.11085284501314163, -0.10074074566364288, -0.09062864631414413, -0.08051654696464539, -0.07040444761514664, -0.06029234826564789, -0.05018024891614914, -0.04006815329194069, -0.02995605394244194, -0.01984395459294319, -0.009731855243444443, 0.00038024410605430603, 0.010492343455553055, 0.020604442805051804, 0.030716542154550552, 0.0408286415040493]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 12.0, 10.0, 19.0, 8.0, 15.0, 16.0, 18.0, 17.0, 14.0, 26.0, 25.0, 20.0, 33.0, 29.0, 37.0, 51.0, 36.0, 44.0, 53.0, 31.0, 47.0, 60.0, 40.0, 38.0, 35.0, 35.0, 36.0, 22.0, 20.0, 23.0, 18.0, 16.0, 18.0, 10.0, 15.0, 11.0, 5.0, 11.0, 6.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.026995837688446045, -0.026118773967027664, -0.025241708382964134, -0.024364642798900604, -0.023487579077482224, -0.022610515356063843, -0.021733449772000313, -0.020856384187936783, -0.019979320466518402, -0.01910225674510002, -0.01822519116103649, -0.01734812557697296, -0.01647106185555458, -0.015593997202813625, -0.01471693255007267, -0.013839867897331715, -0.01296280324459076, -0.012085738591849804, -0.011208673939108849, -0.010331609286367893, -0.009454544633626938, -0.008577479980885983, -0.007700415328145027, -0.006823350675404072, -0.0059462860226631165, -0.005069221369922161, -0.004192156717181206, -0.0033150920644402504, -0.002438027411699295, -0.0015609627589583397, -0.0006838981062173843, 0.00019316654652357101, 0.0010702311992645264, 0.0019472958520054817, 0.002824360504746437, 0.0037014251574873924, 0.004578489810228348, 0.005455554462969303, 0.0063326191157102585, 0.007209683768451214, 0.00808674842119217, 0.008963813073933125, 0.00984087772667408, 0.010717942379415035, 0.01159500703215599, 0.012472071684896946, 0.013349136337637901, 0.014226200990378857, 0.015103265643119812, 0.015980329364538193, 0.016857394948601723, 0.017734460532665253, 0.018611524254083633, 0.019488587975502014, 0.020365653559565544, 0.021242719143629074, 0.022119782865047455, 0.022996846586465836, 0.023873912170529366, 0.024750977754592896, 0.025628041476011276, 0.026505105197429657, 0.027382170781493187, 0.028259236365556717, 0.029136300086975098]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 9.0, 9.0, 7.0, 15.0, 10.0, 15.0, 16.0, 10.0, 19.0, 20.0, 20.0, 21.0, 37.0, 30.0, 27.0, 45.0, 37.0, 32.0, 44.0, 40.0, 38.0, 43.0, 31.0, 43.0, 40.0, 39.0, 24.0, 34.0, 37.0, 19.0, 32.0, 27.0, 15.0, 24.0, 20.0, 12.0, 10.0, 6.0, 10.0, 7.0, 6.0, 5.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9202728271484375, -1.864959716796875, -1.8096466064453125, -1.75433349609375, -1.6990203857421875, -1.643707275390625, -1.5883941650390625, -1.5330810546875, -1.4777679443359375, -1.422454833984375, -1.3671417236328125, -1.31182861328125, -1.2565155029296875, -1.201202392578125, -1.1458892822265625, -1.090576171875, -1.0352630615234375, -0.979949951171875, -0.9246368408203125, -0.86932373046875, -0.8140106201171875, -0.758697509765625, -0.7033843994140625, -0.6480712890625, -0.5927581787109375, -0.537445068359375, -0.4821319580078125, -0.42681884765625, -0.3715057373046875, -0.316192626953125, -0.2608795166015625, -0.20556640625, -0.1502532958984375, -0.094940185546875, -0.0396270751953125, 0.01568603515625, 0.0709991455078125, 0.126312255859375, 0.1816253662109375, 0.2369384765625, 0.2922515869140625, 0.347564697265625, 0.4028778076171875, 0.45819091796875, 0.5135040283203125, 0.568817138671875, 0.6241302490234375, 0.679443359375, 0.7347564697265625, 0.790069580078125, 0.8453826904296875, 0.90069580078125, 0.9560089111328125, 1.011322021484375, 1.0666351318359375, 1.1219482421875, 1.1772613525390625, 1.232574462890625, 1.2878875732421875, 1.34320068359375, 1.3985137939453125, 1.453826904296875, 1.5091400146484375, 1.564453125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 10.0, 8.0, 6.0, 8.0, 13.0, 30.0, 39.0, 68.0, 86.0, 120.0, 176.0, 236.0, 416.0, 636.0, 981.0, 1699.0, 3060.0, 5221.0, 9562.0, 18013.0, 35089.0, 71360.0, 150738.0, 291579.0, 236689.0, 110410.0, 53547.0, 26696.0, 14165.0, 7504.0, 4120.0, 2425.0, 1535.0, 821.0, 490.0, 329.0, 224.0, 137.0, 97.0, 72.0, 52.0, 30.0, 24.0, 12.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7184600830078125, -1.656646728515625, -1.5948333740234375, -1.53302001953125, -1.4712066650390625, -1.409393310546875, -1.3475799560546875, -1.2857666015625, -1.2239532470703125, -1.162139892578125, -1.1003265380859375, -1.03851318359375, -0.9766998291015625, -0.914886474609375, -0.8530731201171875, -0.791259765625, -0.7294464111328125, -0.667633056640625, -0.6058197021484375, -0.54400634765625, -0.4821929931640625, -0.420379638671875, -0.3585662841796875, -0.2967529296875, -0.2349395751953125, -0.173126220703125, -0.1113128662109375, -0.04949951171875, 0.0123138427734375, 0.074127197265625, 0.1359405517578125, 0.19775390625, 0.2595672607421875, 0.321380615234375, 0.3831939697265625, 0.44500732421875, 0.5068206787109375, 0.568634033203125, 0.6304473876953125, 0.6922607421875, 0.7540740966796875, 0.815887451171875, 0.8777008056640625, 0.93951416015625, 1.0013275146484375, 1.063140869140625, 1.1249542236328125, 1.186767578125, 1.2485809326171875, 1.310394287109375, 1.3722076416015625, 1.43402099609375, 1.4958343505859375, 1.557647705078125, 1.6194610595703125, 1.6812744140625, 1.7430877685546875, 1.804901123046875, 1.8667144775390625, 1.92852783203125, 1.9903411865234375, 2.052154541015625, 2.1139678955078125, 2.17578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 5.0, 9.0, 17.0, 7.0, 13.0, 22.0, 23.0, 23.0, 33.0, 34.0, 41.0, 43.0, 35.0, 59.0, 118.0, 229.0, 1404.0, 363.0, 154.0, 81.0, 40.0, 39.0, 30.0, 31.0, 30.0, 27.0, 28.0, 17.0, 15.0, 8.0, 8.0, 14.0, 7.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.921875, -4.7763671875, -4.630859375, -4.4853515625, -4.33984375, -4.1943359375, -4.048828125, -3.9033203125, -3.7578125, -3.6123046875, -3.466796875, -3.3212890625, -3.17578125, -3.0302734375, -2.884765625, -2.7392578125, -2.59375, -2.4482421875, -2.302734375, -2.1572265625, -2.01171875, -1.8662109375, -1.720703125, -1.5751953125, -1.4296875, -1.2841796875, -1.138671875, -0.9931640625, -0.84765625, -0.7021484375, -0.556640625, -0.4111328125, -0.265625, -0.1201171875, 0.025390625, 0.1708984375, 0.31640625, 0.4619140625, 0.607421875, 0.7529296875, 0.8984375, 1.0439453125, 1.189453125, 1.3349609375, 1.48046875, 1.6259765625, 1.771484375, 1.9169921875, 2.0625, 2.2080078125, 2.353515625, 2.4990234375, 2.64453125, 2.7900390625, 2.935546875, 3.0810546875, 3.2265625, 3.3720703125, 3.517578125, 3.6630859375, 3.80859375, 3.9541015625, 4.099609375, 4.2451171875, 4.390625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 4.0, 15.0, 15.0, 26.0, 40.0, 39.0, 51.0, 90.0, 95.0, 125.0, 182.0, 292.0, 464.0, 1016.0, 10232.0, 2963873.0, 164692.0, 2436.0, 733.0, 369.0, 249.0, 174.0, 109.0, 84.0, 84.0, 39.0, 32.0, 32.0, 20.0, 15.0, 14.0, 12.0, 6.0, 6.0, 9.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.765625, -11.356689453125, -10.94775390625, -10.538818359375, -10.1298828125, -9.720947265625, -9.31201171875, -8.903076171875, -8.494140625, -8.085205078125, -7.67626953125, -7.267333984375, -6.8583984375, -6.449462890625, -6.04052734375, -5.631591796875, -5.22265625, -4.813720703125, -4.40478515625, -3.995849609375, -3.5869140625, -3.177978515625, -2.76904296875, -2.360107421875, -1.951171875, -1.542236328125, -1.13330078125, -0.724365234375, -0.3154296875, 0.093505859375, 0.50244140625, 0.911376953125, 1.3203125, 1.729248046875, 2.13818359375, 2.547119140625, 2.9560546875, 3.364990234375, 3.77392578125, 4.182861328125, 4.591796875, 5.000732421875, 5.40966796875, 5.818603515625, 6.2275390625, 6.636474609375, 7.04541015625, 7.454345703125, 7.86328125, 8.272216796875, 8.68115234375, 9.090087890625, 9.4990234375, 9.907958984375, 10.31689453125, 10.725830078125, 11.134765625, 11.543701171875, 11.95263671875, 12.361572265625, 12.7705078125, 13.179443359375, 13.58837890625, 13.997314453125, 14.40625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 31.0, 359.0, 513.0, 104.0, 8.0, 1.0], "bins": [-94.95520782470703, -93.37904357910156, -91.8028793334961, -90.22671508789062, -88.65054321289062, -87.07437896728516, -85.49821472167969, -83.92205047607422, -82.34588623046875, -80.76972198486328, -79.19355773925781, -77.61739349365234, -76.04122924804688, -74.46505737304688, -72.8888931274414, -71.31272888183594, -69.73656463623047, -68.160400390625, -66.58423614501953, -65.00807189941406, -63.43190383911133, -61.85573959350586, -60.279571533203125, -58.703407287597656, -57.12724304199219, -55.55107879638672, -53.97491455078125, -52.398746490478516, -50.82258224487305, -49.24641799926758, -47.670249938964844, -46.094085693359375, -44.517921447753906, -42.94175720214844, -41.36559295654297, -39.789424896240234, -38.213260650634766, -36.6370964050293, -35.06092834472656, -33.484764099121094, -31.908601760864258, -30.332435607910156, -28.756271362304688, -27.18010711669922, -25.603940963745117, -24.027774810791016, -22.451610565185547, -20.875446319580078, -19.299280166625977, -17.723114013671875, -16.146949768066406, -14.570784568786621, -12.994619369506836, -11.41845417022705, -9.842288970947266, -8.26612377166748, -6.689958095550537, -5.113792896270752, -3.537627696990967, -1.9614624977111816, -0.3852972984313965, 1.1908679008483887, 2.767033100128174, 4.343198299407959, 5.919363498687744]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 4.0, 12.0, 8.0, 12.0, 14.0, 13.0, 18.0, 18.0, 24.0, 28.0, 22.0, 25.0, 24.0, 27.0, 44.0, 33.0, 40.0, 31.0, 30.0, 51.0, 47.0, 26.0, 44.0, 38.0, 42.0, 29.0, 38.0, 28.0, 29.0, 29.0, 24.0, 23.0, 14.0, 16.0, 17.0, 13.0, 10.0, 10.0, 8.0, 5.0, 6.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.294658660888672, -10.940302848815918, -10.58594799041748, -10.231592178344727, -9.877237319946289, -9.522881507873535, -9.168525695800781, -8.814170837402344, -8.459815979003906, -8.105460166931152, -7.751105308532715, -7.396749496459961, -7.042394638061523, -6.6880388259887695, -6.333683490753174, -5.979328155517578, -5.624972343444824, -5.2706170082092285, -4.916261672973633, -4.561905860900879, -4.207551002502441, -3.8531954288482666, -3.498839855194092, -3.144484519958496, -2.7901291847229004, -2.4357738494873047, -2.081418514251709, -1.7270629405975342, -1.3727076053619385, -1.0183522701263428, -0.663996696472168, -0.30964136123657227, 0.04471302032470703, 0.3990684151649475, 0.753423810005188, 1.1077792644500732, 1.462134599685669, 1.8164899349212646, 2.1708455085754395, 2.525200843811035, 2.879556179046631, 3.2339115142822266, 3.5882668495178223, 3.942622423171997, 4.296977996826172, 4.651332855224609, 5.005688667297363, 5.360044002532959, 5.714399337768555, 6.06875467300415, 6.423110008239746, 6.7774658203125, 7.1318206787109375, 7.486176490783691, 7.840531826019287, 8.194887161254883, 8.54924201965332, 8.903597831726074, 9.257952690124512, 9.612308502197266, 9.966663360595703, 10.321019172668457, 10.675374984741211, 11.029729843139648, 11.384085655212402]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 9.0, 12.0, 10.0, 10.0, 14.0, 14.0, 14.0, 20.0, 16.0, 32.0, 37.0, 29.0, 23.0, 36.0, 44.0, 36.0, 42.0, 35.0, 35.0, 28.0, 43.0, 31.0, 45.0, 38.0, 31.0, 31.0, 36.0, 24.0, 24.0, 21.0, 27.0, 17.0, 18.0, 9.0, 15.0, 17.0, 9.0, 11.0, 10.0, 1.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.590972900390625, -1.53741455078125, -1.483856201171875, -1.4302978515625, -1.376739501953125, -1.32318115234375, -1.269622802734375, -1.216064453125, -1.162506103515625, -1.10894775390625, -1.055389404296875, -1.0018310546875, -0.948272705078125, -0.89471435546875, -0.841156005859375, -0.78759765625, -0.734039306640625, -0.68048095703125, -0.626922607421875, -0.5733642578125, -0.519805908203125, -0.46624755859375, -0.412689208984375, -0.359130859375, -0.305572509765625, -0.25201416015625, -0.198455810546875, -0.1448974609375, -0.091339111328125, -0.03778076171875, 0.015777587890625, 0.0693359375, 0.122894287109375, 0.17645263671875, 0.230010986328125, 0.2835693359375, 0.337127685546875, 0.39068603515625, 0.444244384765625, 0.497802734375, 0.551361083984375, 0.60491943359375, 0.658477783203125, 0.7120361328125, 0.765594482421875, 0.81915283203125, 0.872711181640625, 0.92626953125, 0.979827880859375, 1.03338623046875, 1.086944580078125, 1.1405029296875, 1.194061279296875, 1.24761962890625, 1.301177978515625, 1.354736328125, 1.408294677734375, 1.46185302734375, 1.515411376953125, 1.5689697265625, 1.622528076171875, 1.67608642578125, 1.729644775390625, 1.783203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 7.0, 10.0, 9.0, 24.0, 39.0, 42.0, 69.0, 83.0, 148.0, 230.0, 316.0, 439.0, 722.0, 1214.0, 2217.0, 4784.0, 12668.0, 56318.0, 590082.0, 2721340.0, 711678.0, 65885.0, 14384.0, 5298.0, 2530.0, 1384.0, 814.0, 512.0, 305.0, 214.0, 126.0, 110.0, 86.0, 56.0, 33.0, 30.0, 24.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.695892333984375, -3.56170654296875, -3.427520751953125, -3.2933349609375, -3.159149169921875, -3.02496337890625, -2.890777587890625, -2.756591796875, -2.622406005859375, -2.48822021484375, -2.354034423828125, -2.2198486328125, -2.085662841796875, -1.95147705078125, -1.817291259765625, -1.68310546875, -1.548919677734375, -1.41473388671875, -1.280548095703125, -1.1463623046875, -1.012176513671875, -0.87799072265625, -0.743804931640625, -0.609619140625, -0.475433349609375, -0.34124755859375, -0.207061767578125, -0.0728759765625, 0.061309814453125, 0.19549560546875, 0.329681396484375, 0.4638671875, 0.598052978515625, 0.73223876953125, 0.866424560546875, 1.0006103515625, 1.134796142578125, 1.26898193359375, 1.403167724609375, 1.537353515625, 1.671539306640625, 1.80572509765625, 1.939910888671875, 2.0740966796875, 2.208282470703125, 2.34246826171875, 2.476654052734375, 2.61083984375, 2.745025634765625, 2.87921142578125, 3.013397216796875, 3.1475830078125, 3.281768798828125, 3.41595458984375, 3.550140380859375, 3.684326171875, 3.818511962890625, 3.95269775390625, 4.086883544921875, 4.2210693359375, 4.355255126953125, 4.48944091796875, 4.623626708984375, 4.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 18.0, 10.0, 34.0, 25.0, 37.0, 66.0, 68.0, 101.0, 170.0, 214.0, 329.0, 489.0, 629.0, 557.0, 418.0, 256.0, 179.0, 125.0, 94.0, 77.0, 58.0, 33.0, 25.0, 21.0, 10.0, 7.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.58770751953125, -4.4722900390625, -4.35687255859375, -4.241455078125, -4.12603759765625, -4.0106201171875, -3.89520263671875, -3.77978515625, -3.66436767578125, -3.5489501953125, -3.43353271484375, -3.318115234375, -3.20269775390625, -3.0872802734375, -2.97186279296875, -2.8564453125, -2.74102783203125, -2.6256103515625, -2.51019287109375, -2.394775390625, -2.27935791015625, -2.1639404296875, -2.04852294921875, -1.93310546875, -1.81768798828125, -1.7022705078125, -1.58685302734375, -1.471435546875, -1.35601806640625, -1.2406005859375, -1.12518310546875, -1.009765625, -0.89434814453125, -0.7789306640625, -0.66351318359375, -0.548095703125, -0.43267822265625, -0.3172607421875, -0.20184326171875, -0.08642578125, 0.02899169921875, 0.1444091796875, 0.25982666015625, 0.375244140625, 0.49066162109375, 0.6060791015625, 0.72149658203125, 0.8369140625, 0.95233154296875, 1.0677490234375, 1.18316650390625, 1.298583984375, 1.41400146484375, 1.5294189453125, 1.64483642578125, 1.76025390625, 1.87567138671875, 1.9910888671875, 2.10650634765625, 2.221923828125, 2.33734130859375, 2.4527587890625, 2.56817626953125, 2.68359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 13.0, 13.0, 29.0, 53.0, 91.0, 140.0, 293.0, 681.0, 1799.0, 6182.0, 34899.0, 537197.0, 3398630.0, 189741.0, 18417.0, 3830.0, 1184.0, 525.0, 239.0, 129.0, 66.0, 36.0, 29.0, 24.0, 10.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8343505859375, -7.606201171875, -7.3780517578125, -7.14990234375, -6.9217529296875, -6.693603515625, -6.4654541015625, -6.2373046875, -6.0091552734375, -5.781005859375, -5.5528564453125, -5.32470703125, -5.0965576171875, -4.868408203125, -4.6402587890625, -4.412109375, -4.1839599609375, -3.955810546875, -3.7276611328125, -3.49951171875, -3.2713623046875, -3.043212890625, -2.8150634765625, -2.5869140625, -2.3587646484375, -2.130615234375, -1.9024658203125, -1.67431640625, -1.4461669921875, -1.218017578125, -0.9898681640625, -0.76171875, -0.5335693359375, -0.305419921875, -0.0772705078125, 0.15087890625, 0.3790283203125, 0.607177734375, 0.8353271484375, 1.0634765625, 1.2916259765625, 1.519775390625, 1.7479248046875, 1.97607421875, 2.2042236328125, 2.432373046875, 2.6605224609375, 2.888671875, 3.1168212890625, 3.344970703125, 3.5731201171875, 3.80126953125, 4.0294189453125, 4.257568359375, 4.4857177734375, 4.7138671875, 4.9420166015625, 5.170166015625, 5.3983154296875, 5.62646484375, 5.8546142578125, 6.082763671875, 6.3109130859375, 6.5390625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 60.0, 202.0, 400.0, 240.0, 85.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.944175720214844, -33.57929229736328, -32.21440505981445, -30.84952163696289, -29.484634399414062, -28.1197509765625, -26.754865646362305, -25.38998031616211, -24.025094985961914, -22.66020965576172, -21.295324325561523, -19.930438995361328, -18.565555572509766, -17.200668334960938, -15.835784912109375, -14.47089958190918, -13.106014251708984, -11.741128921508789, -10.376243591308594, -9.011359214782715, -7.6464738845825195, -6.281588554382324, -4.916704177856445, -3.55181884765625, -2.1869335174560547, -0.8220484256744385, 0.5428366661071777, 1.9077215194702148, 3.27260684967041, 4.6374921798706055, 6.002376556396484, 7.36726188659668, 8.732147216796875, 10.09703254699707, 11.461917877197266, 12.826802253723145, 14.19168758392334, 15.556572914123535, 16.921457290649414, 18.28634262084961, 19.651227951049805, 21.01611328125, 22.380998611450195, 23.74588394165039, 25.110767364501953, 26.47565460205078, 27.840538024902344, 29.20542335510254, 30.570308685302734, 31.93519401550293, 33.300079345703125, 34.66496276855469, 36.029850006103516, 37.39473342895508, 38.759620666503906, 40.12450408935547, 41.48938751220703, 42.854270935058594, 44.21915817260742, 45.584041595458984, 46.94892883300781, 48.313812255859375, 49.67869567871094, 51.043582916259766, 52.408470153808594]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 4.0, 11.0, 13.0, 14.0, 14.0, 17.0, 18.0, 21.0, 24.0, 31.0, 20.0, 23.0, 34.0, 43.0, 44.0, 29.0, 41.0, 41.0, 38.0, 40.0, 36.0, 36.0, 41.0, 30.0, 42.0, 36.0, 47.0, 32.0, 25.0, 23.0, 24.0, 17.0, 16.0, 15.0, 8.0, 14.0, 5.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.979555130004883, -9.61448860168457, -9.249422073364258, -8.884355545043945, -8.519288063049316, -8.154221534729004, -7.789155006408691, -7.424088478088379, -7.059021472930908, -6.693954944610596, -6.328887939453125, -5.9638214111328125, -5.5987548828125, -5.233687877655029, -4.868621349334717, -4.503554344177246, -4.138487815856934, -3.773421049118042, -3.4083542823791504, -3.043287754058838, -2.6782209873199463, -2.3131542205810547, -1.9480876922607422, -1.5830209255218506, -1.217954158782959, -0.8528874516487122, -0.48782074451446533, -0.12275409698486328, 0.24231266975402832, 0.6073794364929199, 0.9724459648132324, 1.337512731552124, 1.7025794982910156, 2.0676462650299072, 2.432713031768799, 2.7977795600891113, 3.162846326828003, 3.5279130935668945, 3.892979621887207, 4.2580461502075195, 4.62311315536499, 4.988179683685303, 5.353246688842773, 5.718313217163086, 6.083379745483398, 6.448446750640869, 6.813513278961182, 7.178580284118652, 7.543646812438965, 7.908713340759277, 8.27377986907959, 8.638847351074219, 9.003913879394531, 9.368980407714844, 9.734046936035156, 10.099113464355469, 10.464179992675781, 10.829246520996094, 11.194313049316406, 11.559379577636719, 11.924447059631348, 12.28951358795166, 12.654580116271973, 13.019646644592285, 13.384714126586914]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 12.0, 12.0, 14.0, 19.0, 14.0, 17.0, 21.0, 20.0, 20.0, 33.0, 21.0, 40.0, 33.0, 33.0, 56.0, 41.0, 40.0, 35.0, 46.0, 41.0, 42.0, 41.0, 46.0, 35.0, 31.0, 25.0, 22.0, 22.0, 26.0, 25.0, 13.0, 18.0, 15.0, 16.0, 6.0, 11.0, 3.0, 10.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5146484375, -1.464385986328125, -1.41412353515625, -1.363861083984375, -1.3135986328125, -1.263336181640625, -1.21307373046875, -1.162811279296875, -1.112548828125, -1.062286376953125, -1.01202392578125, -0.961761474609375, -0.9114990234375, -0.861236572265625, -0.81097412109375, -0.760711669921875, -0.71044921875, -0.660186767578125, -0.60992431640625, -0.559661865234375, -0.5093994140625, -0.459136962890625, -0.40887451171875, -0.358612060546875, -0.308349609375, -0.258087158203125, -0.20782470703125, -0.157562255859375, -0.1072998046875, -0.057037353515625, -0.00677490234375, 0.043487548828125, 0.09375, 0.144012451171875, 0.19427490234375, 0.244537353515625, 0.2947998046875, 0.345062255859375, 0.39532470703125, 0.445587158203125, 0.495849609375, 0.546112060546875, 0.59637451171875, 0.646636962890625, 0.6968994140625, 0.747161865234375, 0.79742431640625, 0.847686767578125, 0.89794921875, 0.948211669921875, 0.99847412109375, 1.048736572265625, 1.0989990234375, 1.149261474609375, 1.19952392578125, 1.249786376953125, 1.300048828125, 1.350311279296875, 1.40057373046875, 1.450836181640625, 1.5010986328125, 1.551361083984375, 1.60162353515625, 1.651885986328125, 1.7021484375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 11.0, 16.0, 16.0, 37.0, 47.0, 83.0, 158.0, 203.0, 311.0, 507.0, 805.0, 1285.0, 1891.0, 2848.0, 4360.0, 6562.0, 9963.0, 14690.0, 22082.0, 32311.0, 46717.0, 65050.0, 87197.0, 110178.0, 125615.0, 124366.0, 106860.0, 85017.0, 62368.0, 44075.0, 30658.0, 20862.0, 14149.0, 9365.0, 6113.0, 4127.0, 2632.0, 1743.0, 1157.0, 752.0, 494.0, 314.0, 208.0, 125.0, 87.0, 45.0, 34.0, 19.0, 12.0, 7.0, 7.0, 6.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.1839599609375, -0.17801284790039062, -0.17206573486328125, -0.16611862182617188, -0.1601715087890625, -0.15422439575195312, -0.14827728271484375, -0.14233016967773438, -0.136383056640625, -0.13043594360351562, -0.12448883056640625, -0.11854171752929688, -0.1125946044921875, -0.10664749145507812, -0.10070037841796875, -0.09475326538085938, -0.08880615234375, -0.08285903930664062, -0.07691192626953125, -0.07096481323242188, -0.0650177001953125, -0.059070587158203125, -0.05312347412109375, -0.047176361083984375, -0.041229248046875, -0.035282135009765625, -0.02933502197265625, -0.023387908935546875, -0.0174407958984375, -0.011493682861328125, -0.00554656982421875, 0.000400543212890625, 0.00634765625, 0.012294769287109375, 0.01824188232421875, 0.024188995361328125, 0.0301361083984375, 0.036083221435546875, 0.04203033447265625, 0.047977447509765625, 0.053924560546875, 0.059871673583984375, 0.06581878662109375, 0.07176589965820312, 0.0777130126953125, 0.08366012573242188, 0.08960723876953125, 0.09555435180664062, 0.10150146484375, 0.10744857788085938, 0.11339569091796875, 0.11934280395507812, 0.1252899169921875, 0.13123703002929688, 0.13718414306640625, 0.14313125610351562, 0.149078369140625, 0.15502548217773438, 0.16097259521484375, 0.16691970825195312, 0.1728668212890625, 0.17881393432617188, 0.18476104736328125, 0.19070816040039062, 0.1966552734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 7.0, 9.0, 7.0, 13.0, 14.0, 14.0, 10.0, 27.0, 15.0, 28.0, 27.0, 38.0, 29.0, 49.0, 46.0, 43.0, 43.0, 44.0, 44.0, 1063.0, 51.0, 29.0, 36.0, 38.0, 35.0, 41.0, 33.0, 28.0, 27.0, 19.0, 17.0, 10.0, 30.0, 10.0, 9.0, 5.0, 8.0, 9.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2576751708984375, -1.218475341796875, -1.1792755126953125, -1.14007568359375, -1.1008758544921875, -1.061676025390625, -1.0224761962890625, -0.9832763671875, -0.9440765380859375, -0.904876708984375, -0.8656768798828125, -0.82647705078125, -0.7872772216796875, -0.748077392578125, -0.7088775634765625, -0.669677734375, -0.6304779052734375, -0.591278076171875, -0.5520782470703125, -0.51287841796875, -0.4736785888671875, -0.434478759765625, -0.3952789306640625, -0.3560791015625, -0.3168792724609375, -0.277679443359375, -0.2384796142578125, -0.19927978515625, -0.1600799560546875, -0.120880126953125, -0.0816802978515625, -0.04248046875, -0.0032806396484375, 0.035919189453125, 0.0751190185546875, 0.11431884765625, 0.1535186767578125, 0.192718505859375, 0.2319183349609375, 0.2711181640625, 0.3103179931640625, 0.349517822265625, 0.3887176513671875, 0.42791748046875, 0.4671173095703125, 0.506317138671875, 0.5455169677734375, 0.584716796875, 0.6239166259765625, 0.663116455078125, 0.7023162841796875, 0.74151611328125, 0.7807159423828125, 0.819915771484375, 0.8591156005859375, 0.8983154296875, 0.9375152587890625, 0.976715087890625, 1.0159149169921875, 1.05511474609375, 1.0943145751953125, 1.133514404296875, 1.1727142333984375, 1.2119140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 15.0, 13.0, 10.0, 15.0, 34.0, 46.0, 72.0, 87.0, 129.0, 182.0, 252.0, 465.0, 674.0, 1104.0, 1697.0, 2578.0, 4070.0, 6440.0, 10054.0, 16550.0, 33883.0, 186838.0, 1652267.0, 111940.0, 27858.0, 14851.0, 8866.0, 5728.0, 3704.0, 2306.0, 1493.0, 969.0, 672.0, 429.0, 290.0, 188.0, 119.0, 63.0, 55.0, 46.0, 20.0, 12.0, 10.0, 9.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.39208984375, -0.3787498474121094, -0.36540985107421875, -0.3520698547363281, -0.3387298583984375, -0.3253898620605469, -0.31204986572265625, -0.2987098693847656, -0.285369873046875, -0.2720298767089844, -0.25868988037109375, -0.24534988403320312, -0.2320098876953125, -0.21866989135742188, -0.20532989501953125, -0.19198989868164062, -0.17864990234375, -0.16530990600585938, -0.15196990966796875, -0.13862991333007812, -0.1252899169921875, -0.11194992065429688, -0.09860992431640625, -0.08526992797851562, -0.071929931640625, -0.058589935302734375, -0.04524993896484375, -0.031909942626953125, -0.0185699462890625, -0.005229949951171875, 0.00811004638671875, 0.021450042724609375, 0.0347900390625, 0.048130035400390625, 0.06147003173828125, 0.07481002807617188, 0.0881500244140625, 0.10149002075195312, 0.11483001708984375, 0.12817001342773438, 0.141510009765625, 0.15485000610351562, 0.16819000244140625, 0.18152999877929688, 0.1948699951171875, 0.20820999145507812, 0.22154998779296875, 0.23488998413085938, 0.24822998046875, 0.2615699768066406, 0.27490997314453125, 0.2882499694824219, 0.3015899658203125, 0.3149299621582031, 0.32826995849609375, 0.3416099548339844, 0.354949951171875, 0.3682899475097656, 0.38162994384765625, 0.3949699401855469, 0.4083099365234375, 0.4216499328613281, 0.43498992919921875, 0.4483299255371094, 0.461669921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 11.0, 11.0, 14.0, 19.0, 13.0, 23.0, 26.0, 24.0, 38.0, 55.0, 37.0, 55.0, 61.0, 58.0, 48.0, 56.0, 53.0, 60.0, 46.0, 51.0, 36.0, 25.0, 24.0, 23.0, 18.0, 23.0, 13.0, 7.0, 9.0, 11.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.0247802734375, -0.02407050132751465, -0.023360729217529297, -0.022650957107543945, -0.021941184997558594, -0.021231412887573242, -0.02052164077758789, -0.01981186866760254, -0.019102096557617188, -0.018392324447631836, -0.017682552337646484, -0.016972780227661133, -0.01626300811767578, -0.01555323600769043, -0.014843463897705078, -0.014133691787719727, -0.013423919677734375, -0.012714147567749023, -0.012004375457763672, -0.01129460334777832, -0.010584831237792969, -0.009875059127807617, -0.009165287017822266, -0.008455514907836914, -0.0077457427978515625, -0.007035970687866211, -0.006326198577880859, -0.005616426467895508, -0.004906654357910156, -0.004196882247924805, -0.003487110137939453, -0.0027773380279541016, -0.00206756591796875, -0.0013577938079833984, -0.0006480216979980469, 6.175041198730469e-05, 0.0007715225219726562, 0.0014812946319580078, 0.0021910667419433594, 0.002900838851928711, 0.0036106109619140625, 0.004320383071899414, 0.005030155181884766, 0.005739927291870117, 0.006449699401855469, 0.00715947151184082, 0.007869243621826172, 0.008579015731811523, 0.009288787841796875, 0.009998559951782227, 0.010708332061767578, 0.01141810417175293, 0.012127876281738281, 0.012837648391723633, 0.013547420501708984, 0.014257192611694336, 0.014966964721679688, 0.01567673683166504, 0.01638650894165039, 0.017096281051635742, 0.017806053161621094, 0.018515825271606445, 0.019225597381591797, 0.01993536949157715, 0.0206451416015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 7.0, 13.0, 18.0, 17.0, 17.0, 30.0, 48.0, 45.0, 52.0, 101.0, 116.0, 185.0, 298.0, 527.0, 1499.0, 75850.0, 958788.0, 8792.0, 864.0, 412.0, 239.0, 155.0, 119.0, 73.0, 56.0, 55.0, 41.0, 36.0, 18.0, 12.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.397216796875, -0.3831825256347656, -0.36914825439453125, -0.3551139831542969, -0.3410797119140625, -0.3270454406738281, -0.31301116943359375, -0.2989768981933594, -0.284942626953125, -0.2709083557128906, -0.25687408447265625, -0.24283981323242188, -0.2288055419921875, -0.21477127075195312, -0.20073699951171875, -0.18670272827148438, -0.17266845703125, -0.15863418579101562, -0.14459991455078125, -0.13056564331054688, -0.1165313720703125, -0.10249710083007812, -0.08846282958984375, -0.07442855834960938, -0.060394287109375, -0.046360015869140625, -0.03232574462890625, -0.018291473388671875, -0.0042572021484375, 0.009777069091796875, 0.02381134033203125, 0.037845611572265625, 0.0518798828125, 0.06591415405273438, 0.07994842529296875, 0.09398269653320312, 0.1080169677734375, 0.12205123901367188, 0.13608551025390625, 0.15011978149414062, 0.164154052734375, 0.17818832397460938, 0.19222259521484375, 0.20625686645507812, 0.2202911376953125, 0.23432540893554688, 0.24835968017578125, 0.2623939514160156, 0.27642822265625, 0.2904624938964844, 0.30449676513671875, 0.3185310363769531, 0.3325653076171875, 0.3465995788574219, 0.36063385009765625, 0.3746681213378906, 0.388702392578125, 0.4027366638183594, 0.41677093505859375, 0.4308052062988281, 0.4448394775390625, 0.4588737487792969, 0.47290802001953125, 0.4869422912597656, 0.5009765625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 6.0, 32.0, 223.0, 574.0, 160.0, 15.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03916732966899872, -0.03387698903679848, -0.028586646541953087, -0.023296304047107697, -0.018005963414907455, -0.012715622782707214, -0.007425278425216675, -0.0021349377930164337, 0.0031554028391838074, 0.008445744402706623, 0.013736085966229439, 0.01902642846107483, 0.02431676909327507, 0.02960710972547531, 0.03489745408296585, 0.04018779471516609, 0.04547813534736633, 0.050768475979566574, 0.056058816611766815, 0.061349160969257355, 0.0666394978761673, 0.07192984223365784, 0.07722018659114838, 0.08251053094863892, 0.08780086785554886, 0.0930912122130394, 0.09838154911994934, 0.10367189347743988, 0.10896223783493042, 0.11425257474184036, 0.1195429190993309, 0.12483325600624084, 0.1301235854625702, 0.13541392982006073, 0.14070427417755127, 0.14599460363388062, 0.15128494799137115, 0.1565752923488617, 0.16186563670635223, 0.16715598106384277, 0.17244631052017212, 0.17773665487766266, 0.1830269992351532, 0.18831732869148254, 0.19360767304897308, 0.19889801740646362, 0.20418836176395416, 0.2094787061214447, 0.21476905047893524, 0.22005939483642578, 0.22534973919391632, 0.23064008355140686, 0.2359304130077362, 0.24122075736522675, 0.24651110172271729, 0.25180143117904663, 0.25709179043769836, 0.2623821198940277, 0.26767247915267944, 0.2729628086090088, 0.2782531678676605, 0.28354349732398987, 0.2888338565826416, 0.29412418603897095, 0.2994145154953003]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 12.0, 6.0, 12.0, 21.0, 21.0, 25.0, 32.0, 57.0, 41.0, 60.0, 54.0, 70.0, 54.0, 68.0, 59.0, 60.0, 52.0, 57.0, 42.0, 36.0, 34.0, 30.0, 24.0, 22.0, 15.0, 16.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.047025442123413086, -0.04588892683386803, -0.04475241154432297, -0.04361589252948761, -0.04247937723994255, -0.04134286195039749, -0.040206342935562134, -0.039069827646017075, -0.037933312356472015, -0.036796797066926956, -0.0356602817773819, -0.03452376276254654, -0.03338724747300148, -0.03225073218345642, -0.031114215031266212, -0.029977697879076004, -0.028841182589530945, -0.027704667299985886, -0.026568150147795677, -0.02543163299560547, -0.02429511770606041, -0.02315860241651535, -0.022022085264325142, -0.020885568112134933, -0.019749052822589874, -0.018612537533044815, -0.017476020380854607, -0.016339503228664398, -0.015202987939119339, -0.014066471718251705, -0.012929955497384071, -0.011793439276516438, -0.010656923055648804, -0.00952040683478117, -0.008383890613913536, -0.007247374393045902, -0.006110858172178268, -0.004974341951310635, -0.003837825730443001, -0.002701309509575367, -0.0015647932887077332, -0.00042827706784009933, 0.0007082391530275345, 0.0018447553738951683, 0.002981271594762802, 0.004117787815630436, 0.00525430403649807, 0.006390820257365704, 0.007527336478233337, 0.008663852699100971, 0.009800368919968605, 0.010936885140836239, 0.012073401361703873, 0.013209917582571507, 0.01434643380343914, 0.015482950024306774, 0.016619466245174408, 0.017755981534719467, 0.018892498686909676, 0.020029015839099884, 0.021165531128644943, 0.022302046418190002, 0.02343856357038021, 0.02457508072257042, 0.02571159601211548]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 8.0, 9.0, 13.0, 11.0, 18.0, 20.0, 20.0, 15.0, 25.0, 29.0, 28.0, 28.0, 32.0, 40.0, 32.0, 41.0, 49.0, 30.0, 48.0, 43.0, 37.0, 34.0, 34.0, 30.0, 31.0, 32.0, 38.0, 39.0, 30.0, 23.0, 27.0, 25.0, 7.0, 13.0, 9.0, 12.0, 9.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.4086151123046875, -1.358245849609375, -1.3078765869140625, -1.25750732421875, -1.2071380615234375, -1.156768798828125, -1.1063995361328125, -1.0560302734375, -1.0056610107421875, -0.955291748046875, -0.9049224853515625, -0.85455322265625, -0.8041839599609375, -0.753814697265625, -0.7034454345703125, -0.653076171875, -0.6027069091796875, -0.552337646484375, -0.5019683837890625, -0.45159912109375, -0.4012298583984375, -0.350860595703125, -0.3004913330078125, -0.2501220703125, -0.1997528076171875, -0.149383544921875, -0.0990142822265625, -0.04864501953125, 0.0017242431640625, 0.052093505859375, 0.1024627685546875, 0.15283203125, 0.2032012939453125, 0.253570556640625, 0.3039398193359375, 0.35430908203125, 0.4046783447265625, 0.455047607421875, 0.5054168701171875, 0.5557861328125, 0.6061553955078125, 0.656524658203125, 0.7068939208984375, 0.75726318359375, 0.8076324462890625, 0.858001708984375, 0.9083709716796875, 0.958740234375, 1.0091094970703125, 1.059478759765625, 1.1098480224609375, 1.16021728515625, 1.2105865478515625, 1.260955810546875, 1.3113250732421875, 1.3616943359375, 1.4120635986328125, 1.462432861328125, 1.5128021240234375, 1.56317138671875, 1.6135406494140625, 1.663909912109375, 1.7142791748046875, 1.7646484375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 8.0, 10.0, 11.0, 23.0, 32.0, 46.0, 62.0, 86.0, 131.0, 217.0, 320.0, 431.0, 687.0, 1108.0, 1792.0, 3084.0, 5430.0, 10568.0, 24690.0, 71820.0, 283128.0, 459316.0, 117941.0, 36483.0, 14486.0, 6837.0, 3759.0, 2181.0, 1351.0, 833.0, 552.0, 374.0, 247.0, 155.0, 112.0, 74.0, 48.0, 38.0, 27.0, 21.0, 13.0, 10.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.65631103515625, -2.5762939453125, -2.49627685546875, -2.416259765625, -2.33624267578125, -2.2562255859375, -2.17620849609375, -2.09619140625, -2.01617431640625, -1.9361572265625, -1.85614013671875, -1.776123046875, -1.69610595703125, -1.6160888671875, -1.53607177734375, -1.4560546875, -1.37603759765625, -1.2960205078125, -1.21600341796875, -1.135986328125, -1.05596923828125, -0.9759521484375, -0.89593505859375, -0.81591796875, -0.73590087890625, -0.6558837890625, -0.57586669921875, -0.495849609375, -0.41583251953125, -0.3358154296875, -0.25579833984375, -0.17578125, -0.09576416015625, -0.0157470703125, 0.06427001953125, 0.144287109375, 0.22430419921875, 0.3043212890625, 0.38433837890625, 0.46435546875, 0.54437255859375, 0.6243896484375, 0.70440673828125, 0.784423828125, 0.86444091796875, 0.9444580078125, 1.02447509765625, 1.1044921875, 1.18450927734375, 1.2645263671875, 1.34454345703125, 1.424560546875, 1.50457763671875, 1.5845947265625, 1.66461181640625, 1.74462890625, 1.82464599609375, 1.9046630859375, 1.98468017578125, 2.064697265625, 2.14471435546875, 2.2247314453125, 2.30474853515625, 2.384765625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 2.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 14.0, 19.0, 16.0, 14.0, 22.0, 22.0, 35.0, 28.0, 37.0, 49.0, 73.0, 88.0, 96.0, 208.0, 1407.0, 262.0, 154.0, 86.0, 49.0, 35.0, 52.0, 34.0, 35.0, 25.0, 28.0, 29.0, 16.0, 13.0, 12.0, 12.0, 16.0, 10.0, 8.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.05859375, -3.9451904296875, -3.831787109375, -3.7183837890625, -3.60498046875, -3.4915771484375, -3.378173828125, -3.2647705078125, -3.1513671875, -3.0379638671875, -2.924560546875, -2.8111572265625, -2.69775390625, -2.5843505859375, -2.470947265625, -2.3575439453125, -2.244140625, -2.1307373046875, -2.017333984375, -1.9039306640625, -1.79052734375, -1.6771240234375, -1.563720703125, -1.4503173828125, -1.3369140625, -1.2235107421875, -1.110107421875, -0.9967041015625, -0.88330078125, -0.7698974609375, -0.656494140625, -0.5430908203125, -0.4296875, -0.3162841796875, -0.202880859375, -0.0894775390625, 0.02392578125, 0.1373291015625, 0.250732421875, 0.3641357421875, 0.4775390625, 0.5909423828125, 0.704345703125, 0.8177490234375, 0.93115234375, 1.0445556640625, 1.157958984375, 1.2713623046875, 1.384765625, 1.4981689453125, 1.611572265625, 1.7249755859375, 1.83837890625, 1.9517822265625, 2.065185546875, 2.1785888671875, 2.2919921875, 2.4053955078125, 2.518798828125, 2.6322021484375, 2.74560546875, 2.8590087890625, 2.972412109375, 3.0858154296875, 3.19921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 9.0, 8.0, 7.0, 12.0, 17.0, 26.0, 23.0, 21.0, 61.0, 87.0, 107.0, 153.0, 262.0, 456.0, 864.0, 3057.0, 124644.0, 3005783.0, 7356.0, 1301.0, 537.0, 309.0, 174.0, 127.0, 97.0, 52.0, 41.0, 27.0, 24.0, 19.0, 8.0, 7.0, 14.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8515625, -11.4591064453125, -11.066650390625, -10.6741943359375, -10.28173828125, -9.8892822265625, -9.496826171875, -9.1043701171875, -8.7119140625, -8.3194580078125, -7.927001953125, -7.5345458984375, -7.14208984375, -6.7496337890625, -6.357177734375, -5.9647216796875, -5.572265625, -5.1798095703125, -4.787353515625, -4.3948974609375, -4.00244140625, -3.6099853515625, -3.217529296875, -2.8250732421875, -2.4326171875, -2.0401611328125, -1.647705078125, -1.2552490234375, -0.86279296875, -0.4703369140625, -0.077880859375, 0.3145751953125, 0.70703125, 1.0994873046875, 1.491943359375, 1.8843994140625, 2.27685546875, 2.6693115234375, 3.061767578125, 3.4542236328125, 3.8466796875, 4.2391357421875, 4.631591796875, 5.0240478515625, 5.41650390625, 5.8089599609375, 6.201416015625, 6.5938720703125, 6.986328125, 7.3787841796875, 7.771240234375, 8.1636962890625, 8.55615234375, 8.9486083984375, 9.341064453125, 9.7335205078125, 10.1259765625, 10.5184326171875, 10.910888671875, 11.3033447265625, 11.69580078125, 12.0882568359375, 12.480712890625, 12.8731689453125, 13.265625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 17.0, 121.0, 352.0, 351.0, 129.0, 33.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.051490783691406, -53.881195068359375, -52.710899353027344, -51.54060363769531, -50.37030792236328, -49.200016021728516, -48.029720306396484, -46.85942459106445, -45.68912887573242, -44.51883316040039, -43.34853744506836, -42.17824172973633, -41.00794982910156, -39.83765411376953, -38.6673583984375, -37.49706268310547, -36.32676696777344, -35.156471252441406, -33.986175537109375, -32.815879821777344, -31.645586013793945, -30.475290298461914, -29.304996490478516, -28.134700775146484, -26.964405059814453, -25.794109344482422, -24.62381362915039, -23.453519821166992, -22.28322410583496, -21.11292839050293, -19.94263458251953, -18.7723388671875, -17.602046966552734, -16.431751251220703, -15.261456489562988, -14.091161727905273, -12.920866012573242, -11.750570297241211, -10.580275535583496, -9.409980773925781, -8.23968505859375, -7.069389820098877, -5.899094581604004, -4.728799343109131, -3.558504104614258, -2.3882088661193848, -1.2179136276245117, -0.047618865966796875, 1.1226768493652344, 2.2929720878601074, 3.4632673263549805, 4.6335625648498535, 5.803857803344727, 6.9741530418396, 8.144448280334473, 9.314743041992188, 10.485038757324219, 11.65533447265625, 12.825629234313965, 13.99592399597168, 15.166219711303711, 16.336515426635742, 17.50680923461914, 18.677104949951172, 19.847400665283203]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 6.0, 4.0, 3.0, 6.0, 5.0, 6.0, 4.0, 9.0, 14.0, 15.0, 16.0, 11.0, 19.0, 11.0, 11.0, 17.0, 17.0, 20.0, 19.0, 20.0, 22.0, 26.0, 47.0, 29.0, 21.0, 38.0, 39.0, 35.0, 33.0, 43.0, 28.0, 36.0, 23.0, 34.0, 29.0, 33.0, 30.0, 31.0, 21.0, 21.0, 19.0, 32.0, 12.0, 18.0, 14.0, 5.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.882428169250488, -7.606545925140381, -7.330663204193115, -7.054780960083008, -6.778898239135742, -6.503015995025635, -6.227133750915527, -5.951251029968262, -5.675368785858154, -5.399486541748047, -5.123603820800781, -4.847721576690674, -4.571839332580566, -4.295956611633301, -4.020074367523193, -3.744191884994507, -3.4683094024658203, -3.192426919937134, -2.9165444374084473, -2.64066219329834, -2.3647797107696533, -2.088897228240967, -1.8130148649215698, -1.5371325016021729, -1.2612500190734863, -0.9853675961494446, -0.7094851732254028, -0.4336027503013611, -0.15772032737731934, 0.11816215515136719, 0.39404451847076416, 0.6699268817901611, 0.9458093643188477, 1.2216918468475342, 1.4975742101669312, 1.7734565734863281, 2.0493390560150146, 2.325221538543701, 2.6011037826538086, 2.876986265182495, 3.1528687477111816, 3.428751230239868, 3.7046337127685547, 3.980515956878662, 4.2563982009887695, 4.532280921936035, 4.808163166046143, 5.08404541015625, 5.359928131103516, 5.635810375213623, 5.911693096160889, 6.187575340270996, 6.463458061218262, 6.739340305328369, 7.015222549438477, 7.291105270385742, 7.56698751449585, 7.842869758605957, 8.118752479553223, 8.394635200500488, 8.670516967773438, 8.946399688720703, 9.222282409667969, 9.498164176940918, 9.774046897888184]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 8.0, 4.0, 11.0, 15.0, 18.0, 21.0, 25.0, 23.0, 33.0, 31.0, 51.0, 34.0, 41.0, 38.0, 36.0, 36.0, 46.0, 41.0, 42.0, 40.0, 41.0, 44.0, 42.0, 36.0, 34.0, 32.0, 35.0, 26.0, 21.0, 15.0, 12.0, 11.0, 16.0, 8.0, 8.0, 5.0, 2.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.6447601318359375, -1.588348388671875, -1.5319366455078125, -1.47552490234375, -1.4191131591796875, -1.362701416015625, -1.3062896728515625, -1.2498779296875, -1.1934661865234375, -1.137054443359375, -1.0806427001953125, -1.02423095703125, -0.9678192138671875, -0.911407470703125, -0.8549957275390625, -0.798583984375, -0.7421722412109375, -0.685760498046875, -0.6293487548828125, -0.57293701171875, -0.5165252685546875, -0.460113525390625, -0.4037017822265625, -0.3472900390625, -0.2908782958984375, -0.234466552734375, -0.1780548095703125, -0.12164306640625, -0.0652313232421875, -0.008819580078125, 0.0475921630859375, 0.10400390625, 0.1604156494140625, 0.216827392578125, 0.2732391357421875, 0.32965087890625, 0.3860626220703125, 0.442474365234375, 0.4988861083984375, 0.5552978515625, 0.6117095947265625, 0.668121337890625, 0.7245330810546875, 0.78094482421875, 0.8373565673828125, 0.893768310546875, 0.9501800537109375, 1.006591796875, 1.0630035400390625, 1.119415283203125, 1.1758270263671875, 1.23223876953125, 1.2886505126953125, 1.345062255859375, 1.4014739990234375, 1.4578857421875, 1.5142974853515625, 1.570709228515625, 1.6271209716796875, 1.68353271484375, 1.7399444580078125, 1.796356201171875, 1.8527679443359375, 1.9091796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 25.0, 33.0, 34.0, 64.0, 93.0, 114.0, 168.0, 227.0, 318.0, 459.0, 635.0, 1011.0, 1616.0, 3124.0, 7154.0, 22899.0, 157042.0, 1659539.0, 2081296.0, 213235.0, 27975.0, 8279.0, 3486.0, 1874.0, 1134.0, 721.0, 507.0, 315.0, 228.0, 164.0, 129.0, 97.0, 66.0, 53.0, 42.0, 29.0, 19.0, 19.0, 10.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.923828125, -3.797515869140625, -3.67120361328125, -3.544891357421875, -3.4185791015625, -3.292266845703125, -3.16595458984375, -3.039642333984375, -2.913330078125, -2.787017822265625, -2.66070556640625, -2.534393310546875, -2.4080810546875, -2.281768798828125, -2.15545654296875, -2.029144287109375, -1.90283203125, -1.776519775390625, -1.65020751953125, -1.523895263671875, -1.3975830078125, -1.271270751953125, -1.14495849609375, -1.018646240234375, -0.892333984375, -0.766021728515625, -0.63970947265625, -0.513397216796875, -0.3870849609375, -0.260772705078125, -0.13446044921875, -0.008148193359375, 0.1181640625, 0.244476318359375, 0.37078857421875, 0.497100830078125, 0.6234130859375, 0.749725341796875, 0.87603759765625, 1.002349853515625, 1.128662109375, 1.254974365234375, 1.38128662109375, 1.507598876953125, 1.6339111328125, 1.760223388671875, 1.88653564453125, 2.012847900390625, 2.13916015625, 2.265472412109375, 2.39178466796875, 2.518096923828125, 2.6444091796875, 2.770721435546875, 2.89703369140625, 3.023345947265625, 3.149658203125, 3.275970458984375, 3.40228271484375, 3.528594970703125, 3.6549072265625, 3.781219482421875, 3.90753173828125, 4.033843994140625, 4.16015625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 29.0, 26.0, 44.0, 62.0, 104.0, 164.0, 245.0, 330.0, 515.0, 672.0, 586.0, 454.0, 264.0, 186.0, 106.0, 84.0, 80.0, 28.0, 18.0, 12.0, 9.0, 11.0, 5.0, 5.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.383880615234375, -3.26580810546875, -3.147735595703125, -3.0296630859375, -2.911590576171875, -2.79351806640625, -2.675445556640625, -2.557373046875, -2.439300537109375, -2.32122802734375, -2.203155517578125, -2.0850830078125, -1.967010498046875, -1.84893798828125, -1.730865478515625, -1.61279296875, -1.494720458984375, -1.37664794921875, -1.258575439453125, -1.1405029296875, -1.022430419921875, -0.90435791015625, -0.786285400390625, -0.668212890625, -0.550140380859375, -0.43206787109375, -0.313995361328125, -0.1959228515625, -0.077850341796875, 0.04022216796875, 0.158294677734375, 0.2763671875, 0.394439697265625, 0.51251220703125, 0.630584716796875, 0.7486572265625, 0.866729736328125, 0.98480224609375, 1.102874755859375, 1.220947265625, 1.339019775390625, 1.45709228515625, 1.575164794921875, 1.6932373046875, 1.811309814453125, 1.92938232421875, 2.047454833984375, 2.16552734375, 2.283599853515625, 2.40167236328125, 2.519744873046875, 2.6378173828125, 2.755889892578125, 2.87396240234375, 2.992034912109375, 3.110107421875, 3.228179931640625, 3.34625244140625, 3.464324951171875, 3.5823974609375, 3.700469970703125, 3.81854248046875, 3.936614990234375, 4.0546875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 13.0, 14.0, 10.0, 18.0, 24.0, 37.0, 59.0, 88.0, 135.0, 256.0, 545.0, 1402.0, 4836.0, 33938.0, 994288.0, 3061739.0, 85045.0, 8340.0, 1943.0, 738.0, 323.0, 182.0, 100.0, 69.0, 44.0, 15.0, 19.0, 12.0, 11.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.144775390625, -5.93408203125, -5.723388671875, -5.5126953125, -5.302001953125, -5.09130859375, -4.880615234375, -4.669921875, -4.459228515625, -4.24853515625, -4.037841796875, -3.8271484375, -3.616455078125, -3.40576171875, -3.195068359375, -2.984375, -2.773681640625, -2.56298828125, -2.352294921875, -2.1416015625, -1.930908203125, -1.72021484375, -1.509521484375, -1.298828125, -1.088134765625, -0.87744140625, -0.666748046875, -0.4560546875, -0.245361328125, -0.03466796875, 0.176025390625, 0.38671875, 0.597412109375, 0.80810546875, 1.018798828125, 1.2294921875, 1.440185546875, 1.65087890625, 1.861572265625, 2.072265625, 2.282958984375, 2.49365234375, 2.704345703125, 2.9150390625, 3.125732421875, 3.33642578125, 3.547119140625, 3.7578125, 3.968505859375, 4.17919921875, 4.389892578125, 4.6005859375, 4.811279296875, 5.02197265625, 5.232666015625, 5.443359375, 5.654052734375, 5.86474609375, 6.075439453125, 6.2861328125, 6.496826171875, 6.70751953125, 6.918212890625, 7.12890625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 277.0, 667.0, 59.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.44068908691406, -171.28453063964844, -168.12835693359375, -164.97219848632812, -161.81602478027344, -158.6598663330078, -155.50369262695312, -152.3475341796875, -149.19137573242188, -146.03521728515625, -142.87904357910156, -139.72288513183594, -136.56671142578125, -133.41055297851562, -130.25439453125, -127.09822082519531, -123.94205474853516, -120.785888671875, -117.62972259521484, -114.47355651855469, -111.31739807128906, -108.1612319946289, -105.00506591796875, -101.8488998413086, -98.69273376464844, -95.53656768798828, -92.38040161132812, -89.2242431640625, -86.06807708740234, -82.91191101074219, -79.75574493408203, -76.59957885742188, -73.44342041015625, -70.2872543334961, -67.13108825683594, -63.97492599487305, -60.818763732910156, -57.66259765625, -54.506431579589844, -51.35026550292969, -48.19410705566406, -45.037940979003906, -41.881778717041016, -38.72561264038086, -35.56945037841797, -32.41328430175781, -29.257118225097656, -26.100954055786133, -22.944787979125977, -19.788623809814453, -16.632457733154297, -13.476293563842773, -10.32012939453125, -7.163965225219727, -4.00779914855957, -0.8516349792480469, 2.3045291900634766, 5.460693836212158, 8.61685848236084, 11.77302360534668, 14.929187774658203, 18.085351943969727, 21.241518020629883, 24.397682189941406, 27.55384635925293]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 7.0, 16.0, 15.0, 14.0, 28.0, 33.0, 51.0, 50.0, 50.0, 62.0, 85.0, 62.0, 74.0, 74.0, 59.0, 62.0, 50.0, 39.0, 34.0, 36.0, 19.0, 26.0, 17.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.838165283203125, -16.26803970336914, -15.697914123535156, -15.127788543701172, -14.557662963867188, -13.987537384033203, -13.417411804199219, -12.847286224365234, -12.27716064453125, -11.707035064697266, -11.136909484863281, -10.566783905029297, -9.996658325195312, -9.426532745361328, -8.856407165527344, -8.28628158569336, -7.716156959533691, -7.146031379699707, -6.575905799865723, -6.005780220031738, -5.435654640197754, -4.8655290603637695, -4.295403957366943, -3.725278377532959, -3.1551527976989746, -2.5850272178649902, -2.014901638031006, -1.4447762966156006, -0.8746507167816162, -0.30452513694763184, 0.26560020446777344, 0.8357257843017578, 1.4058513641357422, 1.9759769439697266, 2.546102523803711, 3.116227865219116, 3.6863534450531006, 4.256479263305664, 4.82660436630249, 5.396729946136475, 5.966855525970459, 6.536981105804443, 7.107106685638428, 7.677231788635254, 8.247357368469238, 8.817482948303223, 9.387608528137207, 9.957734107971191, 10.527859687805176, 11.09798526763916, 11.668110847473145, 12.238236427307129, 12.808362007141113, 13.378487586975098, 13.948612213134766, 14.51873779296875, 15.088863372802734, 15.658988952636719, 16.229114532470703, 16.799240112304688, 17.369365692138672, 17.939491271972656, 18.50961685180664, 19.079742431640625, 19.64986801147461]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 18.0, 13.0, 15.0, 21.0, 29.0, 26.0, 29.0, 29.0, 37.0, 35.0, 45.0, 34.0, 31.0, 34.0, 34.0, 42.0, 37.0, 39.0, 41.0, 27.0, 48.0, 39.0, 37.0, 32.0, 28.0, 31.0, 22.0, 13.0, 18.0, 12.0, 11.0, 13.0, 14.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.5654296875, -1.51898193359375, -1.4725341796875, -1.42608642578125, -1.379638671875, -1.33319091796875, -1.2867431640625, -1.24029541015625, -1.19384765625, -1.14739990234375, -1.1009521484375, -1.05450439453125, -1.008056640625, -0.96160888671875, -0.9151611328125, -0.86871337890625, -0.822265625, -0.77581787109375, -0.7293701171875, -0.68292236328125, -0.636474609375, -0.59002685546875, -0.5435791015625, -0.49713134765625, -0.45068359375, -0.40423583984375, -0.3577880859375, -0.31134033203125, -0.264892578125, -0.21844482421875, -0.1719970703125, -0.12554931640625, -0.0791015625, -0.03265380859375, 0.0137939453125, 0.06024169921875, 0.106689453125, 0.15313720703125, 0.1995849609375, 0.24603271484375, 0.29248046875, 0.33892822265625, 0.3853759765625, 0.43182373046875, 0.478271484375, 0.52471923828125, 0.5711669921875, 0.61761474609375, 0.6640625, 0.71051025390625, 0.7569580078125, 0.80340576171875, 0.849853515625, 0.89630126953125, 0.9427490234375, 0.98919677734375, 1.03564453125, 1.08209228515625, 1.1285400390625, 1.17498779296875, 1.221435546875, 1.26788330078125, 1.3143310546875, 1.36077880859375, 1.4072265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 11.0, 14.0, 28.0, 34.0, 62.0, 89.0, 158.0, 196.0, 328.0, 509.0, 805.0, 1235.0, 1863.0, 3020.0, 4692.0, 7090.0, 10958.0, 16804.0, 26018.0, 39258.0, 58269.0, 84562.0, 113186.0, 137796.0, 140782.0, 120319.0, 91368.0, 64257.0, 43468.0, 28485.0, 18669.0, 12182.0, 7760.0, 5107.0, 3216.0, 2127.0, 1346.0, 868.0, 558.0, 386.0, 220.0, 153.0, 92.0, 66.0, 43.0, 36.0, 23.0, 12.0, 8.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1658935546875, -0.16056251525878906, -0.15523147583007812, -0.1499004364013672, -0.14456939697265625, -0.1392383575439453, -0.13390731811523438, -0.12857627868652344, -0.1232452392578125, -0.11791419982910156, -0.11258316040039062, -0.10725212097167969, -0.10192108154296875, -0.09659004211425781, -0.09125900268554688, -0.08592796325683594, -0.080596923828125, -0.07526588439941406, -0.06993484497070312, -0.06460380554199219, -0.05927276611328125, -0.05394172668457031, -0.048610687255859375, -0.04327964782714844, -0.0379486083984375, -0.03261756896972656, -0.027286529541015625, -0.021955490112304688, -0.01662445068359375, -0.011293411254882812, -0.005962371826171875, -0.0006313323974609375, 0.00469970703125, 0.010030746459960938, 0.015361785888671875, 0.020692825317382812, 0.02602386474609375, 0.03135490417480469, 0.036685943603515625, 0.04201698303222656, 0.0473480224609375, 0.05267906188964844, 0.058010101318359375, 0.06334114074707031, 0.06867218017578125, 0.07400321960449219, 0.07933425903320312, 0.08466529846191406, 0.089996337890625, 0.09532737731933594, 0.10065841674804688, 0.10598945617675781, 0.11132049560546875, 0.11665153503417969, 0.12198257446289062, 0.12731361389160156, 0.1326446533203125, 0.13797569274902344, 0.14330673217773438, 0.1486377716064453, 0.15396881103515625, 0.1592998504638672, 0.16463088989257812, 0.16996192932128906, 0.17529296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 7.0, 7.0, 11.0, 13.0, 11.0, 8.0, 10.0, 24.0, 16.0, 20.0, 21.0, 23.0, 23.0, 31.0, 37.0, 31.0, 32.0, 24.0, 35.0, 39.0, 33.0, 1057.0, 35.0, 43.0, 46.0, 40.0, 41.0, 44.0, 33.0, 30.0, 21.0, 27.0, 22.0, 14.0, 23.0, 17.0, 11.0, 11.0, 12.0, 7.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9267578125, -0.8947296142578125, -0.862701416015625, -0.8306732177734375, -0.79864501953125, -0.7666168212890625, -0.734588623046875, -0.7025604248046875, -0.6705322265625, -0.6385040283203125, -0.606475830078125, -0.5744476318359375, -0.54241943359375, -0.5103912353515625, -0.478363037109375, -0.4463348388671875, -0.414306640625, -0.3822784423828125, -0.350250244140625, -0.3182220458984375, -0.28619384765625, -0.2541656494140625, -0.222137451171875, -0.1901092529296875, -0.1580810546875, -0.1260528564453125, -0.094024658203125, -0.0619964599609375, -0.02996826171875, 0.0020599365234375, 0.034088134765625, 0.0661163330078125, 0.09814453125, 0.1301727294921875, 0.162200927734375, 0.1942291259765625, 0.22625732421875, 0.2582855224609375, 0.290313720703125, 0.3223419189453125, 0.3543701171875, 0.3863983154296875, 0.418426513671875, 0.4504547119140625, 0.48248291015625, 0.5145111083984375, 0.546539306640625, 0.5785675048828125, 0.610595703125, 0.6426239013671875, 0.674652099609375, 0.7066802978515625, 0.73870849609375, 0.7707366943359375, 0.802764892578125, 0.8347930908203125, 0.8668212890625, 0.8988494873046875, 0.930877685546875, 0.9629058837890625, 0.99493408203125, 1.0269622802734375, 1.058990478515625, 1.0910186767578125, 1.123046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 12.0, 25.0, 19.0, 35.0, 55.0, 90.0, 132.0, 199.0, 308.0, 484.0, 722.0, 1218.0, 1800.0, 3005.0, 4722.0, 7521.0, 12135.0, 21398.0, 55846.0, 1219662.0, 664883.0, 50919.0, 20906.0, 11791.0, 7117.0, 4359.0, 2658.0, 1870.0, 1143.0, 735.0, 458.0, 338.0, 187.0, 123.0, 73.0, 40.0, 38.0, 30.0, 23.0, 9.0, 6.0, 7.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.40045166015625, -0.3883056640625, -0.37615966796875, -0.364013671875, -0.35186767578125, -0.3397216796875, -0.32757568359375, -0.3154296875, -0.30328369140625, -0.2911376953125, -0.27899169921875, -0.266845703125, -0.25469970703125, -0.2425537109375, -0.23040771484375, -0.21826171875, -0.20611572265625, -0.1939697265625, -0.18182373046875, -0.169677734375, -0.15753173828125, -0.1453857421875, -0.13323974609375, -0.12109375, -0.10894775390625, -0.0968017578125, -0.08465576171875, -0.072509765625, -0.06036376953125, -0.0482177734375, -0.03607177734375, -0.02392578125, -0.01177978515625, 0.0003662109375, 0.01251220703125, 0.024658203125, 0.03680419921875, 0.0489501953125, 0.06109619140625, 0.0732421875, 0.08538818359375, 0.0975341796875, 0.10968017578125, 0.121826171875, 0.13397216796875, 0.1461181640625, 0.15826416015625, 0.17041015625, 0.18255615234375, 0.1947021484375, 0.20684814453125, 0.218994140625, 0.23114013671875, 0.2432861328125, 0.25543212890625, 0.267578125, 0.27972412109375, 0.2918701171875, 0.30401611328125, 0.316162109375, 0.32830810546875, 0.3404541015625, 0.35260009765625, 0.36474609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 2.0, 7.0, 3.0, 7.0, 5.0, 20.0, 23.0, 29.0, 39.0, 40.0, 55.0, 66.0, 85.0, 71.0, 83.0, 96.0, 63.0, 62.0, 52.0, 40.0, 29.0, 25.0, 19.0, 19.0, 15.0, 11.0, 5.0, 3.0, 7.0, 7.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02166748046875, -0.020815372467041016, -0.01996326446533203, -0.019111156463623047, -0.018259048461914062, -0.017406940460205078, -0.016554832458496094, -0.01570272445678711, -0.014850616455078125, -0.01399850845336914, -0.013146400451660156, -0.012294292449951172, -0.011442184448242188, -0.010590076446533203, -0.009737968444824219, -0.008885860443115234, -0.00803375244140625, -0.007181644439697266, -0.006329536437988281, -0.005477428436279297, -0.0046253204345703125, -0.003773212432861328, -0.0029211044311523438, -0.0020689964294433594, -0.001216888427734375, -0.0003647804260253906, 0.00048732757568359375, 0.0013394355773925781, 0.0021915435791015625, 0.003043651580810547, 0.0038957595825195312, 0.004747867584228516, 0.0055999755859375, 0.006452083587646484, 0.007304191589355469, 0.008156299591064453, 0.009008407592773438, 0.009860515594482422, 0.010712623596191406, 0.01156473159790039, 0.012416839599609375, 0.01326894760131836, 0.014121055603027344, 0.014973163604736328, 0.015825271606445312, 0.016677379608154297, 0.01752948760986328, 0.018381595611572266, 0.01923370361328125, 0.020085811614990234, 0.02093791961669922, 0.021790027618408203, 0.022642135620117188, 0.023494243621826172, 0.024346351623535156, 0.02519845962524414, 0.026050567626953125, 0.02690267562866211, 0.027754783630371094, 0.028606891632080078, 0.029458999633789062, 0.030311107635498047, 0.03116321563720703, 0.032015323638916016, 0.032867431640625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 10.0, 23.0, 16.0, 27.0, 39.0, 45.0, 67.0, 101.0, 139.0, 189.0, 399.0, 897.0, 5459.0, 875027.0, 161761.0, 2780.0, 620.0, 299.0, 201.0, 114.0, 83.0, 73.0, 47.0, 23.0, 14.0, 13.0, 16.0, 16.0, 7.0, 4.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0], "bins": [-0.54931640625, -0.5355339050292969, -0.5217514038085938, -0.5079689025878906, -0.4941864013671875, -0.4804039001464844, -0.46662139892578125, -0.4528388977050781, -0.439056396484375, -0.4252738952636719, -0.41149139404296875, -0.3977088928222656, -0.3839263916015625, -0.3701438903808594, -0.35636138916015625, -0.3425788879394531, -0.32879638671875, -0.3150138854980469, -0.30123138427734375, -0.2874488830566406, -0.2736663818359375, -0.2598838806152344, -0.24610137939453125, -0.23231887817382812, -0.218536376953125, -0.20475387573242188, -0.19097137451171875, -0.17718887329101562, -0.1634063720703125, -0.14962387084960938, -0.13584136962890625, -0.12205886840820312, -0.1082763671875, -0.09449386596679688, -0.08071136474609375, -0.06692886352539062, -0.0531463623046875, -0.039363861083984375, -0.02558135986328125, -0.011798858642578125, 0.001983642578125, 0.015766143798828125, 0.02954864501953125, 0.043331146240234375, 0.0571136474609375, 0.07089614868164062, 0.08467864990234375, 0.09846115112304688, 0.11224365234375, 0.12602615356445312, 0.13980865478515625, 0.15359115600585938, 0.1673736572265625, 0.18115615844726562, 0.19493865966796875, 0.20872116088867188, 0.222503662109375, 0.23628616333007812, 0.25006866455078125, 0.2638511657714844, 0.2776336669921875, 0.2914161682128906, 0.30519866943359375, 0.3189811706542969, 0.332763671875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 20.0, 48.0, 93.0, 231.0, 281.0, 163.0, 85.0, 32.0, 20.0, 10.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.09890901297330856, -0.09705847501754761, -0.09520793706178665, -0.0933573916554451, -0.09150685369968414, -0.08965631574392319, -0.08780577778816223, -0.08595523238182068, -0.08410469442605972, -0.08225415647029877, -0.08040361851453781, -0.07855307310819626, -0.0767025351524353, -0.07485199719667435, -0.07300145924091339, -0.07115091383457184, -0.06930038332939148, -0.06744984537363052, -0.06559930741786957, -0.06374876201152802, -0.06189822405576706, -0.060047686100006104, -0.05819714814424515, -0.05634660646319389, -0.05449606478214264, -0.05264552682638168, -0.05079498514533043, -0.04894444718956947, -0.04709390550851822, -0.04524336755275726, -0.04339282959699631, -0.04154228791594505, -0.0396917499601841, -0.03784121200442314, -0.03599067032337189, -0.03414013236761093, -0.03228959068655968, -0.03043905273079872, -0.028588512912392616, -0.02673797309398651, -0.024887433275580406, -0.0230368934571743, -0.021186353638768196, -0.01933581382036209, -0.017485275864601135, -0.01563473418354988, -0.013784196227788925, -0.01193365640938282, -0.010083116590976715, -0.00823257677257061, -0.006382037419825792, -0.004531498067080975, -0.0026809582486748695, -0.0008304184302687645, 0.001020120456814766, 0.002870660275220871, 0.004721200093626976, 0.006571739912033081, 0.008422279730439186, 0.010272818617522717, 0.012123358435928822, 0.013973898254334927, 0.015824437141418457, 0.017674976959824562, 0.019525516778230667]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 2.0, 8.0, 9.0, 5.0, 8.0, 10.0, 14.0, 17.0, 17.0, 20.0, 18.0, 18.0, 26.0, 25.0, 36.0, 44.0, 34.0, 40.0, 41.0, 37.0, 41.0, 36.0, 47.0, 32.0, 37.0, 35.0, 34.0, 24.0, 34.0, 25.0, 25.0, 22.0, 25.0, 16.0, 24.0, 20.0, 15.0, 17.0, 14.0, 8.0, 8.0, 9.0, 7.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017521142959594727, -0.016970328986644745, -0.016419516876339912, -0.01586870476603508, -0.015317890793085098, -0.014767077751457691, -0.014216264709830284, -0.013665451668202877, -0.01311463862657547, -0.012563825584948063, -0.012013012543320656, -0.011462199501693249, -0.010911386460065842, -0.010360573418438435, -0.009809760376811028, -0.00925894733518362, -0.008708134293556213, -0.008157321251928806, -0.007606508210301399, -0.007055695168673992, -0.006504882127046585, -0.005954069085419178, -0.005403256043791771, -0.004852443002164364, -0.004301629960536957, -0.0037508169189095497, -0.0032000038772821426, -0.0026491908356547356, -0.0020983777940273285, -0.0015475647523999214, -0.0009967517107725143, -0.00044593866914510727, 0.0001048743724822998, 0.0006556874141097069, 0.001206500455737114, 0.001757313497364521, 0.002308126538991928, 0.002858939580619335, 0.0034097526222467422, 0.003960565663874149, 0.004511378705501556, 0.0050621917471289635, 0.0056130047887563705, 0.006163817830383778, 0.006714630872011185, 0.007265443913638592, 0.007816256955265999, 0.008367069996893406, 0.008917883038520813, 0.00946869608014822, 0.010019509121775627, 0.010570322163403034, 0.011121135205030441, 0.011671948246657848, 0.012222761288285255, 0.012773574329912663, 0.01332438737154007, 0.013875200413167477, 0.014426013454794884, 0.01497682649642229, 0.015527639538049698, 0.01607845351099968, 0.016629265621304512, 0.017180077731609344, 0.017730891704559326]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 8.0, 12.0, 10.0, 15.0, 15.0, 10.0, 19.0, 14.0, 26.0, 31.0, 20.0, 31.0, 42.0, 35.0, 27.0, 39.0, 42.0, 32.0, 29.0, 22.0, 43.0, 39.0, 34.0, 42.0, 29.0, 35.0, 40.0, 23.0, 23.0, 19.0, 17.0, 32.0, 10.0, 21.0, 16.0, 12.0, 12.0, 7.0, 8.0, 8.0, 10.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.34375, -1.302459716796875, -1.26116943359375, -1.219879150390625, -1.1785888671875, -1.137298583984375, -1.09600830078125, -1.054718017578125, -1.013427734375, -0.972137451171875, -0.93084716796875, -0.889556884765625, -0.8482666015625, -0.806976318359375, -0.76568603515625, -0.724395751953125, -0.68310546875, -0.641815185546875, -0.60052490234375, -0.559234619140625, -0.5179443359375, -0.476654052734375, -0.43536376953125, -0.394073486328125, -0.352783203125, -0.311492919921875, -0.27020263671875, -0.228912353515625, -0.1876220703125, -0.146331787109375, -0.10504150390625, -0.063751220703125, -0.0224609375, 0.018829345703125, 0.06011962890625, 0.101409912109375, 0.1427001953125, 0.183990478515625, 0.22528076171875, 0.266571044921875, 0.307861328125, 0.349151611328125, 0.39044189453125, 0.431732177734375, 0.4730224609375, 0.514312744140625, 0.55560302734375, 0.596893310546875, 0.63818359375, 0.679473876953125, 0.72076416015625, 0.762054443359375, 0.8033447265625, 0.844635009765625, 0.88592529296875, 0.927215576171875, 0.968505859375, 1.009796142578125, 1.05108642578125, 1.092376708984375, 1.1336669921875, 1.174957275390625, 1.21624755859375, 1.257537841796875, 1.298828125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 10.0, 4.0, 12.0, 9.0, 17.0, 25.0, 33.0, 52.0, 72.0, 76.0, 110.0, 158.0, 238.0, 363.0, 531.0, 873.0, 1471.0, 2584.0, 5193.0, 11319.0, 29042.0, 96421.0, 354947.0, 381468.0, 107520.0, 31365.0, 12149.0, 5406.0, 2818.0, 1540.0, 926.0, 643.0, 348.0, 233.0, 166.0, 100.0, 85.0, 50.0, 37.0, 36.0, 23.0, 21.0, 13.0, 9.0, 9.0, 8.0, 4.0, 4.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.708740234375, -1.65185546875, -1.594970703125, -1.5380859375, -1.481201171875, -1.42431640625, -1.367431640625, -1.310546875, -1.253662109375, -1.19677734375, -1.139892578125, -1.0830078125, -1.026123046875, -0.96923828125, -0.912353515625, -0.85546875, -0.798583984375, -0.74169921875, -0.684814453125, -0.6279296875, -0.571044921875, -0.51416015625, -0.457275390625, -0.400390625, -0.343505859375, -0.28662109375, -0.229736328125, -0.1728515625, -0.115966796875, -0.05908203125, -0.002197265625, 0.0546875, 0.111572265625, 0.16845703125, 0.225341796875, 0.2822265625, 0.339111328125, 0.39599609375, 0.452880859375, 0.509765625, 0.566650390625, 0.62353515625, 0.680419921875, 0.7373046875, 0.794189453125, 0.85107421875, 0.907958984375, 0.96484375, 1.021728515625, 1.07861328125, 1.135498046875, 1.1923828125, 1.249267578125, 1.30615234375, 1.363037109375, 1.419921875, 1.476806640625, 1.53369140625, 1.590576171875, 1.6474609375, 1.704345703125, 1.76123046875, 1.818115234375, 1.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 14.0, 26.0, 19.0, 37.0, 44.0, 49.0, 61.0, 71.0, 77.0, 164.0, 1506.0, 409.0, 165.0, 90.0, 61.0, 46.0, 37.0, 24.0, 25.0, 25.0, 13.0, 17.0, 6.0, 9.0, 9.0, 3.0, 6.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.43359375, -5.2685546875, -5.103515625, -4.9384765625, -4.7734375, -4.6083984375, -4.443359375, -4.2783203125, -4.11328125, -3.9482421875, -3.783203125, -3.6181640625, -3.453125, -3.2880859375, -3.123046875, -2.9580078125, -2.79296875, -2.6279296875, -2.462890625, -2.2978515625, -2.1328125, -1.9677734375, -1.802734375, -1.6376953125, -1.47265625, -1.3076171875, -1.142578125, -0.9775390625, -0.8125, -0.6474609375, -0.482421875, -0.3173828125, -0.15234375, 0.0126953125, 0.177734375, 0.3427734375, 0.5078125, 0.6728515625, 0.837890625, 1.0029296875, 1.16796875, 1.3330078125, 1.498046875, 1.6630859375, 1.828125, 1.9931640625, 2.158203125, 2.3232421875, 2.48828125, 2.6533203125, 2.818359375, 2.9833984375, 3.1484375, 3.3134765625, 3.478515625, 3.6435546875, 3.80859375, 3.9736328125, 4.138671875, 4.3037109375, 4.46875, 4.6337890625, 4.798828125, 4.9638671875, 5.12890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 6.0, 10.0, 14.0, 9.0, 13.0, 18.0, 25.0, 34.0, 50.0, 77.0, 81.0, 151.0, 197.0, 416.0, 1237.0, 11367.0, 3064622.0, 63747.0, 2163.0, 593.0, 310.0, 154.0, 104.0, 74.0, 68.0, 50.0, 34.0, 23.0, 9.0, 12.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.4375, -8.171142578125, -7.90478515625, -7.638427734375, -7.3720703125, -7.105712890625, -6.83935546875, -6.572998046875, -6.306640625, -6.040283203125, -5.77392578125, -5.507568359375, -5.2412109375, -4.974853515625, -4.70849609375, -4.442138671875, -4.17578125, -3.909423828125, -3.64306640625, -3.376708984375, -3.1103515625, -2.843994140625, -2.57763671875, -2.311279296875, -2.044921875, -1.778564453125, -1.51220703125, -1.245849609375, -0.9794921875, -0.713134765625, -0.44677734375, -0.180419921875, 0.0859375, 0.352294921875, 0.61865234375, 0.885009765625, 1.1513671875, 1.417724609375, 1.68408203125, 1.950439453125, 2.216796875, 2.483154296875, 2.74951171875, 3.015869140625, 3.2822265625, 3.548583984375, 3.81494140625, 4.081298828125, 4.34765625, 4.614013671875, 4.88037109375, 5.146728515625, 5.4130859375, 5.679443359375, 5.94580078125, 6.212158203125, 6.478515625, 6.744873046875, 7.01123046875, 7.277587890625, 7.5439453125, 7.810302734375, 8.07666015625, 8.343017578125, 8.609375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 530.0, 480.0], "bins": [-170.3904571533203, -167.68580627441406, -164.98114013671875, -162.2764892578125, -159.57183837890625, -156.86717224121094, -154.1625213623047, -151.45787048339844, -148.75320434570312, -146.04855346679688, -143.34388732910156, -140.6392364501953, -137.93458557128906, -135.22991943359375, -132.5252685546875, -129.82061767578125, -127.11595916748047, -124.41130065917969, -121.70664978027344, -119.00199127197266, -116.29733276367188, -113.59268188476562, -110.88802337646484, -108.18336486816406, -105.47871398925781, -102.77405548095703, -100.06940460205078, -97.36474609375, -94.66008758544922, -91.95542907714844, -89.25077819824219, -86.5461196899414, -83.8414535522461, -81.13679504394531, -78.43214416503906, -75.72748565673828, -73.0228271484375, -70.31817626953125, -67.61351776123047, -64.90885925292969, -62.20420455932617, -59.499549865722656, -56.794891357421875, -54.09023666381836, -51.385581970214844, -48.68092346191406, -45.97626876831055, -43.27161407470703, -40.56695556640625, -37.862300872802734, -35.15764236450195, -32.45298767089844, -29.74833106994629, -27.04367446899414, -24.339019775390625, -21.634363174438477, -18.929706573486328, -16.22504997253418, -13.520394325256348, -10.815738677978516, -8.111082077026367, -5.406425476074219, -2.701770782470703, 0.0028858184814453125, 2.7075419425964355]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 11.0, 14.0, 15.0, 18.0, 36.0, 28.0, 32.0, 44.0, 51.0, 44.0, 54.0, 46.0, 59.0, 66.0, 54.0, 67.0, 49.0, 52.0, 41.0, 40.0, 50.0, 19.0, 21.0, 19.0, 22.0, 6.0, 9.0, 4.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.213035583496094, -14.82083797454834, -14.42863941192627, -14.036441802978516, -13.644243240356445, -13.252045631408691, -12.859847068786621, -12.467649459838867, -12.075450897216797, -11.683253288269043, -11.291054725646973, -10.898857116699219, -10.506658554077148, -10.114460945129395, -9.722262382507324, -9.33006477355957, -8.9378662109375, -8.545668601989746, -8.153470039367676, -7.761271953582764, -7.369073867797852, -6.9768757820129395, -6.584677696228027, -6.192480087280273, -5.8002824783325195, -5.408084392547607, -5.015886306762695, -4.623688220977783, -4.231490135192871, -3.839292049407959, -3.447094202041626, -3.054896116256714, -2.6626977920532227, -2.2704997062683105, -1.8783016204833984, -1.4861036539077759, -1.0939055681228638, -0.7017074823379517, -0.3095095157623291, 0.08268857002258301, 0.4748866558074951, 0.8670847415924072, 1.2592828273773193, 1.651480793952942, 2.0436787605285645, 2.4358768463134766, 2.8280749320983887, 3.220273017883301, 3.612471103668213, 4.004669189453125, 4.396867275238037, 4.789065361022949, 5.181263446807861, 5.573461532592773, 5.965659141540527, 6.357857704162598, 6.750055313110352, 7.142253398895264, 7.534451484680176, 7.926649570465088, 8.31884765625, 8.711045265197754, 9.103243827819824, 9.495441436767578, 9.887639999389648]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 2.0, 8.0, 10.0, 9.0, 13.0, 16.0, 20.0, 25.0, 23.0, 33.0, 34.0, 31.0, 32.0, 37.0, 42.0, 42.0, 43.0, 41.0, 35.0, 35.0, 45.0, 42.0, 44.0, 47.0, 46.0, 31.0, 42.0, 28.0, 27.0, 20.0, 14.0, 20.0, 13.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.752838134765625, -1.69903564453125, -1.645233154296875, -1.5914306640625, -1.537628173828125, -1.48382568359375, -1.430023193359375, -1.376220703125, -1.322418212890625, -1.26861572265625, -1.214813232421875, -1.1610107421875, -1.107208251953125, -1.05340576171875, -0.999603271484375, -0.94580078125, -0.891998291015625, -0.83819580078125, -0.784393310546875, -0.7305908203125, -0.676788330078125, -0.62298583984375, -0.569183349609375, -0.515380859375, -0.461578369140625, -0.40777587890625, -0.353973388671875, -0.3001708984375, -0.246368408203125, -0.19256591796875, -0.138763427734375, -0.0849609375, -0.031158447265625, 0.02264404296875, 0.076446533203125, 0.1302490234375, 0.184051513671875, 0.23785400390625, 0.291656494140625, 0.345458984375, 0.399261474609375, 0.45306396484375, 0.506866455078125, 0.5606689453125, 0.614471435546875, 0.66827392578125, 0.722076416015625, 0.77587890625, 0.829681396484375, 0.88348388671875, 0.937286376953125, 0.9910888671875, 1.044891357421875, 1.09869384765625, 1.152496337890625, 1.206298828125, 1.260101318359375, 1.31390380859375, 1.367706298828125, 1.4215087890625, 1.475311279296875, 1.52911376953125, 1.582916259765625, 1.63671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 8.0, 9.0, 15.0, 24.0, 33.0, 45.0, 62.0, 91.0, 115.0, 175.0, 278.0, 388.0, 660.0, 1099.0, 2350.0, 6588.0, 27755.0, 328664.0, 3400779.0, 383013.0, 29708.0, 7011.0, 2345.0, 1183.0, 616.0, 423.0, 260.0, 163.0, 115.0, 85.0, 61.0, 47.0, 31.0, 23.0, 16.0, 11.0, 3.0, 5.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.94940185546875, -7.7191162109375, -7.48883056640625, -7.258544921875, -7.02825927734375, -6.7979736328125, -6.56768798828125, -6.33740234375, -6.10711669921875, -5.8768310546875, -5.64654541015625, -5.416259765625, -5.18597412109375, -4.9556884765625, -4.72540283203125, -4.4951171875, -4.26483154296875, -4.0345458984375, -3.80426025390625, -3.573974609375, -3.34368896484375, -3.1134033203125, -2.88311767578125, -2.65283203125, -2.42254638671875, -2.1922607421875, -1.96197509765625, -1.731689453125, -1.50140380859375, -1.2711181640625, -1.04083251953125, -0.810546875, -0.58026123046875, -0.3499755859375, -0.11968994140625, 0.110595703125, 0.34088134765625, 0.5711669921875, 0.80145263671875, 1.03173828125, 1.26202392578125, 1.4923095703125, 1.72259521484375, 1.952880859375, 2.18316650390625, 2.4134521484375, 2.64373779296875, 2.8740234375, 3.10430908203125, 3.3345947265625, 3.56488037109375, 3.795166015625, 4.02545166015625, 4.2557373046875, 4.48602294921875, 4.71630859375, 4.94659423828125, 5.1768798828125, 5.40716552734375, 5.637451171875, 5.86773681640625, 6.0980224609375, 6.32830810546875, 6.55859375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 19.0, 24.0, 40.0, 43.0, 91.0, 100.0, 184.0, 263.0, 381.0, 599.0, 600.0, 468.0, 407.0, 271.0, 197.0, 128.0, 86.0, 60.0, 32.0, 30.0, 15.0, 6.0, 8.0, 8.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.6680908203125, -3.543212890625, -3.4183349609375, -3.29345703125, -3.1685791015625, -3.043701171875, -2.9188232421875, -2.7939453125, -2.6690673828125, -2.544189453125, -2.4193115234375, -2.29443359375, -2.1695556640625, -2.044677734375, -1.9197998046875, -1.794921875, -1.6700439453125, -1.545166015625, -1.4202880859375, -1.29541015625, -1.1705322265625, -1.045654296875, -0.9207763671875, -0.7958984375, -0.6710205078125, -0.546142578125, -0.4212646484375, -0.29638671875, -0.1715087890625, -0.046630859375, 0.0782470703125, 0.203125, 0.3280029296875, 0.452880859375, 0.5777587890625, 0.70263671875, 0.8275146484375, 0.952392578125, 1.0772705078125, 1.2021484375, 1.3270263671875, 1.451904296875, 1.5767822265625, 1.70166015625, 1.8265380859375, 1.951416015625, 2.0762939453125, 2.201171875, 2.3260498046875, 2.450927734375, 2.5758056640625, 2.70068359375, 2.8255615234375, 2.950439453125, 3.0753173828125, 3.2001953125, 3.3250732421875, 3.449951171875, 3.5748291015625, 3.69970703125, 3.8245849609375, 3.949462890625, 4.0743408203125, 4.19921875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 7.0, 14.0, 32.0, 51.0, 129.0, 245.0, 597.0, 1556.0, 4099.0, 13643.0, 54366.0, 322248.0, 2344646.0, 1253447.0, 154655.0, 30975.0, 8753.0, 2828.0, 1077.0, 466.0, 204.0, 121.0, 42.0, 35.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.804779052734375, -2.68182373046875, -2.558868408203125, -2.4359130859375, -2.312957763671875, -2.19000244140625, -2.067047119140625, -1.944091796875, -1.821136474609375, -1.69818115234375, -1.575225830078125, -1.4522705078125, -1.329315185546875, -1.20635986328125, -1.083404541015625, -0.96044921875, -0.837493896484375, -0.71453857421875, -0.591583251953125, -0.4686279296875, -0.345672607421875, -0.22271728515625, -0.099761962890625, 0.023193359375, 0.146148681640625, 0.26910400390625, 0.392059326171875, 0.5150146484375, 0.637969970703125, 0.76092529296875, 0.883880615234375, 1.0068359375, 1.129791259765625, 1.25274658203125, 1.375701904296875, 1.4986572265625, 1.621612548828125, 1.74456787109375, 1.867523193359375, 1.990478515625, 2.113433837890625, 2.23638916015625, 2.359344482421875, 2.4822998046875, 2.605255126953125, 2.72821044921875, 2.851165771484375, 2.97412109375, 3.097076416015625, 3.22003173828125, 3.342987060546875, 3.4659423828125, 3.588897705078125, 3.71185302734375, 3.834808349609375, 3.957763671875, 4.080718994140625, 4.20367431640625, 4.326629638671875, 4.4495849609375, 4.572540283203125, 4.69549560546875, 4.818450927734375, 4.94140625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 16.0, 23.0, 27.0, 36.0, 34.0, 44.0, 60.0, 63.0, 61.0, 72.0, 57.0, 86.0, 59.0, 59.0, 58.0, 41.0, 26.0, 31.0, 35.0, 11.0, 20.0, 13.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.702457427978516, -19.16834259033203, -18.63422966003418, -18.100114822387695, -17.56599998474121, -17.03188705444336, -16.497772216796875, -15.96365737915039, -15.429543495178223, -14.895429611206055, -14.36131477355957, -13.827200889587402, -13.293087005615234, -12.75897216796875, -12.224858283996582, -11.690744400024414, -11.15662956237793, -10.622515678405762, -10.088400840759277, -9.55428695678711, -9.020172119140625, -8.486058235168457, -7.951944351196289, -7.417829990386963, -6.883715629577637, -6.3496012687683105, -5.815486907958984, -5.281373023986816, -4.74725866317749, -4.213144302368164, -3.679030179977417, -3.14491605758667, -2.6108016967773438, -2.0766873359680176, -1.5425732135772705, -1.0084589719772339, -0.47434473037719727, 0.059769630432128906, 0.593883752822876, 1.127997875213623, 1.6621122360229492, 2.1962265968322754, 2.7303407192230225, 3.2644548416137695, 3.7985692024230957, 4.332683563232422, 4.86679744720459, 5.400911808013916, 5.935026168823242, 6.469140529632568, 7.0032548904418945, 7.5373687744140625, 8.071483612060547, 8.605597496032715, 9.139711380004883, 9.673826217651367, 10.207940101623535, 10.742053985595703, 11.276168823242188, 11.810282707214355, 12.344396591186523, 12.878511428833008, 13.412625312805176, 13.946739196777344, 14.480854034423828]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 12.0, 6.0, 1.0, 9.0, 14.0, 13.0, 11.0, 15.0, 12.0, 20.0, 20.0, 23.0, 26.0, 40.0, 31.0, 32.0, 29.0, 31.0, 34.0, 42.0, 31.0, 41.0, 40.0, 41.0, 41.0, 27.0, 37.0, 33.0, 35.0, 39.0, 38.0, 26.0, 23.0, 24.0, 18.0, 16.0, 7.0, 10.0, 12.0, 8.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.171516418457031, -11.80154800415039, -11.431578636169434, -11.061610221862793, -10.691641807556152, -10.321672439575195, -9.951704025268555, -9.581735610961914, -9.211767196655273, -8.841798782348633, -8.471829414367676, -8.101861000061035, -7.7318925857543945, -7.361923694610596, -6.991954803466797, -6.621986389160156, -6.252017021179199, -5.8820481300354, -5.51207971572876, -5.142110824584961, -4.77214241027832, -4.4021735191345215, -4.032204627990723, -3.662235975265503, -3.292267322540283, -2.9222986698150635, -2.5523300170898438, -2.182361125946045, -1.8123924732208252, -1.4424238204956055, -1.0724549293518066, -0.7024862766265869, -0.3325166702270508, 0.03745204210281372, 0.4074207544326782, 0.7773895263671875, 1.1473581790924072, 1.517326831817627, 1.8872957229614258, 2.2572643756866455, 2.6272330284118652, 2.997201681137085, 3.3671703338623047, 3.7371392250061035, 4.107108116149902, 4.477076530456543, 4.847045421600342, 5.217014312744141, 5.586982727050781, 5.95695161819458, 6.326920032501221, 6.6968889236450195, 7.06685733795166, 7.436826229095459, 7.806795120239258, 8.176763534545898, 8.546731948852539, 8.91670036315918, 9.286669731140137, 9.656638145446777, 10.026606559753418, 10.396575927734375, 10.766544342041016, 11.136512756347656, 11.506482124328613]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 8.0, 6.0, 9.0, 16.0, 12.0, 20.0, 20.0, 22.0, 28.0, 43.0, 37.0, 28.0, 38.0, 49.0, 35.0, 44.0, 48.0, 43.0, 58.0, 38.0, 55.0, 41.0, 39.0, 33.0, 31.0, 22.0, 23.0, 27.0, 23.0, 18.0, 14.0, 10.0, 11.0, 5.0, 9.0, 4.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-31.015625, -30.175048828125, -29.33447265625, -28.493896484375, -27.6533203125, -26.812744140625, -25.97216796875, -25.131591796875, -24.291015625, -23.450439453125, -22.60986328125, -21.769287109375, -20.9287109375, -20.088134765625, -19.24755859375, -18.406982421875, -17.56640625, -16.725830078125, -15.88525390625, -15.044677734375, -14.2041015625, -13.363525390625, -12.52294921875, -11.682373046875, -10.841796875, -10.001220703125, -9.16064453125, -8.320068359375, -7.4794921875, -6.638916015625, -5.79833984375, -4.957763671875, -4.1171875, -3.276611328125, -2.43603515625, -1.595458984375, -0.7548828125, 0.085693359375, 0.92626953125, 1.766845703125, 2.607421875, 3.447998046875, 4.28857421875, 5.129150390625, 5.9697265625, 6.810302734375, 7.65087890625, 8.491455078125, 9.33203125, 10.172607421875, 11.01318359375, 11.853759765625, 12.6943359375, 13.534912109375, 14.37548828125, 15.216064453125, 16.056640625, 16.897216796875, 17.73779296875, 18.578369140625, 19.4189453125, 20.259521484375, 21.10009765625, 21.940673828125, 22.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 10.0, 9.0, 11.0, 12.0, 17.0, 41.0, 63.0, 72.0, 130.0, 177.0, 273.0, 407.0, 629.0, 930.0, 1510.0, 2234.0, 3338.0, 5154.0, 7985.0, 12388.0, 19069.0, 30234.0, 47968.0, 74778.0, 112496.0, 151490.0, 165353.0, 137808.0, 97445.0, 63699.0, 40724.0, 25538.0, 16386.0, 10447.0, 6756.0, 4403.0, 2902.0, 1867.0, 1242.0, 869.0, 586.0, 347.0, 240.0, 198.0, 119.0, 69.0, 53.0, 31.0, 17.0, 12.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.8369140625, -1.78338623046875, -1.7298583984375, -1.67633056640625, -1.622802734375, -1.56927490234375, -1.5157470703125, -1.46221923828125, -1.40869140625, -1.35516357421875, -1.3016357421875, -1.24810791015625, -1.194580078125, -1.14105224609375, -1.0875244140625, -1.03399658203125, -0.98046875, -0.92694091796875, -0.8734130859375, -0.81988525390625, -0.766357421875, -0.71282958984375, -0.6593017578125, -0.60577392578125, -0.55224609375, -0.49871826171875, -0.4451904296875, -0.39166259765625, -0.338134765625, -0.28460693359375, -0.2310791015625, -0.17755126953125, -0.1240234375, -0.07049560546875, -0.0169677734375, 0.03656005859375, 0.090087890625, 0.14361572265625, 0.1971435546875, 0.25067138671875, 0.30419921875, 0.35772705078125, 0.4112548828125, 0.46478271484375, 0.518310546875, 0.57183837890625, 0.6253662109375, 0.67889404296875, 0.732421875, 0.78594970703125, 0.8394775390625, 0.89300537109375, 0.946533203125, 1.00006103515625, 1.0535888671875, 1.10711669921875, 1.16064453125, 1.21417236328125, 1.2677001953125, 1.32122802734375, 1.374755859375, 1.42828369140625, 1.4818115234375, 1.53533935546875, 1.5888671875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 10.0, 9.0, 9.0, 8.0, 10.0, 16.0, 11.0, 30.0, 29.0, 18.0, 18.0, 36.0, 28.0, 26.0, 33.0, 40.0, 37.0, 24.0, 23.0, 36.0, 1065.0, 42.0, 39.0, 31.0, 35.0, 31.0, 32.0, 38.0, 30.0, 22.0, 33.0, 22.0, 18.0, 23.0, 17.0, 14.0, 12.0, 12.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-13.640625, -13.2186279296875, -12.796630859375, -12.3746337890625, -11.95263671875, -11.5306396484375, -11.108642578125, -10.6866455078125, -10.2646484375, -9.8426513671875, -9.420654296875, -8.9986572265625, -8.57666015625, -8.1546630859375, -7.732666015625, -7.3106689453125, -6.888671875, -6.4666748046875, -6.044677734375, -5.6226806640625, -5.20068359375, -4.7786865234375, -4.356689453125, -3.9346923828125, -3.5126953125, -3.0906982421875, -2.668701171875, -2.2467041015625, -1.82470703125, -1.4027099609375, -0.980712890625, -0.5587158203125, -0.13671875, 0.2852783203125, 0.707275390625, 1.1292724609375, 1.55126953125, 1.9732666015625, 2.395263671875, 2.8172607421875, 3.2392578125, 3.6612548828125, 4.083251953125, 4.5052490234375, 4.92724609375, 5.3492431640625, 5.771240234375, 6.1932373046875, 6.615234375, 7.0372314453125, 7.459228515625, 7.8812255859375, 8.30322265625, 8.7252197265625, 9.147216796875, 9.5692138671875, 9.9912109375, 10.4132080078125, 10.835205078125, 11.2572021484375, 11.67919921875, 12.1011962890625, 12.523193359375, 12.9451904296875, 13.3671875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 7.0, 6.0, 14.0, 20.0, 16.0, 29.0, 44.0, 69.0, 74.0, 138.0, 188.0, 270.0, 385.0, 653.0, 991.0, 1533.0, 2472.0, 3863.0, 6245.0, 10580.0, 18983.0, 45858.0, 314383.0, 1548948.0, 82211.0, 25604.0, 13085.0, 7601.0, 4680.0, 2909.0, 1818.0, 1140.0, 748.0, 480.0, 350.0, 207.0, 160.0, 116.0, 66.0, 36.0, 45.0, 32.0, 19.0, 9.0, 14.0, 4.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.58203125, -4.4302978515625, -4.278564453125, -4.1268310546875, -3.97509765625, -3.8233642578125, -3.671630859375, -3.5198974609375, -3.3681640625, -3.2164306640625, -3.064697265625, -2.9129638671875, -2.76123046875, -2.6094970703125, -2.457763671875, -2.3060302734375, -2.154296875, -2.0025634765625, -1.850830078125, -1.6990966796875, -1.54736328125, -1.3956298828125, -1.243896484375, -1.0921630859375, -0.9404296875, -0.7886962890625, -0.636962890625, -0.4852294921875, -0.33349609375, -0.1817626953125, -0.030029296875, 0.1217041015625, 0.2734375, 0.4251708984375, 0.576904296875, 0.7286376953125, 0.88037109375, 1.0321044921875, 1.183837890625, 1.3355712890625, 1.4873046875, 1.6390380859375, 1.790771484375, 1.9425048828125, 2.09423828125, 2.2459716796875, 2.397705078125, 2.5494384765625, 2.701171875, 2.8529052734375, 3.004638671875, 3.1563720703125, 3.30810546875, 3.4598388671875, 3.611572265625, 3.7633056640625, 3.9150390625, 4.0667724609375, 4.218505859375, 4.3702392578125, 4.52197265625, 4.6737060546875, 4.825439453125, 4.9771728515625, 5.12890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 10.0, 5.0, 4.0, 13.0, 9.0, 8.0, 9.0, 12.0, 17.0, 24.0, 34.0, 41.0, 39.0, 43.0, 48.0, 52.0, 47.0, 65.0, 66.0, 53.0, 42.0, 48.0, 42.0, 32.0, 26.0, 30.0, 31.0, 26.0, 19.0, 16.0, 22.0, 20.0, 4.0, 11.0, 5.0, 5.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08343219757080078, -0.08037757873535156, -0.07732295989990234, -0.07426834106445312, -0.0712137222290039, -0.06815910339355469, -0.06510448455810547, -0.06204986572265625, -0.05899524688720703, -0.05594062805175781, -0.052886009216308594, -0.049831390380859375, -0.046776771545410156, -0.04372215270996094, -0.04066753387451172, -0.0376129150390625, -0.03455829620361328, -0.03150367736816406, -0.028449058532714844, -0.025394439697265625, -0.022339820861816406, -0.019285202026367188, -0.01623058319091797, -0.01317596435546875, -0.010121345520019531, -0.0070667266845703125, -0.004012107849121094, -0.000957489013671875, 0.0020971298217773438, 0.0051517486572265625, 0.008206367492675781, 0.011260986328125, 0.014315605163574219, 0.017370223999023438, 0.020424842834472656, 0.023479461669921875, 0.026534080505371094, 0.029588699340820312, 0.03264331817626953, 0.03569793701171875, 0.03875255584716797, 0.04180717468261719, 0.044861793518066406, 0.047916412353515625, 0.050971031188964844, 0.05402565002441406, 0.05708026885986328, 0.0601348876953125, 0.06318950653076172, 0.06624412536621094, 0.06929874420166016, 0.07235336303710938, 0.0754079818725586, 0.07846260070800781, 0.08151721954345703, 0.08457183837890625, 0.08762645721435547, 0.09068107604980469, 0.0937356948852539, 0.09679031372070312, 0.09984493255615234, 0.10289955139160156, 0.10595417022705078, 0.1090087890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 9.0, 12.0, 10.0, 14.0, 24.0, 30.0, 53.0, 89.0, 113.0, 177.0, 262.0, 408.0, 684.0, 1125.0, 1955.0, 3639.0, 7301.0, 15691.0, 37372.0, 96569.0, 225756.0, 314631.0, 199950.0, 82753.0, 32128.0, 13594.0, 6390.0, 3280.0, 1743.0, 1012.0, 603.0, 400.0, 226.0, 182.0, 121.0, 75.0, 48.0, 35.0, 39.0, 20.0, 4.0, 10.0, 4.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4833984375, -0.46935272216796875, -0.4553070068359375, -0.44126129150390625, -0.427215576171875, -0.41316986083984375, -0.3991241455078125, -0.38507843017578125, -0.37103271484375, -0.35698699951171875, -0.3429412841796875, -0.32889556884765625, -0.314849853515625, -0.30080413818359375, -0.2867584228515625, -0.27271270751953125, -0.2586669921875, -0.24462127685546875, -0.2305755615234375, -0.21652984619140625, -0.202484130859375, -0.18843841552734375, -0.1743927001953125, -0.16034698486328125, -0.14630126953125, -0.13225555419921875, -0.1182098388671875, -0.10416412353515625, -0.090118408203125, -0.07607269287109375, -0.0620269775390625, -0.04798126220703125, -0.033935546875, -0.01988983154296875, -0.0058441162109375, 0.00820159912109375, 0.022247314453125, 0.03629302978515625, 0.0503387451171875, 0.06438446044921875, 0.07843017578125, 0.09247589111328125, 0.1065216064453125, 0.12056732177734375, 0.134613037109375, 0.14865875244140625, 0.1627044677734375, 0.17675018310546875, 0.1907958984375, 0.20484161376953125, 0.2188873291015625, 0.23293304443359375, 0.246978759765625, 0.26102447509765625, 0.2750701904296875, 0.28911590576171875, 0.30316162109375, 0.31720733642578125, 0.3312530517578125, 0.34529876708984375, 0.359344482421875, 0.37339019775390625, 0.3874359130859375, 0.40148162841796875, 0.41552734375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 3.0, 10.0, 13.0, 30.0, 22.0, 27.0, 52.0, 37.0, 62.0, 69.0, 67.0, 70.0, 71.0, 85.0, 71.0, 63.0, 50.0, 39.0, 37.0, 25.0, 13.0, 17.0, 15.0, 8.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11321540921926498, -0.10929177701473236, -0.10536813735961914, -0.10144450515508652, -0.0975208654999733, -0.09359723329544067, -0.08967359364032745, -0.08574996143579483, -0.08182632923126221, -0.07790269702672958, -0.07397905737161636, -0.07005542516708374, -0.06613178551197052, -0.0622081533074379, -0.058284517377614975, -0.05436088144779205, -0.05043724179267883, -0.04651360586285591, -0.04258996993303299, -0.038666337728500366, -0.034742698073387146, -0.030819064006209373, -0.0268954299390316, -0.02297179400920868, -0.019048158079385757, -0.015124522149562836, -0.011200887151062489, -0.007277252152562141, -0.0033536162227392197, 0.0005700197070837021, 0.004493653774261475, 0.008417289704084396, 0.012340933084487915, 0.016264569014310837, 0.02018820494413376, 0.02411183901131153, 0.028035474941134453, 0.031959109008312225, 0.03588274493813515, 0.03980638086795807, 0.04373001679778099, 0.04765365272760391, 0.051577288657426834, 0.055500924587249756, 0.05942455679178238, 0.0633481964468956, 0.06727182865142822, 0.07119546830654144, 0.07511910051107407, 0.07904273271560669, 0.08296637237071991, 0.08689000457525253, 0.09081364423036575, 0.09473727643489838, 0.0986609160900116, 0.10258454829454422, 0.10650818049907684, 0.11043181270360947, 0.11435545235872269, 0.11827908456325531, 0.12220272421836853, 0.12612636387348175, 0.13004998862743378, 0.133973628282547, 0.13789726793766022]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 10.0, 9.0, 18.0, 18.0, 26.0, 28.0, 20.0, 23.0, 24.0, 30.0, 39.0, 45.0, 50.0, 43.0, 48.0, 49.0, 48.0, 35.0, 30.0, 49.0, 40.0, 37.0, 29.0, 31.0, 31.0, 28.0, 20.0, 24.0, 18.0, 11.0, 19.0, 13.0, 6.0, 4.0, 9.0, 3.0, 1.0, 2.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08047318458557129, -0.07789602130651474, -0.07531885802745819, -0.07274169474840164, -0.07016453146934509, -0.06758736819028854, -0.065010204911232, -0.062433041632175446, -0.059855878353118896, -0.05727871507406235, -0.0547015517950058, -0.05212438851594925, -0.0495472252368927, -0.04697006195783615, -0.0443928986787796, -0.04181573539972305, -0.039238572120666504, -0.036661408841609955, -0.034084245562553406, -0.03150708228349686, -0.028929919004440308, -0.02635275572538376, -0.02377559244632721, -0.02119842916727066, -0.01862126588821411, -0.016044102609157562, -0.013466939330101013, -0.010889776051044464, -0.008312612771987915, -0.005735449492931366, -0.003158286213874817, -0.0005811229348182678, 0.0019960403442382812, 0.00457320362329483, 0.007150366902351379, 0.009727530181407928, 0.012304693460464478, 0.014881856739521027, 0.017459020018577576, 0.020036183297634125, 0.022613346576690674, 0.025190509855747223, 0.027767673134803772, 0.03034483641386032, 0.03292199969291687, 0.03549916297197342, 0.03807632625102997, 0.04065348953008652, 0.043230652809143066, 0.045807816088199615, 0.048384979367256165, 0.050962142646312714, 0.05353930592536926, 0.05611646920442581, 0.05869363248348236, 0.06127079576253891, 0.06384795904159546, 0.06642512232065201, 0.06900228559970856, 0.0715794488787651, 0.07415661215782166, 0.0767337754368782, 0.07931093871593475, 0.0818881019949913, 0.08446526527404785]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 12.0, 8.0, 7.0, 5.0, 20.0, 13.0, 20.0, 19.0, 23.0, 20.0, 29.0, 26.0, 24.0, 33.0, 34.0, 35.0, 47.0, 40.0, 48.0, 45.0, 34.0, 44.0, 47.0, 38.0, 36.0, 30.0, 27.0, 36.0, 18.0, 24.0, 30.0, 8.0, 24.0, 17.0, 10.0, 13.0, 6.0, 10.0, 11.0, 2.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.359375, -22.6142578125, -21.869140625, -21.1240234375, -20.37890625, -19.6337890625, -18.888671875, -18.1435546875, -17.3984375, -16.6533203125, -15.908203125, -15.1630859375, -14.41796875, -13.6728515625, -12.927734375, -12.1826171875, -11.4375, -10.6923828125, -9.947265625, -9.2021484375, -8.45703125, -7.7119140625, -6.966796875, -6.2216796875, -5.4765625, -4.7314453125, -3.986328125, -3.2412109375, -2.49609375, -1.7509765625, -1.005859375, -0.2607421875, 0.484375, 1.2294921875, 1.974609375, 2.7197265625, 3.46484375, 4.2099609375, 4.955078125, 5.7001953125, 6.4453125, 7.1904296875, 7.935546875, 8.6806640625, 9.42578125, 10.1708984375, 10.916015625, 11.6611328125, 12.40625, 13.1513671875, 13.896484375, 14.6416015625, 15.38671875, 16.1318359375, 16.876953125, 17.6220703125, 18.3671875, 19.1123046875, 19.857421875, 20.6025390625, 21.34765625, 22.0927734375, 22.837890625, 23.5830078125, 24.328125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 13.0, 9.0, 5.0, 13.0, 14.0, 21.0, 22.0, 21.0, 31.0, 26.0, 51.0, 90.0, 215.0, 533.0, 1847.0, 7481.0, 45061.0, 391356.0, 520457.0, 67634.0, 10045.0, 2255.0, 665.0, 265.0, 100.0, 55.0, 32.0, 29.0, 35.0, 20.0, 16.0, 15.0, 14.0, 18.0, 8.0, 10.0, 7.0, 10.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.35546875, -5.1885986328125, -5.021728515625, -4.8548583984375, -4.68798828125, -4.5211181640625, -4.354248046875, -4.1873779296875, -4.0205078125, -3.8536376953125, -3.686767578125, -3.5198974609375, -3.35302734375, -3.1861572265625, -3.019287109375, -2.8524169921875, -2.685546875, -2.5186767578125, -2.351806640625, -2.1849365234375, -2.01806640625, -1.8511962890625, -1.684326171875, -1.5174560546875, -1.3505859375, -1.1837158203125, -1.016845703125, -0.8499755859375, -0.68310546875, -0.5162353515625, -0.349365234375, -0.1824951171875, -0.015625, 0.1512451171875, 0.318115234375, 0.4849853515625, 0.65185546875, 0.8187255859375, 0.985595703125, 1.1524658203125, 1.3193359375, 1.4862060546875, 1.653076171875, 1.8199462890625, 1.98681640625, 2.1536865234375, 2.320556640625, 2.4874267578125, 2.654296875, 2.8211669921875, 2.988037109375, 3.1549072265625, 3.32177734375, 3.4886474609375, 3.655517578125, 3.8223876953125, 3.9892578125, 4.1561279296875, 4.322998046875, 4.4898681640625, 4.65673828125, 4.8236083984375, 4.990478515625, 5.1573486328125, 5.32421875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 10.0, 10.0, 19.0, 18.0, 31.0, 31.0, 35.0, 37.0, 58.0, 63.0, 84.0, 69.0, 2115.0, 68.0, 70.0, 47.0, 51.0, 42.0, 39.0, 40.0, 21.0, 23.0, 15.0, 10.0, 13.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.0, -47.52734375, -46.0546875, -44.58203125, -43.109375, -41.63671875, -40.1640625, -38.69140625, -37.21875, -35.74609375, -34.2734375, -32.80078125, -31.328125, -29.85546875, -28.3828125, -26.91015625, -25.4375, -23.96484375, -22.4921875, -21.01953125, -19.546875, -18.07421875, -16.6015625, -15.12890625, -13.65625, -12.18359375, -10.7109375, -9.23828125, -7.765625, -6.29296875, -4.8203125, -3.34765625, -1.875, -0.40234375, 1.0703125, 2.54296875, 4.015625, 5.48828125, 6.9609375, 8.43359375, 9.90625, 11.37890625, 12.8515625, 14.32421875, 15.796875, 17.26953125, 18.7421875, 20.21484375, 21.6875, 23.16015625, 24.6328125, 26.10546875, 27.578125, 29.05078125, 30.5234375, 31.99609375, 33.46875, 34.94140625, 36.4140625, 37.88671875, 39.359375, 40.83203125, 42.3046875, 43.77734375, 45.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 12.0, 15.0, 14.0, 20.0, 37.0, 48.0, 79.0, 127.0, 175.0, 241.0, 444.0, 822.0, 1618.0, 3763.0, 11599.0, 46541.0, 224188.0, 2600945.0, 196565.0, 41198.0, 10249.0, 3536.0, 1507.0, 775.0, 438.0, 243.0, 162.0, 101.0, 67.0, 54.0, 28.0, 16.0, 25.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.1640625, -3.072235107421875, -2.98040771484375, -2.888580322265625, -2.7967529296875, -2.704925537109375, -2.61309814453125, -2.521270751953125, -2.429443359375, -2.337615966796875, -2.24578857421875, -2.153961181640625, -2.0621337890625, -1.970306396484375, -1.87847900390625, -1.786651611328125, -1.69482421875, -1.602996826171875, -1.51116943359375, -1.419342041015625, -1.3275146484375, -1.235687255859375, -1.14385986328125, -1.052032470703125, -0.960205078125, -0.868377685546875, -0.77655029296875, -0.684722900390625, -0.5928955078125, -0.501068115234375, -0.40924072265625, -0.317413330078125, -0.2255859375, -0.133758544921875, -0.04193115234375, 0.049896240234375, 0.1417236328125, 0.233551025390625, 0.32537841796875, 0.417205810546875, 0.509033203125, 0.600860595703125, 0.69268798828125, 0.784515380859375, 0.8763427734375, 0.968170166015625, 1.05999755859375, 1.151824951171875, 1.24365234375, 1.335479736328125, 1.42730712890625, 1.519134521484375, 1.6109619140625, 1.702789306640625, 1.79461669921875, 1.886444091796875, 1.978271484375, 2.070098876953125, 2.16192626953125, 2.253753662109375, 2.3455810546875, 2.437408447265625, 2.52923583984375, 2.621063232421875, 2.712890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 7.0, 9.0, 20.0, 30.0, 51.0, 72.0, 110.0, 182.0, 145.0, 119.0, 75.0, 56.0, 40.0, 24.0, 13.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.18195343017578, -45.56523132324219, -43.948509216308594, -42.331787109375, -40.715065002441406, -39.09834289550781, -37.48162078857422, -35.864898681640625, -34.24817657470703, -32.63145446777344, -31.014732360839844, -29.39801025390625, -27.781288146972656, -26.164566040039062, -24.54784393310547, -22.931121826171875, -21.314401626586914, -19.69767951965332, -18.080957412719727, -16.464235305786133, -14.847513198852539, -13.230792045593262, -11.614069938659668, -9.997347831726074, -8.38062572479248, -6.763903617858887, -5.147181510925293, -3.5304598808288574, -1.9137377738952637, -0.2970161437988281, 1.3197059631347656, 2.9364280700683594, 4.553150177001953, 6.169872283935547, 7.786594390869141, 9.403316497802734, 11.020038604736328, 12.636759757995605, 14.2534818649292, 15.870203971862793, 17.486927032470703, 19.103649139404297, 20.72037124633789, 22.337093353271484, 23.953815460205078, 25.570537567138672, 27.187259674072266, 28.80398178100586, 30.42070198059082, 32.03742218017578, 33.654144287109375, 35.27086639404297, 36.88758850097656, 38.504310607910156, 40.12103271484375, 41.737754821777344, 43.35447692871094, 44.97119903564453, 46.587921142578125, 48.20464324951172, 49.82136535644531, 51.438087463378906, 53.0548095703125, 54.671531677246094, 56.28825378417969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 9.0, 6.0, 5.0, 10.0, 13.0, 16.0, 18.0, 15.0, 24.0, 23.0, 36.0, 24.0, 33.0, 31.0, 34.0, 44.0, 35.0, 44.0, 34.0, 47.0, 48.0, 45.0, 39.0, 45.0, 40.0, 25.0, 35.0, 38.0, 18.0, 23.0, 24.0, 15.0, 23.0, 12.0, 20.0, 12.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.71887969970703, -41.32689666748047, -39.934913635253906, -38.542930603027344, -37.15094757080078, -35.758968353271484, -34.36698532104492, -32.97500228881836, -31.583019256591797, -30.191036224365234, -28.799053192138672, -27.407072067260742, -26.01508903503418, -24.623106002807617, -23.231124877929688, -21.839141845703125, -20.447158813476562, -19.05517578125, -17.663192749023438, -16.271211624145508, -14.879228591918945, -13.487245559692383, -12.095263481140137, -10.70328140258789, -9.311298370361328, -7.919315814971924, -6.5273332595825195, -5.135350704193115, -3.743368148803711, -2.3513855934143066, -0.9594030380249023, 0.43257904052734375, 1.8245620727539062, 3.2165446281433105, 4.608527183532715, 6.000509738922119, 7.392492294311523, 8.784475326538086, 10.176457405090332, 11.568439483642578, 12.96042251586914, 14.352405548095703, 15.74438762664795, 17.136369705200195, 18.528352737426758, 19.92033576965332, 21.31231689453125, 22.704299926757812, 24.096282958984375, 25.488265991210938, 26.8802490234375, 28.27223014831543, 29.664213180541992, 31.056196212768555, 32.448177337646484, 33.84016036987305, 35.23214340209961, 36.62412643432617, 38.016109466552734, 39.4080924987793, 40.800071716308594, 42.192054748535156, 43.58403778076172, 44.97602081298828, 46.368003845214844]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 7.0, 11.0, 9.0, 20.0, 30.0, 38.0, 57.0, 61.0, 114.0, 114.0, 211.0, 383.0, 683.0, 1435.0, 3201.0, 8722.0, 1025654.0, 4072.0, 1749.0, 819.0, 387.0, 221.0, 164.0, 94.0, 72.0, 53.0, 30.0, 21.0, 12.0, 16.0, 19.0, 16.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.935699462890625, -15.388357162475586, -14.841014862060547, -14.293672561645508, -13.746330261230469, -13.19898796081543, -12.65164566040039, -12.104303359985352, -11.556961059570312, -11.009618759155273, -10.462276458740234, -9.914934158325195, -9.367591857910156, -8.820249557495117, -8.272907257080078, -7.725565433502197, -7.178223609924316, -6.630881309509277, -6.083539009094238, -5.536196708679199, -4.98885440826416, -4.441512107849121, -3.8941702842712402, -3.346827983856201, -2.799485683441162, -2.252143383026123, -1.7048012018203735, -1.157459020614624, -0.610116720199585, -0.0627744197845459, 0.48456764221191406, 1.0319099426269531, 1.5792522430419922, 2.1265945434570312, 2.6739368438720703, 3.2212789058685303, 3.7686212062835693, 4.3159637451171875, 4.863305568695068, 5.410647869110107, 5.9579901695251465, 6.5053324699401855, 7.052674770355225, 7.6000165939331055, 8.147358894348145, 8.694701194763184, 9.242043495178223, 9.789385795593262, 10.3367280960083, 10.88407039642334, 11.431412696838379, 11.978754997253418, 12.526097297668457, 13.073439598083496, 13.620780944824219, 14.168123245239258, 14.715465545654297, 15.262807846069336, 15.810150146484375, 16.357492446899414, 16.904834747314453, 17.452177047729492, 17.99951934814453, 18.54686164855957, 19.09420394897461]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 12.0, 4.0, 10.0, 45.0, 649.0, 51460040.0, 2251.0, 106.0, 15.0, 6.0, 10.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-693.6778564453125, -675.2608642578125, -656.8438720703125, -638.4268798828125, -620.0098876953125, -601.5928955078125, -583.1759033203125, -564.7589111328125, -546.3419189453125, -527.9249267578125, -509.5079345703125, -491.0909423828125, -472.6739501953125, -454.2569580078125, -435.8399963378906, -417.4230041503906, -399.00604248046875, -380.58905029296875, -362.17205810546875, -343.75506591796875, -325.33807373046875, -306.92108154296875, -288.5041198730469, -270.0871276855469, -251.67013549804688, -233.25314331054688, -214.83615112304688, -196.41917419433594, -178.00218200683594, -159.58518981933594, -141.168212890625, -122.751220703125, -104.33425903320312, -85.91726684570312, -67.50028228759766, -49.08329391479492, -30.666305541992188, -12.249313354492188, 6.167671203613281, 24.58465576171875, 43.00164794921875, 61.418636322021484, 79.83562469482422, 98.25260925292969, 116.66960144042969, 135.0865936279297, 153.50357055664062, 171.92056274414062, 190.33755493164062, 208.75454711914062, 227.17153930664062, 245.58851623535156, 264.0054931640625, 282.4224853515625, 300.8394775390625, 319.2564697265625, 337.6734619140625, 356.0904541015625, 374.5074462890625, 392.9244384765625, 411.3414306640625, 429.7584228515625, 448.1753845214844, 466.5923767089844, 485.0093688964844]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 13.0, 13.0, 22.0, 34.0, 36.0, 45.0, 59.0, 68.0, 82.0, 104.0, 114.0, 90.0, 65.0, 54.0, 36.0, 30.0, 25.0, 14.0, 18.0, 6.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.240867614746094, -43.900184631347656, -42.559505462646484, -41.21882247924805, -39.878143310546875, -38.53746032714844, -37.19677734375, -35.85609817504883, -34.51541519165039, -33.17473220825195, -31.83405303955078, -30.493370056152344, -29.15268898010254, -27.812007904052734, -26.47132682800293, -25.130645751953125, -23.78996467590332, -22.449283599853516, -21.10860252380371, -19.767921447753906, -18.42723846435547, -17.086557388305664, -15.74587631225586, -14.405194282531738, -13.064513206481934, -11.723832130432129, -10.383150100708008, -9.042469024658203, -7.70178747177124, -6.361105918884277, -5.020424842834473, -3.6797428131103516, -2.339061737060547, -0.9983803033828735, 0.3423011302947998, 1.6829824447631836, 3.0236639976501465, 4.364345550537109, 5.705026626586914, 7.045708656311035, 8.38638973236084, 9.727070808410645, 11.067752838134766, 12.40843391418457, 13.749114990234375, 15.089797019958496, 16.430477142333984, 17.771160125732422, 19.111841201782227, 20.45252227783203, 21.793203353881836, 23.13388442993164, 24.474567413330078, 25.815248489379883, 27.155929565429688, 28.496612548828125, 29.837291717529297, 31.1779727935791, 32.518653869628906, 33.859336853027344, 35.200016021728516, 36.54069900512695, 37.881378173828125, 39.22206115722656, 40.562744140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 15.0, 9.0, 9.0, 15.0, 12.0, 30.0, 15.0, 25.0, 30.0, 38.0, 35.0, 32.0, 33.0, 35.0, 36.0, 31.0, 56.0, 34.0, 51.0, 39.0, 41.0, 35.0, 46.0, 28.0, 37.0, 25.0, 21.0, 22.0, 18.0, 23.0, 20.0, 12.0, 5.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.677288055419922, -27.8645076751709, -27.051727294921875, -26.238948822021484, -25.42616844177246, -24.613388061523438, -23.800607681274414, -22.98782730102539, -22.175048828125, -21.362268447875977, -20.549488067626953, -19.736709594726562, -18.92392921447754, -18.111148834228516, -17.298368453979492, -16.48558807373047, -15.672807693481445, -14.860027313232422, -14.047247886657715, -13.234467506408691, -12.421688079833984, -11.608907699584961, -10.796127319335938, -9.983346939086914, -9.170567512512207, -8.357787132263184, -7.545007705688477, -6.732227325439453, -5.919447422027588, -5.106667518615723, -4.293887138366699, -3.481107234954834, -2.6683292388916016, -1.8555492162704468, -1.042769193649292, -0.22998905181884766, 0.5827908515930176, 1.3955707550048828, 2.2083511352539062, 3.0211310386657715, 3.8339109420776367, 4.646690845489502, 5.459470748901367, 6.272251129150391, 7.085031032562256, 7.897810935974121, 8.710591316223145, 9.523370742797852, 10.336151123046875, 11.148931503295898, 11.961710929870605, 12.774491310119629, 13.587270736694336, 14.40005111694336, 15.212831497192383, 16.025611877441406, 16.838390350341797, 17.65117073059082, 18.463951110839844, 19.276729583740234, 20.089509963989258, 20.90229034423828, 21.715070724487305, 22.527851104736328, 23.34063148498535]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 9.0, 6.0, 15.0, 18.0, 27.0, 31.0, 54.0, 87.0, 112.0, 211.0, 306.0, 496.0, 815.0, 1403.0, 2568.0, 4939.0, 10453.0, 25256.0, 92052.0, 3099234.0, 851509.0, 69149.0, 19663.0, 7784.0, 3661.0, 1851.0, 997.0, 605.0, 365.0, 213.0, 122.0, 63.0, 73.0, 38.0, 32.0, 22.0, 15.0, 5.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.513092041015625, -1.46075439453125, -1.408416748046875, -1.3560791015625, -1.303741455078125, -1.25140380859375, -1.199066162109375, -1.146728515625, -1.094390869140625, -1.04205322265625, -0.989715576171875, -0.9373779296875, -0.885040283203125, -0.83270263671875, -0.780364990234375, -0.72802734375, -0.675689697265625, -0.62335205078125, -0.571014404296875, -0.5186767578125, -0.466339111328125, -0.41400146484375, -0.361663818359375, -0.309326171875, -0.256988525390625, -0.20465087890625, -0.152313232421875, -0.0999755859375, -0.047637939453125, 0.00469970703125, 0.057037353515625, 0.109375, 0.161712646484375, 0.21405029296875, 0.266387939453125, 0.3187255859375, 0.371063232421875, 0.42340087890625, 0.475738525390625, 0.528076171875, 0.580413818359375, 0.63275146484375, 0.685089111328125, 0.7374267578125, 0.789764404296875, 0.84210205078125, 0.894439697265625, 0.94677734375, 0.999114990234375, 1.05145263671875, 1.103790283203125, 1.1561279296875, 1.208465576171875, 1.26080322265625, 1.313140869140625, 1.365478515625, 1.417816162109375, 1.47015380859375, 1.522491455078125, 1.5748291015625, 1.627166748046875, 1.67950439453125, 1.731842041015625, 1.7841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 14.0, 13.0, 18.0, 19.0, 43.0, 71.0, 113.0, 153.0, 150.0, 138.0, 91.0, 50.0, 21.0, 19.0, 12.0, 11.0, 6.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2433013916015625, -0.236114501953125, -0.2289276123046875, -0.22174072265625, -0.2145538330078125, -0.207366943359375, -0.2001800537109375, -0.1929931640625, -0.1858062744140625, -0.178619384765625, -0.1714324951171875, -0.16424560546875, -0.1570587158203125, -0.149871826171875, -0.1426849365234375, -0.135498046875, -0.1283111572265625, -0.121124267578125, -0.1139373779296875, -0.10675048828125, -0.0995635986328125, -0.092376708984375, -0.0851898193359375, -0.0780029296875, -0.0708160400390625, -0.063629150390625, -0.0564422607421875, -0.04925537109375, -0.0420684814453125, -0.034881591796875, -0.0276947021484375, -0.0205078125, -0.0133209228515625, -0.006134033203125, 0.0010528564453125, 0.00823974609375, 0.0154266357421875, 0.022613525390625, 0.0298004150390625, 0.0369873046875, 0.0441741943359375, 0.051361083984375, 0.0585479736328125, 0.06573486328125, 0.0729217529296875, 0.080108642578125, 0.0872955322265625, 0.094482421875, 0.1016693115234375, 0.108856201171875, 0.1160430908203125, 0.12322998046875, 0.1304168701171875, 0.137603759765625, 0.1447906494140625, 0.1519775390625, 0.1591644287109375, 0.166351318359375, 0.1735382080078125, 0.18072509765625, 0.1879119873046875, 0.195098876953125, 0.2022857666015625, 0.20947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 13.0, 7.0, 5.0, 12.0, 20.0, 25.0, 53.0, 84.0, 107.0, 144.0, 246.0, 372.0, 523.0, 848.0, 1436.0, 2447.0, 4232.0, 8276.0, 16801.0, 38302.0, 102800.0, 376937.0, 2878066.0, 542047.0, 131524.0, 47248.0, 19899.0, 9627.0, 4963.0, 2810.0, 1625.0, 976.0, 614.0, 383.0, 261.0, 171.0, 129.0, 71.0, 66.0, 35.0, 22.0, 20.0, 15.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0602264404296875, -1.021820068359375, -0.9834136962890625, -0.94500732421875, -0.9066009521484375, -0.868194580078125, -0.8297882080078125, -0.7913818359375, -0.7529754638671875, -0.714569091796875, -0.6761627197265625, -0.63775634765625, -0.5993499755859375, -0.560943603515625, -0.5225372314453125, -0.484130859375, -0.4457244873046875, -0.407318115234375, -0.3689117431640625, -0.33050537109375, -0.2920989990234375, -0.253692626953125, -0.2152862548828125, -0.1768798828125, -0.1384735107421875, -0.100067138671875, -0.0616607666015625, -0.02325439453125, 0.0151519775390625, 0.053558349609375, 0.0919647216796875, 0.13037109375, 0.1687774658203125, 0.207183837890625, 0.2455902099609375, 0.28399658203125, 0.3224029541015625, 0.360809326171875, 0.3992156982421875, 0.4376220703125, 0.4760284423828125, 0.514434814453125, 0.5528411865234375, 0.59124755859375, 0.6296539306640625, 0.668060302734375, 0.7064666748046875, 0.744873046875, 0.7832794189453125, 0.821685791015625, 0.8600921630859375, 0.89849853515625, 0.9369049072265625, 0.975311279296875, 1.0137176513671875, 1.0521240234375, 1.0905303955078125, 1.128936767578125, 1.1673431396484375, 1.20574951171875, 1.2441558837890625, 1.282562255859375, 1.3209686279296875, 1.359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 15.0, 17.0, 24.0, 29.0, 51.0, 48.0, 62.0, 83.0, 118.0, 148.0, 257.0, 384.0, 1020.0, 676.0, 328.0, 198.0, 131.0, 95.0, 73.0, 68.0, 46.0, 50.0, 28.0, 16.0, 22.0, 13.0, 10.0, 3.0, 8.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2673225402832031, -0.25656890869140625, -0.24581527709960938, -0.2350616455078125, -0.22430801391601562, -0.21355438232421875, -0.20280075073242188, -0.192047119140625, -0.18129348754882812, -0.17053985595703125, -0.15978622436523438, -0.1490325927734375, -0.13827896118164062, -0.12752532958984375, -0.11677169799804688, -0.10601806640625, -0.09526443481445312, -0.08451080322265625, -0.07375717163085938, -0.0630035400390625, -0.052249908447265625, -0.04149627685546875, -0.030742645263671875, -0.019989013671875, -0.009235382080078125, 0.00151824951171875, 0.012271881103515625, 0.0230255126953125, 0.033779144287109375, 0.04453277587890625, 0.055286407470703125, 0.0660400390625, 0.07679367065429688, 0.08754730224609375, 0.09830093383789062, 0.1090545654296875, 0.11980819702148438, 0.13056182861328125, 0.14131546020507812, 0.152069091796875, 0.16282272338867188, 0.17357635498046875, 0.18432998657226562, 0.1950836181640625, 0.20583724975585938, 0.21659088134765625, 0.22734451293945312, 0.23809814453125, 0.24885177612304688, 0.25960540771484375, 0.2703590393066406, 0.2811126708984375, 0.2918663024902344, 0.30261993408203125, 0.3133735656738281, 0.324127197265625, 0.3348808288574219, 0.34563446044921875, 0.3563880920410156, 0.3671417236328125, 0.3778953552246094, 0.38864898681640625, 0.3994026184082031, 0.41015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 7.0, 6.0, 14.0, 12.0, 33.0, 43.0, 79.0, 113.0, 178.0, 169.0, 120.0, 69.0, 66.0, 26.0, 21.0, 9.0, 12.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6453351974487305, -3.504408836364746, -3.3634824752807617, -3.2225561141967773, -3.081629753112793, -2.9407033920288086, -2.799777030944824, -2.65885066986084, -2.5179243087768555, -2.376997947692871, -2.2360715866088867, -2.0951452255249023, -1.954218864440918, -1.8132925033569336, -1.6723662614822388, -1.5314399003982544, -1.3905136585235596, -1.2495872974395752, -1.1086609363555908, -0.9677346348762512, -0.8268082737922668, -0.6858819127082825, -0.5449556112289429, -0.4040292501449585, -0.2631028890609741, -0.12217654287815094, 0.01874980330467224, 0.15967613458633423, 0.3006024956703186, 0.441528856754303, 0.5824551582336426, 0.723381519317627, 0.8643078804016113, 1.0052342414855957, 1.14616060256958, 1.2870869636535645, 1.4280133247375488, 1.5689396858215332, 1.709865927696228, 1.8507922887802124, 1.9917186498641968, 2.1326448917388916, 2.273571252822876, 2.4144976139068604, 2.5554239749908447, 2.696350336074829, 2.8372766971588135, 2.978203058242798, 3.1191294193267822, 3.2600557804107666, 3.400982141494751, 3.5419085025787354, 3.6828348636627197, 3.823761224746704, 3.9646873474121094, 4.105613708496094, 4.246540069580078, 4.3874664306640625, 4.528392791748047, 4.669319152832031, 4.810245513916016, 4.951171875, 5.092098236083984, 5.233024597167969, 5.373950958251953]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 12.0, 9.0, 13.0, 16.0, 13.0, 23.0, 23.0, 23.0, 31.0, 33.0, 50.0, 39.0, 47.0, 50.0, 50.0, 53.0, 42.0, 43.0, 56.0, 38.0, 44.0, 38.0, 34.0, 32.0, 29.0, 20.0, 18.0, 11.0, 14.0, 13.0, 12.0, 8.0, 9.0, 2.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.381821870803833, -1.3363724946975708, -1.2909231185913086, -1.2454737424850464, -1.2000243663787842, -1.154574990272522, -1.1091256141662598, -1.063676118850708, -1.0182268619537354, -0.9727774858474731, -0.9273281097412109, -0.8818787336349487, -0.8364293575286865, -0.7909799814224243, -0.7455305457115173, -0.7000811696052551, -0.6546317338943481, -0.6091823577880859, -0.5637329816818237, -0.5182836055755615, -0.47283419966697693, -0.4273848235607147, -0.3819354176521301, -0.3364860415458679, -0.2910366654396057, -0.2455872893333435, -0.2001378983259201, -0.1546885073184967, -0.1092391312122345, -0.06378975510597229, -0.018340349197387695, 0.02710902690887451, 0.07255840301513672, 0.11800778657197952, 0.16345717012882233, 0.20890656113624573, 0.25435593724250793, 0.29980531334877014, 0.34525471925735474, 0.39070409536361694, 0.43615347146987915, 0.48160284757614136, 0.5270522236824036, 0.5725016593933105, 0.6179510354995728, 0.663400411605835, 0.7088497877120972, 0.7542991638183594, 0.7997485399246216, 0.8451979160308838, 0.890647292137146, 0.9360966682434082, 0.9815460443496704, 1.0269954204559326, 1.0724449157714844, 1.117894172668457, 1.1633436679840088, 1.208793044090271, 1.2542424201965332, 1.2996917963027954, 1.3451411724090576, 1.3905905485153198, 1.436039924621582, 1.4814894199371338, 1.5269386768341064]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 19.0, 19.0, 26.0, 33.0, 42.0, 71.0, 115.0, 152.0, 279.0, 385.0, 584.0, 954.0, 1606.0, 2561.0, 4395.0, 7627.0, 14201.0, 32527.0, 100604.0, 372430.0, 354090.0, 93001.0, 30859.0, 13772.0, 7141.0, 4212.0, 2552.0, 1596.0, 952.0, 612.0, 385.0, 243.0, 150.0, 117.0, 75.0, 50.0, 26.0, 26.0, 22.0, 12.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9428558349609375, -0.909149169921875, -0.8754425048828125, -0.84173583984375, -0.8080291748046875, -0.774322509765625, -0.7406158447265625, -0.7069091796875, -0.6732025146484375, -0.639495849609375, -0.6057891845703125, -0.57208251953125, -0.5383758544921875, -0.504669189453125, -0.4709625244140625, -0.437255859375, -0.4035491943359375, -0.369842529296875, -0.3361358642578125, -0.30242919921875, -0.2687225341796875, -0.235015869140625, -0.2013092041015625, -0.1676025390625, -0.1338958740234375, -0.100189208984375, -0.0664825439453125, -0.03277587890625, 0.0009307861328125, 0.034637451171875, 0.0683441162109375, 0.10205078125, 0.1357574462890625, 0.169464111328125, 0.2031707763671875, 0.23687744140625, 0.2705841064453125, 0.304290771484375, 0.3379974365234375, 0.3717041015625, 0.4054107666015625, 0.439117431640625, 0.4728240966796875, 0.50653076171875, 0.5402374267578125, 0.573944091796875, 0.6076507568359375, 0.641357421875, 0.6750640869140625, 0.708770751953125, 0.7424774169921875, 0.77618408203125, 0.8098907470703125, 0.843597412109375, 0.8773040771484375, 0.9110107421875, 0.9447174072265625, 0.978424072265625, 1.0121307373046875, 1.04583740234375, 1.0795440673828125, 1.113250732421875, 1.1469573974609375, 1.1806640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 10.0, 3.0, 9.0, 9.0, 11.0, 20.0, 44.0, 56.0, 85.0, 151.0, 145.0, 138.0, 113.0, 66.0, 39.0, 21.0, 19.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.297607421875, -0.2900409698486328, -0.2824745178222656, -0.27490806579589844, -0.26734161376953125, -0.25977516174316406, -0.2522087097167969, -0.2446422576904297, -0.2370758056640625, -0.2295093536376953, -0.22194290161132812, -0.21437644958496094, -0.20680999755859375, -0.19924354553222656, -0.19167709350585938, -0.1841106414794922, -0.176544189453125, -0.1689777374267578, -0.16141128540039062, -0.15384483337402344, -0.14627838134765625, -0.13871192932128906, -0.13114547729492188, -0.12357902526855469, -0.1160125732421875, -0.10844612121582031, -0.10087966918945312, -0.09331321716308594, -0.08574676513671875, -0.07818031311035156, -0.07061386108398438, -0.06304740905761719, -0.05548095703125, -0.04791450500488281, -0.040348052978515625, -0.03278160095214844, -0.02521514892578125, -0.017648696899414062, -0.010082244873046875, -0.0025157928466796875, 0.0050506591796875, 0.012617111206054688, 0.020183563232421875, 0.027750015258789062, 0.03531646728515625, 0.04288291931152344, 0.050449371337890625, 0.05801582336425781, 0.065582275390625, 0.07314872741699219, 0.08071517944335938, 0.08828163146972656, 0.09584808349609375, 0.10341453552246094, 0.11098098754882812, 0.11854743957519531, 0.1261138916015625, 0.1336803436279297, 0.14124679565429688, 0.14881324768066406, 0.15637969970703125, 0.16394615173339844, 0.17151260375976562, 0.1790790557861328, 0.1866455078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 8.0, 10.0, 13.0, 15.0, 25.0, 45.0, 71.0, 103.0, 167.0, 240.0, 384.0, 596.0, 941.0, 1519.0, 2678.0, 4476.0, 8166.0, 15942.0, 31912.0, 69580.0, 157375.0, 300588.0, 241203.0, 111686.0, 49610.0, 23859.0, 12021.0, 6353.0, 3506.0, 2006.0, 1258.0, 832.0, 460.0, 296.0, 224.0, 138.0, 78.0, 57.0, 32.0, 30.0, 25.0, 10.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8852386474609375, -0.857391357421875, -0.8295440673828125, -0.80169677734375, -0.7738494873046875, -0.746002197265625, -0.7181549072265625, -0.6903076171875, -0.6624603271484375, -0.634613037109375, -0.6067657470703125, -0.57891845703125, -0.5510711669921875, -0.523223876953125, -0.4953765869140625, -0.467529296875, -0.4396820068359375, -0.411834716796875, -0.3839874267578125, -0.35614013671875, -0.3282928466796875, -0.300445556640625, -0.2725982666015625, -0.2447509765625, -0.2169036865234375, -0.189056396484375, -0.1612091064453125, -0.13336181640625, -0.1055145263671875, -0.077667236328125, -0.0498199462890625, -0.02197265625, 0.0058746337890625, 0.033721923828125, 0.0615692138671875, 0.08941650390625, 0.1172637939453125, 0.145111083984375, 0.1729583740234375, 0.2008056640625, 0.2286529541015625, 0.256500244140625, 0.2843475341796875, 0.31219482421875, 0.3400421142578125, 0.367889404296875, 0.3957366943359375, 0.423583984375, 0.4514312744140625, 0.479278564453125, 0.5071258544921875, 0.53497314453125, 0.5628204345703125, 0.590667724609375, 0.6185150146484375, 0.6463623046875, 0.6742095947265625, 0.702056884765625, 0.7299041748046875, 0.75775146484375, 0.7855987548828125, 0.813446044921875, 0.8412933349609375, 0.869140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 3.0, 15.0, 14.0, 17.0, 17.0, 18.0, 38.0, 32.0, 33.0, 29.0, 37.0, 34.0, 45.0, 33.0, 43.0, 43.0, 68.0, 45.0, 33.0, 35.0, 39.0, 39.0, 34.0, 19.0, 27.0, 19.0, 23.0, 18.0, 13.0, 13.0, 14.0, 13.0, 10.0, 9.0, 6.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.8369140625, -0.810455322265625, -0.78399658203125, -0.757537841796875, -0.7310791015625, -0.704620361328125, -0.67816162109375, -0.651702880859375, -0.625244140625, -0.598785400390625, -0.57232666015625, -0.545867919921875, -0.5194091796875, -0.492950439453125, -0.46649169921875, -0.440032958984375, -0.41357421875, -0.387115478515625, -0.36065673828125, -0.334197998046875, -0.3077392578125, -0.281280517578125, -0.25482177734375, -0.228363037109375, -0.201904296875, -0.175445556640625, -0.14898681640625, -0.122528076171875, -0.0960693359375, -0.069610595703125, -0.04315185546875, -0.016693115234375, 0.009765625, 0.036224365234375, 0.06268310546875, 0.089141845703125, 0.1156005859375, 0.142059326171875, 0.16851806640625, 0.194976806640625, 0.221435546875, 0.247894287109375, 0.27435302734375, 0.300811767578125, 0.3272705078125, 0.353729248046875, 0.38018798828125, 0.406646728515625, 0.43310546875, 0.459564208984375, 0.48602294921875, 0.512481689453125, 0.5389404296875, 0.565399169921875, 0.59185791015625, 0.618316650390625, 0.644775390625, 0.671234130859375, 0.69769287109375, 0.724151611328125, 0.7506103515625, 0.777069091796875, 0.80352783203125, 0.829986572265625, 0.8564453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 9.0, 10.0, 17.0, 10.0, 28.0, 46.0, 66.0, 87.0, 159.0, 283.0, 542.0, 1112.0, 2483.0, 6578.0, 22727.0, 144994.0, 721116.0, 117769.0, 19863.0, 5956.0, 2394.0, 1048.0, 517.0, 290.0, 166.0, 97.0, 63.0, 42.0, 30.0, 19.0, 9.0, 7.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.97930908203125, -2.8902587890625, -2.80120849609375, -2.712158203125, -2.62310791015625, -2.5340576171875, -2.44500732421875, -2.35595703125, -2.26690673828125, -2.1778564453125, -2.08880615234375, -1.999755859375, -1.91070556640625, -1.8216552734375, -1.73260498046875, -1.6435546875, -1.55450439453125, -1.4654541015625, -1.37640380859375, -1.287353515625, -1.19830322265625, -1.1092529296875, -1.02020263671875, -0.93115234375, -0.84210205078125, -0.7530517578125, -0.66400146484375, -0.574951171875, -0.48590087890625, -0.3968505859375, -0.30780029296875, -0.21875, -0.12969970703125, -0.0406494140625, 0.04840087890625, 0.137451171875, 0.22650146484375, 0.3155517578125, 0.40460205078125, 0.49365234375, 0.58270263671875, 0.6717529296875, 0.76080322265625, 0.849853515625, 0.93890380859375, 1.0279541015625, 1.11700439453125, 1.2060546875, 1.29510498046875, 1.3841552734375, 1.47320556640625, 1.562255859375, 1.65130615234375, 1.7403564453125, 1.82940673828125, 1.91845703125, 2.00750732421875, 2.0965576171875, 2.18560791015625, 2.274658203125, 2.36370849609375, 2.4527587890625, 2.54180908203125, 2.630859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 10.0, 12.0, 30.0, 16.0, 34.0, 29.0, 26.0, 45.0, 58.0, 60.0, 62.0, 71.0, 62.0, 75.0, 61.0, 58.0, 34.0, 38.0, 30.0, 32.0, 24.0, 28.0, 12.0, 9.0, 13.0, 2.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00022840499877929688, -0.00022223219275474548, -0.0002160593867301941, -0.0002098865807056427, -0.0002037137746810913, -0.00019754096865653992, -0.00019136816263198853, -0.00018519535660743713, -0.00017902255058288574, -0.00017284974455833435, -0.00016667693853378296, -0.00016050413250923157, -0.00015433132648468018, -0.00014815852046012878, -0.0001419857144355774, -0.000135812908411026, -0.0001296401023864746, -0.00012346729636192322, -0.00011729449033737183, -0.00011112168431282043, -0.00010494887828826904, -9.877607226371765e-05, -9.260326623916626e-05, -8.643046021461487e-05, -8.025765419006348e-05, -7.408484816551208e-05, -6.79120421409607e-05, -6.17392361164093e-05, -5.556643009185791e-05, -4.939362406730652e-05, -4.322081804275513e-05, -3.7048012018203735e-05, -3.0875205993652344e-05, -2.4702399969100952e-05, -1.852959394454956e-05, -1.2356787919998169e-05, -6.183981895446777e-06, -1.1175870895385742e-08, 6.161630153656006e-06, 1.2334436178207397e-05, 1.850724220275879e-05, 2.468004822731018e-05, 3.085285425186157e-05, 3.7025660276412964e-05, 4.3198466300964355e-05, 4.937127232551575e-05, 5.554407835006714e-05, 6.171688437461853e-05, 6.788969039916992e-05, 7.406249642372131e-05, 8.02353024482727e-05, 8.64081084728241e-05, 9.258091449737549e-05, 9.875372052192688e-05, 0.00010492652654647827, 0.00011109933257102966, 0.00011727213859558105, 0.00012344494462013245, 0.00012961775064468384, 0.00013579055666923523, 0.00014196336269378662, 0.000148136168718338, 0.0001543089747428894, 0.0001604817807674408, 0.0001666545867919922]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 6.0, 5.0, 14.0, 21.0, 24.0, 45.0, 62.0, 72.0, 170.0, 263.0, 514.0, 1024.0, 2108.0, 4673.0, 11779.0, 35738.0, 154226.0, 552093.0, 215150.0, 45627.0, 14399.0, 5527.0, 2434.0, 1146.0, 623.0, 297.0, 180.0, 122.0, 64.0, 41.0, 30.0, 22.0, 16.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3706817626953125, -1.324371337890625, -1.2780609130859375, -1.23175048828125, -1.1854400634765625, -1.139129638671875, -1.0928192138671875, -1.0465087890625, -1.0001983642578125, -0.953887939453125, -0.9075775146484375, -0.86126708984375, -0.8149566650390625, -0.768646240234375, -0.7223358154296875, -0.676025390625, -0.6297149658203125, -0.583404541015625, -0.5370941162109375, -0.49078369140625, -0.4444732666015625, -0.398162841796875, -0.3518524169921875, -0.3055419921875, -0.2592315673828125, -0.212921142578125, -0.1666107177734375, -0.12030029296875, -0.0739898681640625, -0.027679443359375, 0.0186309814453125, 0.06494140625, 0.1112518310546875, 0.157562255859375, 0.2038726806640625, 0.25018310546875, 0.2964935302734375, 0.342803955078125, 0.3891143798828125, 0.4354248046875, 0.4817352294921875, 0.528045654296875, 0.5743560791015625, 0.62066650390625, 0.6669769287109375, 0.713287353515625, 0.7595977783203125, 0.805908203125, 0.8522186279296875, 0.898529052734375, 0.9448394775390625, 0.99114990234375, 1.0374603271484375, 1.083770751953125, 1.1300811767578125, 1.1763916015625, 1.2227020263671875, 1.269012451171875, 1.3153228759765625, 1.36163330078125, 1.4079437255859375, 1.454254150390625, 1.5005645751953125, 1.546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 6.0, 13.0, 14.0, 22.0, 40.0, 23.0, 66.0, 77.0, 67.0, 104.0, 114.0, 108.0, 102.0, 70.0, 45.0, 44.0, 27.0, 23.0, 11.0, 10.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0078125, -0.9669952392578125, -0.926177978515625, -0.8853607177734375, -0.84454345703125, -0.8037261962890625, -0.762908935546875, -0.7220916748046875, -0.6812744140625, -0.6404571533203125, -0.599639892578125, -0.5588226318359375, -0.51800537109375, -0.4771881103515625, -0.436370849609375, -0.3955535888671875, -0.354736328125, -0.3139190673828125, -0.273101806640625, -0.2322845458984375, -0.19146728515625, -0.1506500244140625, -0.109832763671875, -0.0690155029296875, -0.0281982421875, 0.0126190185546875, 0.053436279296875, 0.0942535400390625, 0.13507080078125, 0.1758880615234375, 0.216705322265625, 0.2575225830078125, 0.29833984375, 0.3391571044921875, 0.379974365234375, 0.4207916259765625, 0.46160888671875, 0.5024261474609375, 0.543243408203125, 0.5840606689453125, 0.6248779296875, 0.6656951904296875, 0.706512451171875, 0.7473297119140625, 0.78814697265625, 0.8289642333984375, 0.869781494140625, 0.9105987548828125, 0.951416015625, 0.9922332763671875, 1.033050537109375, 1.0738677978515625, 1.11468505859375, 1.1555023193359375, 1.196319580078125, 1.2371368408203125, 1.2779541015625, 1.3187713623046875, 1.359588623046875, 1.4004058837890625, 1.44122314453125, 1.4820404052734375, 1.522857666015625, 1.5636749267578125, 1.6044921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 15.0, 19.0, 32.0, 62.0, 86.0, 130.0, 194.0, 179.0, 111.0, 55.0, 34.0, 27.0, 10.0, 8.0, 12.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.016237258911133, -24.386547088623047, -23.75685691833496, -23.127168655395508, -22.497478485107422, -21.867788314819336, -21.23809814453125, -20.608409881591797, -19.97871971130371, -19.349029541015625, -18.71933937072754, -18.089651107788086, -17.4599609375, -16.830270767211914, -16.200580596923828, -15.570891380310059, -14.941201210021973, -14.311511039733887, -13.681821823120117, -13.052131652832031, -12.422442436218262, -11.792752265930176, -11.163063049316406, -10.53337287902832, -9.903682708740234, -9.273992538452148, -8.644303321838379, -8.014613151550293, -7.384923934936523, -6.7552337646484375, -6.12554407119751, -5.495854377746582, -4.866164207458496, -4.236474514007568, -3.6067848205566406, -2.977094888687134, -2.347405195236206, -1.7177155017852783, -1.0880255699157715, -0.45833587646484375, 0.17135381698608398, 0.8010435700416565, 1.430733323097229, 2.0604231357574463, 2.690112829208374, 3.3198025226593018, 3.9494924545288086, 4.579182147979736, 5.208871841430664, 5.838561534881592, 6.4682512283325195, 7.0979413986206055, 7.727630615234375, 8.357320785522461, 8.987010955810547, 9.616700172424316, 10.246389389038086, 10.876079559326172, 11.505768775939941, 12.135458946228027, 12.765148162841797, 13.394838333129883, 14.024528503417969, 14.654217720031738, 15.283907890319824]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 17.0, 13.0, 26.0, 89.0, 142.0, 180.0, 176.0, 135.0, 67.0, 39.0, 33.0, 19.0, 14.0, 9.0, 4.0, 7.0, 2.0, 0.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.70224952697754, -15.984796524047852, -15.267342567443848, -14.549888610839844, -13.832435607910156, -13.114982604980469, -12.397528648376465, -11.680074691772461, -10.962621688842773, -10.245168685913086, -9.527714729309082, -8.810260772705078, -8.09280776977539, -7.375354290008545, -6.657900810241699, -5.9404473304748535, -5.222993850708008, -4.505540370941162, -3.7880868911743164, -3.0706334114074707, -2.353179931640625, -1.6357264518737793, -0.9182729721069336, -0.2008194923400879, 0.5166339874267578, 1.2340874671936035, 1.9515409469604492, 2.668994426727295, 3.3864479064941406, 4.103901386260986, 4.821354866027832, 5.538808345794678, 6.256259918212891, 6.973713397979736, 7.691166877746582, 8.408620834350586, 9.126073837280273, 9.843526840209961, 10.560980796813965, 11.278434753417969, 11.995887756347656, 12.713340759277344, 13.430794715881348, 14.148248672485352, 14.865701675415039, 15.583154678344727, 16.300609588623047, 17.018062591552734, 17.735515594482422, 18.45296859741211, 19.170421600341797, 19.887876510620117, 20.605329513549805, 21.322782516479492, 22.040237426757812, 22.7576904296875, 23.475143432617188, 24.192596435546875, 24.910049438476562, 25.627504348754883, 26.34495735168457, 27.062410354614258, 27.779865264892578, 28.497318267822266, 29.214771270751953]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 8.0, 11.0, 13.0, 21.0, 34.0, 70.0, 80.0, 133.0, 244.0, 470.0, 862.0, 1772.0, 4346.0, 13133.0, 63436.0, 3699084.0, 362857.0, 32721.0, 8552.0, 3266.0, 1472.0, 710.0, 368.0, 187.0, 133.0, 87.0, 57.0, 38.0, 32.0, 16.0, 10.0, 15.0, 3.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7109375, -2.616851806640625, -2.52276611328125, -2.428680419921875, -2.3345947265625, -2.240509033203125, -2.14642333984375, -2.052337646484375, -1.958251953125, -1.864166259765625, -1.77008056640625, -1.675994873046875, -1.5819091796875, -1.487823486328125, -1.39373779296875, -1.299652099609375, -1.20556640625, -1.111480712890625, -1.01739501953125, -0.923309326171875, -0.8292236328125, -0.735137939453125, -0.64105224609375, -0.546966552734375, -0.452880859375, -0.358795166015625, -0.26470947265625, -0.170623779296875, -0.0765380859375, 0.017547607421875, 0.11163330078125, 0.205718994140625, 0.2998046875, 0.393890380859375, 0.48797607421875, 0.582061767578125, 0.6761474609375, 0.770233154296875, 0.86431884765625, 0.958404541015625, 1.052490234375, 1.146575927734375, 1.24066162109375, 1.334747314453125, 1.4288330078125, 1.522918701171875, 1.61700439453125, 1.711090087890625, 1.80517578125, 1.899261474609375, 1.99334716796875, 2.087432861328125, 2.1815185546875, 2.275604248046875, 2.36968994140625, 2.463775634765625, 2.557861328125, 2.651947021484375, 2.74603271484375, 2.840118408203125, 2.9342041015625, 3.028289794921875, 3.12237548828125, 3.216461181640625, 3.310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 9.0, 10.0, 15.0, 17.0, 20.0, 50.0, 51.0, 80.0, 107.0, 121.0, 108.0, 95.0, 79.0, 63.0, 42.0, 30.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2236328125, -0.21726036071777344, -0.21088790893554688, -0.2045154571533203, -0.19814300537109375, -0.1917705535888672, -0.18539810180664062, -0.17902565002441406, -0.1726531982421875, -0.16628074645996094, -0.15990829467773438, -0.1535358428955078, -0.14716339111328125, -0.1407909393310547, -0.13441848754882812, -0.12804603576660156, -0.121673583984375, -0.11530113220214844, -0.10892868041992188, -0.10255622863769531, -0.09618377685546875, -0.08981132507324219, -0.08343887329101562, -0.07706642150878906, -0.0706939697265625, -0.06432151794433594, -0.057949066162109375, -0.05157661437988281, -0.04520416259765625, -0.03883171081542969, -0.032459259033203125, -0.026086807250976562, -0.01971435546875, -0.013341903686523438, -0.006969451904296875, -0.0005970001220703125, 0.00577545166015625, 0.012147903442382812, 0.018520355224609375, 0.024892807006835938, 0.0312652587890625, 0.03763771057128906, 0.044010162353515625, 0.05038261413574219, 0.05675506591796875, 0.06312751770019531, 0.06949996948242188, 0.07587242126464844, 0.082244873046875, 0.08861732482910156, 0.09498977661132812, 0.10136222839355469, 0.10773468017578125, 0.11410713195800781, 0.12047958374023438, 0.12685203552246094, 0.1332244873046875, 0.13959693908691406, 0.14596939086914062, 0.1523418426513672, 0.15871429443359375, 0.1650867462158203, 0.17145919799804688, 0.17783164978027344, 0.1842041015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 22.0, 30.0, 60.0, 61.0, 105.0, 148.0, 221.0, 349.0, 538.0, 884.0, 1496.0, 2677.0, 5025.0, 10376.0, 23179.0, 58548.0, 199921.0, 2850101.0, 830002.0, 131316.0, 43004.0, 18029.0, 8378.0, 4243.0, 2170.0, 1276.0, 779.0, 434.0, 289.0, 180.0, 122.0, 77.0, 62.0, 44.0, 28.0, 17.0, 15.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6639862060546875, -1.608245849609375, -1.5525054931640625, -1.49676513671875, -1.4410247802734375, -1.385284423828125, -1.3295440673828125, -1.2738037109375, -1.2180633544921875, -1.162322998046875, -1.1065826416015625, -1.05084228515625, -0.9951019287109375, -0.939361572265625, -0.8836212158203125, -0.827880859375, -0.7721405029296875, -0.716400146484375, -0.6606597900390625, -0.60491943359375, -0.5491790771484375, -0.493438720703125, -0.4376983642578125, -0.3819580078125, -0.3262176513671875, -0.270477294921875, -0.2147369384765625, -0.15899658203125, -0.1032562255859375, -0.047515869140625, 0.0082244873046875, 0.06396484375, 0.1197052001953125, 0.175445556640625, 0.2311859130859375, 0.28692626953125, 0.3426666259765625, 0.398406982421875, 0.4541473388671875, 0.5098876953125, 0.5656280517578125, 0.621368408203125, 0.6771087646484375, 0.73284912109375, 0.7885894775390625, 0.844329833984375, 0.9000701904296875, 0.955810546875, 1.0115509033203125, 1.067291259765625, 1.1230316162109375, 1.17877197265625, 1.2345123291015625, 1.290252685546875, 1.3459930419921875, 1.4017333984375, 1.4574737548828125, 1.513214111328125, 1.5689544677734375, 1.62469482421875, 1.6804351806640625, 1.736175537109375, 1.7919158935546875, 1.84765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 23.0, 17.0, 32.0, 37.0, 37.0, 75.0, 118.0, 157.0, 300.0, 922.0, 1577.0, 285.0, 178.0, 98.0, 52.0, 41.0, 25.0, 25.0, 16.0, 10.0, 7.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.43161964416503906, -0.4208564758300781, -0.4100933074951172, -0.39933013916015625, -0.3885669708251953, -0.3778038024902344, -0.36704063415527344, -0.3562774658203125, -0.34551429748535156, -0.3347511291503906, -0.3239879608154297, -0.31322479248046875, -0.3024616241455078, -0.2916984558105469, -0.28093528747558594, -0.270172119140625, -0.25940895080566406, -0.24864578247070312, -0.2378826141357422, -0.22711944580078125, -0.2163562774658203, -0.20559310913085938, -0.19482994079589844, -0.1840667724609375, -0.17330360412597656, -0.16254043579101562, -0.1517772674560547, -0.14101409912109375, -0.1302509307861328, -0.11948776245117188, -0.10872459411621094, -0.09796142578125, -0.08719825744628906, -0.07643508911132812, -0.06567192077636719, -0.05490875244140625, -0.04414558410644531, -0.033382415771484375, -0.022619247436523438, -0.0118560791015625, -0.0010929107666015625, 0.009670257568359375, 0.020433425903320312, 0.03119659423828125, 0.04195976257324219, 0.052722930908203125, 0.06348609924316406, 0.074249267578125, 0.08501243591308594, 0.09577560424804688, 0.10653877258300781, 0.11730194091796875, 0.1280651092529297, 0.13882827758789062, 0.14959144592285156, 0.1603546142578125, 0.17111778259277344, 0.18188095092773438, 0.1926441192626953, 0.20340728759765625, 0.2141704559326172, 0.22493362426757812, 0.23569679260253906, 0.2464599609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 8.0, 13.0, 20.0, 50.0, 62.0, 95.0, 138.0, 167.0, 177.0, 97.0, 82.0, 36.0, 25.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0077247619628906, -2.92850923538208, -2.8492939472198486, -2.770078659057617, -2.6908631324768066, -2.611647605895996, -2.5324323177337646, -2.453217029571533, -2.3740015029907227, -2.294785976409912, -2.2155706882476807, -2.136355400085449, -2.0571398735046387, -1.9779244661331177, -1.8987090587615967, -1.8194936513900757, -1.7402782440185547, -1.6610628366470337, -1.5818474292755127, -1.5026320219039917, -1.4234166145324707, -1.3442012071609497, -1.2649857997894287, -1.1857703924179077, -1.1065549850463867, -1.0273395776748657, -0.9481241703033447, -0.8689087629318237, -0.7896933555603027, -0.7104779481887817, -0.6312625408172607, -0.5520471334457397, -0.47283172607421875, -0.39361631870269775, -0.31440091133117676, -0.23518550395965576, -0.15597009658813477, -0.07675468921661377, 0.0024607181549072266, 0.08167612552642822, 0.16089153289794922, 0.24010694026947021, 0.3193223476409912, 0.3985377550125122, 0.4777531623840332, 0.5569685697555542, 0.6361839771270752, 0.7153993844985962, 0.7946147918701172, 0.8738301992416382, 0.9530456066131592, 1.0322610139846802, 1.1114764213562012, 1.1906918287277222, 1.2699072360992432, 1.3491226434707642, 1.4283380508422852, 1.5075534582138062, 1.5867688655853271, 1.6659842729568481, 1.7451996803283691, 1.8244150876998901, 1.9036304950714111, 1.9828459024429321, 2.062061309814453]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 6.0, 5.0, 11.0, 16.0, 15.0, 24.0, 19.0, 36.0, 36.0, 38.0, 51.0, 48.0, 58.0, 71.0, 47.0, 59.0, 53.0, 45.0, 52.0, 44.0, 44.0, 32.0, 38.0, 22.0, 29.0, 13.0, 15.0, 8.0, 17.0, 5.0, 4.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1543371677398682, -1.1169861555099487, -1.0796351432800293, -1.0422840118408203, -1.0049329996109009, -0.9675819873809814, -0.9302309155464172, -0.892879843711853, -0.8555288314819336, -0.8181778192520142, -0.78082674741745, -0.7434756755828857, -0.7061246633529663, -0.6687736511230469, -0.6314225792884827, -0.5940715074539185, -0.556720495223999, -0.5193694829940796, -0.4820184111595154, -0.44466736912727356, -0.40731632709503174, -0.3699652850627899, -0.3326142430305481, -0.2952632009983063, -0.25791215896606445, -0.22056111693382263, -0.1832100749015808, -0.145859032869339, -0.10850799083709717, -0.07115694880485535, -0.033805906772613525, 0.003545135259628296, 0.040896058082580566, 0.07824710011482239, 0.11559814214706421, 0.15294918417930603, 0.19030022621154785, 0.22765126824378967, 0.2650023102760315, 0.3023533523082733, 0.33970439434051514, 0.37705543637275696, 0.4144064784049988, 0.4517575204372406, 0.4891085624694824, 0.5264595746994019, 0.5638106465339661, 0.6011617183685303, 0.6385127305984497, 0.6758637428283691, 0.7132148146629333, 0.7505658864974976, 0.787916898727417, 0.8252679109573364, 0.8626189827919006, 0.8999700546264648, 0.9373210668563843, 0.9746720790863037, 1.0120232105255127, 1.0493742227554321, 1.0867252349853516, 1.124076247215271, 1.1614272594451904, 1.1987783908843994, 1.2361294031143188]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 12.0, 23.0, 26.0, 42.0, 65.0, 89.0, 111.0, 184.0, 292.0, 458.0, 836.0, 1430.0, 2553.0, 4835.0, 9489.0, 20818.0, 50557.0, 142291.0, 340486.0, 291306.0, 109212.0, 39293.0, 16816.0, 7924.0, 3937.0, 2183.0, 1264.0, 691.0, 471.0, 292.0, 176.0, 122.0, 74.0, 49.0, 37.0, 27.0, 20.0, 14.0, 11.0, 5.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0939483642578125, -1.056060791015625, -1.0181732177734375, -0.98028564453125, -0.9423980712890625, -0.904510498046875, -0.8666229248046875, -0.8287353515625, -0.7908477783203125, -0.752960205078125, -0.7150726318359375, -0.67718505859375, -0.6392974853515625, -0.601409912109375, -0.5635223388671875, -0.525634765625, -0.4877471923828125, -0.449859619140625, -0.4119720458984375, -0.37408447265625, -0.3361968994140625, -0.298309326171875, -0.2604217529296875, -0.2225341796875, -0.1846466064453125, -0.146759033203125, -0.1088714599609375, -0.07098388671875, -0.0330963134765625, 0.004791259765625, 0.0426788330078125, 0.08056640625, 0.1184539794921875, 0.156341552734375, 0.1942291259765625, 0.23211669921875, 0.2700042724609375, 0.307891845703125, 0.3457794189453125, 0.3836669921875, 0.4215545654296875, 0.459442138671875, 0.4973297119140625, 0.53521728515625, 0.5731048583984375, 0.610992431640625, 0.6488800048828125, 0.686767578125, 0.7246551513671875, 0.762542724609375, 0.8004302978515625, 0.83831787109375, 0.8762054443359375, 0.914093017578125, 0.9519805908203125, 0.9898681640625, 1.0277557373046875, 1.065643310546875, 1.1035308837890625, 1.14141845703125, 1.1793060302734375, 1.217193603515625, 1.2550811767578125, 1.29296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 8.0, 31.0, 34.0, 49.0, 64.0, 92.0, 92.0, 109.0, 104.0, 83.0, 60.0, 52.0, 57.0, 29.0, 23.0, 9.0, 16.0, 8.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2281494140625, -0.22223663330078125, -0.2163238525390625, -0.21041107177734375, -0.204498291015625, -0.19858551025390625, -0.1926727294921875, -0.18675994873046875, -0.18084716796875, -0.17493438720703125, -0.1690216064453125, -0.16310882568359375, -0.157196044921875, -0.15128326416015625, -0.1453704833984375, -0.13945770263671875, -0.133544921875, -0.12763214111328125, -0.1217193603515625, -0.11580657958984375, -0.109893798828125, -0.10398101806640625, -0.0980682373046875, -0.09215545654296875, -0.08624267578125, -0.08032989501953125, -0.0744171142578125, -0.06850433349609375, -0.062591552734375, -0.05667877197265625, -0.0507659912109375, -0.04485321044921875, -0.0389404296875, -0.03302764892578125, -0.0271148681640625, -0.02120208740234375, -0.015289306640625, -0.00937652587890625, -0.0034637451171875, 0.00244903564453125, 0.00836181640625, 0.01427459716796875, 0.0201873779296875, 0.02610015869140625, 0.032012939453125, 0.03792572021484375, 0.0438385009765625, 0.04975128173828125, 0.0556640625, 0.06157684326171875, 0.0674896240234375, 0.07340240478515625, 0.079315185546875, 0.08522796630859375, 0.0911407470703125, 0.09705352783203125, 0.10296630859375, 0.10887908935546875, 0.1147918701171875, 0.12070465087890625, 0.126617431640625, 0.13253021240234375, 0.1384429931640625, 0.14435577392578125, 0.1502685546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 22.0, 18.0, 42.0, 61.0, 82.0, 131.0, 206.0, 313.0, 575.0, 813.0, 1450.0, 2490.0, 4326.0, 7764.0, 14812.0, 29618.0, 60416.0, 121799.0, 215829.0, 251743.0, 166475.0, 84690.0, 40642.0, 20190.0, 10496.0, 5613.0, 3133.0, 1818.0, 1101.0, 641.0, 448.0, 262.0, 168.0, 114.0, 66.0, 41.0, 30.0, 40.0, 16.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.622650146484375, -0.59979248046875, -0.576934814453125, -0.5540771484375, -0.531219482421875, -0.50836181640625, -0.485504150390625, -0.462646484375, -0.439788818359375, -0.41693115234375, -0.394073486328125, -0.3712158203125, -0.348358154296875, -0.32550048828125, -0.302642822265625, -0.27978515625, -0.256927490234375, -0.23406982421875, -0.211212158203125, -0.1883544921875, -0.165496826171875, -0.14263916015625, -0.119781494140625, -0.096923828125, -0.074066162109375, -0.05120849609375, -0.028350830078125, -0.0054931640625, 0.017364501953125, 0.04022216796875, 0.063079833984375, 0.0859375, 0.108795166015625, 0.13165283203125, 0.154510498046875, 0.1773681640625, 0.200225830078125, 0.22308349609375, 0.245941162109375, 0.268798828125, 0.291656494140625, 0.31451416015625, 0.337371826171875, 0.3602294921875, 0.383087158203125, 0.40594482421875, 0.428802490234375, 0.45166015625, 0.474517822265625, 0.49737548828125, 0.520233154296875, 0.5430908203125, 0.565948486328125, 0.58880615234375, 0.611663818359375, 0.634521484375, 0.657379150390625, 0.68023681640625, 0.703094482421875, 0.7259521484375, 0.748809814453125, 0.77166748046875, 0.794525146484375, 0.8173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 14.0, 6.0, 11.0, 14.0, 10.0, 15.0, 17.0, 21.0, 29.0, 43.0, 36.0, 43.0, 39.0, 37.0, 40.0, 47.0, 64.0, 52.0, 48.0, 48.0, 53.0, 38.0, 39.0, 48.0, 37.0, 28.0, 32.0, 20.0, 18.0, 15.0, 12.0, 3.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.57342529296875, -0.5516357421875, -0.52984619140625, -0.508056640625, -0.48626708984375, -0.4644775390625, -0.44268798828125, -0.4208984375, -0.39910888671875, -0.3773193359375, -0.35552978515625, -0.333740234375, -0.31195068359375, -0.2901611328125, -0.26837158203125, -0.24658203125, -0.22479248046875, -0.2030029296875, -0.18121337890625, -0.159423828125, -0.13763427734375, -0.1158447265625, -0.09405517578125, -0.072265625, -0.05047607421875, -0.0286865234375, -0.00689697265625, 0.014892578125, 0.03668212890625, 0.0584716796875, 0.08026123046875, 0.10205078125, 0.12384033203125, 0.1456298828125, 0.16741943359375, 0.189208984375, 0.21099853515625, 0.2327880859375, 0.25457763671875, 0.2763671875, 0.29815673828125, 0.3199462890625, 0.34173583984375, 0.363525390625, 0.38531494140625, 0.4071044921875, 0.42889404296875, 0.45068359375, 0.47247314453125, 0.4942626953125, 0.51605224609375, 0.537841796875, 0.55963134765625, 0.5814208984375, 0.60321044921875, 0.625, 0.64678955078125, 0.6685791015625, 0.69036865234375, 0.712158203125, 0.73394775390625, 0.7557373046875, 0.77752685546875, 0.79931640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 15.0, 21.0, 32.0, 31.0, 42.0, 62.0, 87.0, 169.0, 215.0, 342.0, 608.0, 1082.0, 2316.0, 4904.0, 12765.0, 42012.0, 188267.0, 534420.0, 194420.0, 43301.0, 13204.0, 5002.0, 2353.0, 1174.0, 646.0, 332.0, 246.0, 145.0, 97.0, 69.0, 35.0, 43.0, 16.0, 20.0, 14.0, 5.0, 6.0, 2.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7614593505859375, -1.699676513671875, -1.6378936767578125, -1.57611083984375, -1.5143280029296875, -1.452545166015625, -1.3907623291015625, -1.3289794921875, -1.2671966552734375, -1.205413818359375, -1.1436309814453125, -1.08184814453125, -1.0200653076171875, -0.958282470703125, -0.8964996337890625, -0.834716796875, -0.7729339599609375, -0.711151123046875, -0.6493682861328125, -0.58758544921875, -0.5258026123046875, -0.464019775390625, -0.4022369384765625, -0.3404541015625, -0.2786712646484375, -0.216888427734375, -0.1551055908203125, -0.09332275390625, -0.0315399169921875, 0.030242919921875, 0.0920257568359375, 0.15380859375, 0.2155914306640625, 0.277374267578125, 0.3391571044921875, 0.40093994140625, 0.4627227783203125, 0.524505615234375, 0.5862884521484375, 0.6480712890625, 0.7098541259765625, 0.771636962890625, 0.8334197998046875, 0.89520263671875, 0.9569854736328125, 1.018768310546875, 1.0805511474609375, 1.142333984375, 1.2041168212890625, 1.265899658203125, 1.3276824951171875, 1.38946533203125, 1.4512481689453125, 1.513031005859375, 1.5748138427734375, 1.6365966796875, 1.6983795166015625, 1.760162353515625, 1.8219451904296875, 1.88372802734375, 1.9455108642578125, 2.007293701171875, 2.0690765380859375, 2.130859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 10.0, 23.0, 12.0, 35.0, 46.0, 75.0, 92.0, 96.0, 139.0, 113.0, 114.0, 64.0, 62.0, 28.0, 34.0, 22.0, 13.0, 12.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003039836883544922, -0.0002952590584754944, -0.0002865344285964966, -0.0002778097987174988, -0.000269085168838501, -0.0002603605389595032, -0.00025163590908050537, -0.00024291127920150757, -0.00023418664932250977, -0.00022546201944351196, -0.00021673738956451416, -0.00020801275968551636, -0.00019928812980651855, -0.00019056349992752075, -0.00018183887004852295, -0.00017311424016952515, -0.00016438961029052734, -0.00015566498041152954, -0.00014694035053253174, -0.00013821572065353394, -0.00012949109077453613, -0.00012076646089553833, -0.00011204183101654053, -0.00010331720113754272, -9.459257125854492e-05, -8.586794137954712e-05, -7.714331150054932e-05, -6.841868162155151e-05, -5.969405174255371e-05, -5.096942186355591e-05, -4.2244791984558105e-05, -3.35201621055603e-05, -2.47955322265625e-05, -1.6070902347564697e-05, -7.3462724685668945e-06, 1.3783574104309082e-06, 1.0102987289428711e-05, 1.8827617168426514e-05, 2.7552247047424316e-05, 3.627687692642212e-05, 4.500150680541992e-05, 5.3726136684417725e-05, 6.245076656341553e-05, 7.117539644241333e-05, 7.990002632141113e-05, 8.862465620040894e-05, 9.734928607940674e-05, 0.00010607391595840454, 0.00011479854583740234, 0.00012352317571640015, 0.00013224780559539795, 0.00014097243547439575, 0.00014969706535339355, 0.00015842169523239136, 0.00016714632511138916, 0.00017587095499038696, 0.00018459558486938477, 0.00019332021474838257, 0.00020204484462738037, 0.00021076947450637817, 0.00021949410438537598, 0.00022821873426437378, 0.00023694336414337158, 0.0002456679940223694, 0.0002543926239013672]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 10.0, 15.0, 11.0, 23.0, 27.0, 51.0, 68.0, 96.0, 162.0, 228.0, 406.0, 587.0, 976.0, 1801.0, 3465.0, 6727.0, 14791.0, 35825.0, 102464.0, 286168.0, 355432.0, 149761.0, 50495.0, 19989.0, 8859.0, 4342.0, 2364.0, 1322.0, 730.0, 475.0, 316.0, 186.0, 121.0, 92.0, 47.0, 40.0, 17.0, 21.0, 18.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.030120849609375, -0.99481201171875, -0.959503173828125, -0.9241943359375, -0.888885498046875, -0.85357666015625, -0.818267822265625, -0.782958984375, -0.747650146484375, -0.71234130859375, -0.677032470703125, -0.6417236328125, -0.606414794921875, -0.57110595703125, -0.535797119140625, -0.50048828125, -0.465179443359375, -0.42987060546875, -0.394561767578125, -0.3592529296875, -0.323944091796875, -0.28863525390625, -0.253326416015625, -0.218017578125, -0.182708740234375, -0.14739990234375, -0.112091064453125, -0.0767822265625, -0.041473388671875, -0.00616455078125, 0.029144287109375, 0.064453125, 0.099761962890625, 0.13507080078125, 0.170379638671875, 0.2056884765625, 0.240997314453125, 0.27630615234375, 0.311614990234375, 0.346923828125, 0.382232666015625, 0.41754150390625, 0.452850341796875, 0.4881591796875, 0.523468017578125, 0.55877685546875, 0.594085693359375, 0.62939453125, 0.664703369140625, 0.70001220703125, 0.735321044921875, 0.7706298828125, 0.805938720703125, 0.84124755859375, 0.876556396484375, 0.911865234375, 0.947174072265625, 0.98248291015625, 1.017791748046875, 1.0531005859375, 1.088409423828125, 1.12371826171875, 1.159027099609375, 1.1943359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 7.0, 16.0, 13.0, 14.0, 13.0, 37.0, 43.0, 44.0, 47.0, 45.0, 66.0, 58.0, 48.0, 66.0, 64.0, 54.0, 48.0, 41.0, 34.0, 35.0, 40.0, 30.0, 19.0, 20.0, 18.0, 11.0, 8.0, 6.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5383148193359375, -0.519500732421875, -0.5006866455078125, -0.48187255859375, -0.4630584716796875, -0.444244384765625, -0.4254302978515625, -0.4066162109375, -0.3878021240234375, -0.368988037109375, -0.3501739501953125, -0.33135986328125, -0.3125457763671875, -0.293731689453125, -0.2749176025390625, -0.256103515625, -0.2372894287109375, -0.218475341796875, -0.1996612548828125, -0.18084716796875, -0.1620330810546875, -0.143218994140625, -0.1244049072265625, -0.1055908203125, -0.0867767333984375, -0.067962646484375, -0.0491485595703125, -0.03033447265625, -0.0115203857421875, 0.007293701171875, 0.0261077880859375, 0.044921875, 0.0637359619140625, 0.082550048828125, 0.1013641357421875, 0.12017822265625, 0.1389923095703125, 0.157806396484375, 0.1766204833984375, 0.1954345703125, 0.2142486572265625, 0.233062744140625, 0.2518768310546875, 0.27069091796875, 0.2895050048828125, 0.308319091796875, 0.3271331787109375, 0.345947265625, 0.3647613525390625, 0.383575439453125, 0.4023895263671875, 0.42120361328125, 0.4400177001953125, 0.458831787109375, 0.4776458740234375, 0.4964599609375, 0.5152740478515625, 0.534088134765625, 0.5529022216796875, 0.57171630859375, 0.5905303955078125, 0.609344482421875, 0.6281585693359375, 0.64697265625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 16.0, 48.0, 141.0, 275.0, 249.0, 146.0, 56.0, 26.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.348570823669434, -14.780890464782715, -14.213211059570312, -13.645530700683594, -13.077851295471191, -12.510170936584473, -11.94249153137207, -11.374811172485352, -10.807130813598633, -10.239450454711914, -9.671771049499512, -9.104090690612793, -8.53641128540039, -7.968730926513672, -7.401051044464111, -6.833371162414551, -6.265691757202148, -5.698011875152588, -5.130331993103027, -4.562651634216309, -3.994971990585327, -3.4272921085357666, -2.859611988067627, -2.2919321060180664, -1.7242522239685059, -1.1565723419189453, -0.5888923406600952, -0.021212339401245117, 0.5464675426483154, 1.114147424697876, 1.6818275451660156, 2.249507427215576, 2.817188262939453, 3.3848681449890137, 3.952548027038574, 4.520228385925293, 5.087907791137695, 5.655588150024414, 6.223268032073975, 6.790947914123535, 7.358627796173096, 7.926307678222656, 8.493988037109375, 9.061667442321777, 9.629347801208496, 10.197027206420898, 10.764707565307617, 11.332387924194336, 11.900067329406738, 12.467747688293457, 13.03542709350586, 13.603107452392578, 14.17078685760498, 14.7384672164917, 15.306146621704102, 15.87382698059082, 16.44150733947754, 17.009187698364258, 17.576868057250977, 18.144546508789062, 18.71222686767578, 19.2799072265625, 19.84758758544922, 20.415267944335938, 20.982946395874023]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 5.0, 5.0, 13.0, 14.0, 20.0, 26.0, 33.0, 50.0, 65.0, 64.0, 80.0, 97.0, 94.0, 74.0, 90.0, 62.0, 53.0, 37.0, 34.0, 16.0, 19.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.967996120452881, -7.727425575256348, -7.486854553222656, -7.246284008026123, -7.00571346282959, -6.765142440795898, -6.524571895599365, -6.284001350402832, -6.043430328369141, -5.802859783172607, -5.562288761138916, -5.321718215942383, -5.08114767074585, -4.840577125549316, -4.600006103515625, -4.359435558319092, -4.118865013122559, -3.8782942295074463, -3.637723684310913, -3.397152900695801, -3.1565823554992676, -2.9160115718841553, -2.675440788269043, -2.4348702430725098, -2.1942994594573975, -1.9537287950515747, -1.713158130645752, -1.4725873470306396, -1.232016682624817, -0.9914460182189941, -0.7508752346038818, -0.5103045701980591, -0.2697334289550781, -0.029162734746932983, 0.21140795946121216, 0.4519786834716797, 0.6925493478775024, 0.9331200122833252, 1.1736907958984375, 1.4142614603042603, 1.654832124710083, 1.8954027891159058, 2.1359734535217285, 2.376544237136841, 2.617115020751953, 2.8576855659484863, 3.0982563495635986, 3.338827133178711, 3.579397678375244, 3.8199684619903564, 4.060539245605469, 4.301109790802002, 4.541680335998535, 4.782251358032227, 5.02282190322876, 5.263392448425293, 5.503963470458984, 5.744534015655518, 5.985105037689209, 6.225675582885742, 6.466246128082275, 6.706816673278809, 6.9473876953125, 7.187958240509033, 7.428528785705566]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 33.0, 35.0, 58.0, 103.0, 154.0, 265.0, 470.0, 977.0, 2041.0, 5219.0, 17439.0, 93870.0, 3687606.0, 336086.0, 35126.0, 8715.0, 3115.0, 1362.0, 698.0, 345.0, 171.0, 111.0, 82.0, 55.0, 23.0, 20.0, 11.0, 14.0, 15.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.664031982421875, -2.56439208984375, -2.464752197265625, -2.3651123046875, -2.265472412109375, -2.16583251953125, -2.066192626953125, -1.966552734375, -1.866912841796875, -1.76727294921875, -1.667633056640625, -1.5679931640625, -1.468353271484375, -1.36871337890625, -1.269073486328125, -1.16943359375, -1.069793701171875, -0.97015380859375, -0.870513916015625, -0.7708740234375, -0.671234130859375, -0.57159423828125, -0.471954345703125, -0.372314453125, -0.272674560546875, -0.17303466796875, -0.073394775390625, 0.0262451171875, 0.125885009765625, 0.22552490234375, 0.325164794921875, 0.4248046875, 0.524444580078125, 0.62408447265625, 0.723724365234375, 0.8233642578125, 0.923004150390625, 1.02264404296875, 1.122283935546875, 1.221923828125, 1.321563720703125, 1.42120361328125, 1.520843505859375, 1.6204833984375, 1.720123291015625, 1.81976318359375, 1.919403076171875, 2.01904296875, 2.118682861328125, 2.21832275390625, 2.317962646484375, 2.4176025390625, 2.517242431640625, 2.61688232421875, 2.716522216796875, 2.816162109375, 2.915802001953125, 3.01544189453125, 3.115081787109375, 3.2147216796875, 3.314361572265625, 3.41400146484375, 3.513641357421875, 3.61328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 10.0, 14.0, 27.0, 43.0, 63.0, 69.0, 89.0, 105.0, 114.0, 98.0, 86.0, 75.0, 51.0, 45.0, 23.0, 11.0, 17.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2812824249267578, -0.2744789123535156, -0.26767539978027344, -0.26087188720703125, -0.25406837463378906, -0.24726486206054688, -0.2404613494873047, -0.2336578369140625, -0.2268543243408203, -0.22005081176757812, -0.21324729919433594, -0.20644378662109375, -0.19964027404785156, -0.19283676147460938, -0.1860332489013672, -0.179229736328125, -0.1724262237548828, -0.16562271118164062, -0.15881919860839844, -0.15201568603515625, -0.14521217346191406, -0.13840866088867188, -0.1316051483154297, -0.1248016357421875, -0.11799812316894531, -0.11119461059570312, -0.10439109802246094, -0.09758758544921875, -0.09078407287597656, -0.08398056030273438, -0.07717704772949219, -0.07037353515625, -0.06357002258300781, -0.056766510009765625, -0.04996299743652344, -0.04315948486328125, -0.03635597229003906, -0.029552459716796875, -0.022748947143554688, -0.0159454345703125, -0.009141921997070312, -0.002338409423828125, 0.0044651031494140625, 0.01126861572265625, 0.018072128295898438, 0.024875640869140625, 0.03167915344238281, 0.038482666015625, 0.04528617858886719, 0.052089691162109375, 0.05889320373535156, 0.06569671630859375, 0.07250022888183594, 0.07930374145507812, 0.08610725402832031, 0.0929107666015625, 0.09971427917480469, 0.10651779174804688, 0.11332130432128906, 0.12012481689453125, 0.12692832946777344, 0.13373184204101562, 0.1405353546142578, 0.1473388671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 12.0, 9.0, 17.0, 38.0, 50.0, 82.0, 182.0, 376.0, 990.0, 2679.0, 9141.0, 38751.0, 308880.0, 3593187.0, 198950.0, 29438.0, 7610.0, 2347.0, 812.0, 344.0, 140.0, 88.0, 54.0, 29.0, 23.0, 20.0, 7.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.786834716796875, -2.67718505859375, -2.567535400390625, -2.4578857421875, -2.348236083984375, -2.23858642578125, -2.128936767578125, -2.019287109375, -1.909637451171875, -1.79998779296875, -1.690338134765625, -1.5806884765625, -1.471038818359375, -1.36138916015625, -1.251739501953125, -1.14208984375, -1.032440185546875, -0.92279052734375, -0.813140869140625, -0.7034912109375, -0.593841552734375, -0.48419189453125, -0.374542236328125, -0.264892578125, -0.155242919921875, -0.04559326171875, 0.064056396484375, 0.1737060546875, 0.283355712890625, 0.39300537109375, 0.502655029296875, 0.6123046875, 0.721954345703125, 0.83160400390625, 0.941253662109375, 1.0509033203125, 1.160552978515625, 1.27020263671875, 1.379852294921875, 1.489501953125, 1.599151611328125, 1.70880126953125, 1.818450927734375, 1.9281005859375, 2.037750244140625, 2.14739990234375, 2.257049560546875, 2.36669921875, 2.476348876953125, 2.58599853515625, 2.695648193359375, 2.8052978515625, 2.914947509765625, 3.02459716796875, 3.134246826171875, 3.243896484375, 3.353546142578125, 3.46319580078125, 3.572845458984375, 3.6824951171875, 3.792144775390625, 3.90179443359375, 4.011444091796875, 4.12109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 3.0, 4.0, 15.0, 15.0, 25.0, 22.0, 35.0, 49.0, 79.0, 117.0, 209.0, 340.0, 809.0, 1414.0, 375.0, 153.0, 125.0, 85.0, 60.0, 42.0, 21.0, 14.0, 15.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.438232421875, -0.426422119140625, -0.41461181640625, -0.402801513671875, -0.3909912109375, -0.379180908203125, -0.36737060546875, -0.355560302734375, -0.34375, -0.331939697265625, -0.32012939453125, -0.308319091796875, -0.2965087890625, -0.284698486328125, -0.27288818359375, -0.261077880859375, -0.249267578125, -0.237457275390625, -0.22564697265625, -0.213836669921875, -0.2020263671875, -0.190216064453125, -0.17840576171875, -0.166595458984375, -0.15478515625, -0.142974853515625, -0.13116455078125, -0.119354248046875, -0.1075439453125, -0.095733642578125, -0.08392333984375, -0.072113037109375, -0.060302734375, -0.048492431640625, -0.03668212890625, -0.024871826171875, -0.0130615234375, -0.001251220703125, 0.01055908203125, 0.022369384765625, 0.0341796875, 0.045989990234375, 0.05780029296875, 0.069610595703125, 0.0814208984375, 0.093231201171875, 0.10504150390625, 0.116851806640625, 0.128662109375, 0.140472412109375, 0.15228271484375, 0.164093017578125, 0.1759033203125, 0.187713623046875, 0.19952392578125, 0.211334228515625, 0.22314453125, 0.234954833984375, 0.24676513671875, 0.258575439453125, 0.2703857421875, 0.282196044921875, 0.29400634765625, 0.305816650390625, 0.317626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 17.0, 24.0, 35.0, 70.0, 122.0, 158.0, 186.0, 140.0, 103.0, 56.0, 29.0, 26.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874171495437622, -3.7760050296783447, -3.6778385639190674, -3.57967209815979, -3.4815056324005127, -3.3833391666412354, -3.285172939300537, -3.1870064735412598, -3.0888400077819824, -2.990673542022705, -2.8925070762634277, -2.7943406105041504, -2.696174144744873, -2.5980076789855957, -2.4998412132263184, -2.401674747467041, -2.3035082817077637, -2.2053418159484863, -2.107175350189209, -2.0090088844299316, -1.9108424186706543, -1.812675952911377, -1.7145096063613892, -1.6163431406021118, -1.5181766748428345, -1.4200102090835571, -1.3218437433242798, -1.223677396774292, -1.1255109310150146, -1.0273444652557373, -0.92917799949646, -0.8310115337371826, -0.7328448295593262, -0.6346783638000488, -0.5365118980407715, -0.4383454918861389, -0.3401790261268616, -0.24201256036758423, -0.14384615421295166, -0.045679688453674316, 0.05248677730560303, 0.15065322816371918, 0.24881967902183533, 0.3469861149787903, 0.4451525807380676, 0.543319046497345, 0.6414854526519775, 0.7396519184112549, 0.8378183841705322, 0.9359848499298096, 1.034151315689087, 1.1323177814483643, 1.2304842472076416, 1.328650712966919, 1.4268170595169067, 1.524983525276184, 1.6231499910354614, 1.7213164567947388, 1.8194829225540161, 1.917649269104004, 2.0158157348632812, 2.1139822006225586, 2.212148666381836, 2.3103151321411133, 2.4084815979003906]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 1.0, 6.0, 2.0, 12.0, 10.0, 13.0, 13.0, 21.0, 24.0, 27.0, 37.0, 32.0, 26.0, 49.0, 50.0, 46.0, 57.0, 63.0, 56.0, 53.0, 43.0, 41.0, 38.0, 40.0, 35.0, 40.0, 31.0, 23.0, 19.0, 13.0, 17.0, 12.0, 8.0, 5.0, 8.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.244240164756775, -1.2038975954055786, -1.1635550260543823, -1.123212456703186, -1.0828698873519897, -1.0425273180007935, -1.0021847486495972, -0.9618421196937561, -0.9214995503425598, -0.8811569809913635, -0.8408144116401672, -0.800471842288971, -0.7601292133331299, -0.7197866439819336, -0.6794440746307373, -0.639101505279541, -0.5987589359283447, -0.5584163665771484, -0.5180737972259521, -0.47773119807243347, -0.4373886287212372, -0.3970460593700409, -0.3567034602165222, -0.3163608908653259, -0.27601832151412964, -0.23567575216293335, -0.19533316791057587, -0.15499058365821838, -0.1146480143070221, -0.0743054449558258, -0.03396286070346832, 0.00637972354888916, 0.0467221736907959, 0.08706475049257278, 0.12740732729434967, 0.16774991154670715, 0.20809248089790344, 0.24843505024909973, 0.2887776494026184, 0.3291202187538147, 0.369462788105011, 0.4098053574562073, 0.45014792680740356, 0.49049052596092224, 0.5308331251144409, 0.5711756944656372, 0.6115182638168335, 0.6518608331680298, 0.6922034025192261, 0.7325459718704224, 0.7728885412216187, 0.8132311105728149, 0.8535736799240112, 0.8939162492752075, 0.9342588782310486, 0.9746014475822449, 1.014944076538086, 1.0552866458892822, 1.0956292152404785, 1.1359717845916748, 1.176314353942871, 1.2166569232940674, 1.2569994926452637, 1.29734206199646, 1.3376846313476562]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 10.0, 17.0, 19.0, 21.0, 53.0, 67.0, 101.0, 190.0, 361.0, 668.0, 1462.0, 3100.0, 8025.0, 24809.0, 90365.0, 315545.0, 407902.0, 139827.0, 36771.0, 11261.0, 4186.0, 1835.0, 881.0, 431.0, 249.0, 129.0, 81.0, 60.0, 33.0, 19.0, 19.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.687225341796875, -1.63128662109375, -1.575347900390625, -1.5194091796875, -1.463470458984375, -1.40753173828125, -1.351593017578125, -1.295654296875, -1.239715576171875, -1.18377685546875, -1.127838134765625, -1.0718994140625, -1.015960693359375, -0.96002197265625, -0.904083251953125, -0.84814453125, -0.792205810546875, -0.73626708984375, -0.680328369140625, -0.6243896484375, -0.568450927734375, -0.51251220703125, -0.456573486328125, -0.400634765625, -0.344696044921875, -0.28875732421875, -0.232818603515625, -0.1768798828125, -0.120941162109375, -0.06500244140625, -0.009063720703125, 0.046875, 0.102813720703125, 0.15875244140625, 0.214691162109375, 0.2706298828125, 0.326568603515625, 0.38250732421875, 0.438446044921875, 0.494384765625, 0.550323486328125, 0.60626220703125, 0.662200927734375, 0.7181396484375, 0.774078369140625, 0.83001708984375, 0.885955810546875, 0.94189453125, 0.997833251953125, 1.05377197265625, 1.109710693359375, 1.1656494140625, 1.221588134765625, 1.27752685546875, 1.333465576171875, 1.389404296875, 1.445343017578125, 1.50128173828125, 1.557220458984375, 1.6131591796875, 1.669097900390625, 1.72503662109375, 1.780975341796875, 1.8369140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 8.0, 2.0, 11.0, 16.0, 24.0, 34.0, 52.0, 60.0, 93.0, 86.0, 116.0, 98.0, 106.0, 81.0, 63.0, 45.0, 42.0, 23.0, 15.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.314453125, -0.30727577209472656, -0.3000984191894531, -0.2929210662841797, -0.28574371337890625, -0.2785663604736328, -0.2713890075683594, -0.26421165466308594, -0.2570343017578125, -0.24985694885253906, -0.24267959594726562, -0.2355022430419922, -0.22832489013671875, -0.2211475372314453, -0.21397018432617188, -0.20679283142089844, -0.199615478515625, -0.19243812561035156, -0.18526077270507812, -0.1780834197998047, -0.17090606689453125, -0.1637287139892578, -0.15655136108398438, -0.14937400817871094, -0.1421966552734375, -0.13501930236816406, -0.12784194946289062, -0.12066459655761719, -0.11348724365234375, -0.10630989074707031, -0.09913253784179688, -0.09195518493652344, -0.08477783203125, -0.07760047912597656, -0.07042312622070312, -0.06324577331542969, -0.05606842041015625, -0.04889106750488281, -0.041713714599609375, -0.03453636169433594, -0.0273590087890625, -0.020181655883789062, -0.013004302978515625, -0.0058269500732421875, 0.00135040283203125, 0.008527755737304688, 0.015705108642578125, 0.022882461547851562, 0.030059814453125, 0.03723716735839844, 0.044414520263671875, 0.05159187316894531, 0.05876922607421875, 0.06594657897949219, 0.07312393188476562, 0.08030128479003906, 0.0874786376953125, 0.09465599060058594, 0.10183334350585938, 0.10901069641113281, 0.11618804931640625, 0.12336540222167969, 0.13054275512695312, 0.13772010803222656, 0.1448974609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 17.0, 24.0, 20.0, 31.0, 43.0, 63.0, 85.0, 110.0, 179.0, 232.0, 352.0, 487.0, 825.0, 1179.0, 1966.0, 3233.0, 6128.0, 12271.0, 26091.0, 56896.0, 120543.0, 217341.0, 257275.0, 174331.0, 88369.0, 40903.0, 18921.0, 8970.0, 4624.0, 2582.0, 1444.0, 943.0, 599.0, 445.0, 326.0, 200.0, 146.0, 94.0, 69.0, 50.0, 36.0, 36.0, 17.0, 18.0, 8.0, 6.0, 4.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.017578125, -0.983978271484375, -0.95037841796875, -0.916778564453125, -0.8831787109375, -0.849578857421875, -0.81597900390625, -0.782379150390625, -0.748779296875, -0.715179443359375, -0.68157958984375, -0.647979736328125, -0.6143798828125, -0.580780029296875, -0.54718017578125, -0.513580322265625, -0.47998046875, -0.446380615234375, -0.41278076171875, -0.379180908203125, -0.3455810546875, -0.311981201171875, -0.27838134765625, -0.244781494140625, -0.211181640625, -0.177581787109375, -0.14398193359375, -0.110382080078125, -0.0767822265625, -0.043182373046875, -0.00958251953125, 0.024017333984375, 0.0576171875, 0.091217041015625, 0.12481689453125, 0.158416748046875, 0.1920166015625, 0.225616455078125, 0.25921630859375, 0.292816162109375, 0.326416015625, 0.360015869140625, 0.39361572265625, 0.427215576171875, 0.4608154296875, 0.494415283203125, 0.52801513671875, 0.561614990234375, 0.59521484375, 0.628814697265625, 0.66241455078125, 0.696014404296875, 0.7296142578125, 0.763214111328125, 0.79681396484375, 0.830413818359375, 0.864013671875, 0.897613525390625, 0.93121337890625, 0.964813232421875, 0.9984130859375, 1.032012939453125, 1.06561279296875, 1.099212646484375, 1.1328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 10.0, 13.0, 21.0, 12.0, 14.0, 24.0, 30.0, 29.0, 45.0, 29.0, 34.0, 46.0, 46.0, 50.0, 51.0, 50.0, 47.0, 49.0, 49.0, 57.0, 56.0, 32.0, 34.0, 27.0, 20.0, 26.0, 17.0, 13.0, 11.0, 12.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8062210083007812, -0.7769927978515625, -0.7477645874023438, -0.718536376953125, -0.6893081665039062, -0.6600799560546875, -0.6308517456054688, -0.60162353515625, -0.5723953247070312, -0.5431671142578125, -0.5139389038085938, -0.484710693359375, -0.45548248291015625, -0.4262542724609375, -0.39702606201171875, -0.3677978515625, -0.33856964111328125, -0.3093414306640625, -0.28011322021484375, -0.250885009765625, -0.22165679931640625, -0.1924285888671875, -0.16320037841796875, -0.13397216796875, -0.10474395751953125, -0.0755157470703125, -0.04628753662109375, -0.017059326171875, 0.01216888427734375, 0.0413970947265625, 0.07062530517578125, 0.099853515625, 0.12908172607421875, 0.1583099365234375, 0.18753814697265625, 0.216766357421875, 0.24599456787109375, 0.2752227783203125, 0.30445098876953125, 0.33367919921875, 0.36290740966796875, 0.3921356201171875, 0.42136383056640625, 0.450592041015625, 0.47982025146484375, 0.5090484619140625, 0.5382766723632812, 0.5675048828125, 0.5967330932617188, 0.6259613037109375, 0.6551895141601562, 0.684417724609375, 0.7136459350585938, 0.7428741455078125, 0.7721023559570312, 0.80133056640625, 0.8305587768554688, 0.8597869873046875, 0.8890151977539062, 0.918243408203125, 0.9474716186523438, 0.9766998291015625, 1.0059280395507812, 1.03515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 7.0, 7.0, 18.0, 11.0, 20.0, 42.0, 60.0, 82.0, 137.0, 228.0, 414.0, 757.0, 1356.0, 2935.0, 6442.0, 15799.0, 41630.0, 115697.0, 274811.0, 326209.0, 163329.0, 60066.0, 22086.0, 8710.0, 3772.0, 1871.0, 864.0, 467.0, 283.0, 148.0, 105.0, 73.0, 35.0, 24.0, 18.0, 9.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9150390625, -0.8856887817382812, -0.8563385009765625, -0.8269882202148438, -0.797637939453125, -0.7682876586914062, -0.7389373779296875, -0.7095870971679688, -0.68023681640625, -0.6508865356445312, -0.6215362548828125, -0.5921859741210938, -0.562835693359375, -0.5334854125976562, -0.5041351318359375, -0.47478485107421875, -0.4454345703125, -0.41608428955078125, -0.3867340087890625, -0.35738372802734375, -0.328033447265625, -0.29868316650390625, -0.2693328857421875, -0.23998260498046875, -0.21063232421875, -0.18128204345703125, -0.1519317626953125, -0.12258148193359375, -0.093231201171875, -0.06388092041015625, -0.0345306396484375, -0.00518035888671875, 0.024169921875, 0.05352020263671875, 0.0828704833984375, 0.11222076416015625, 0.141571044921875, 0.17092132568359375, 0.2002716064453125, 0.22962188720703125, 0.25897216796875, 0.28832244873046875, 0.3176727294921875, 0.34702301025390625, 0.376373291015625, 0.40572357177734375, 0.4350738525390625, 0.46442413330078125, 0.4937744140625, 0.5231246948242188, 0.5524749755859375, 0.5818252563476562, 0.611175537109375, 0.6405258178710938, 0.6698760986328125, 0.6992263793945312, 0.72857666015625, 0.7579269409179688, 0.7872772216796875, 0.8166275024414062, 0.845977783203125, 0.8753280639648438, 0.9046783447265625, 0.9340286254882812, 0.96337890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 2.0, 9.0, 5.0, 12.0, 9.0, 33.0, 31.0, 25.0, 37.0, 34.0, 41.0, 50.0, 66.0, 61.0, 59.0, 66.0, 68.0, 52.0, 65.0, 48.0, 40.0, 32.0, 29.0, 30.0, 21.0, 16.0, 8.0, 15.0, 11.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000148773193359375, -0.00014415383338928223, -0.00013953447341918945, -0.00013491511344909668, -0.0001302957534790039, -0.00012567639350891113, -0.00012105703353881836, -0.00011643767356872559, -0.00011181831359863281, -0.00010719895362854004, -0.00010257959365844727, -9.796023368835449e-05, -9.334087371826172e-05, -8.872151374816895e-05, -8.410215377807617e-05, -7.94827938079834e-05, -7.486343383789062e-05, -7.024407386779785e-05, -6.562471389770508e-05, -6.1005353927612305e-05, -5.638599395751953e-05, -5.176663398742676e-05, -4.7147274017333984e-05, -4.252791404724121e-05, -3.790855407714844e-05, -3.3289194107055664e-05, -2.866983413696289e-05, -2.4050474166870117e-05, -1.9431114196777344e-05, -1.481175422668457e-05, -1.0192394256591797e-05, -5.5730342864990234e-06, -9.5367431640625e-07, 3.6656856536865234e-06, 8.285045623779297e-06, 1.290440559387207e-05, 1.7523765563964844e-05, 2.2143125534057617e-05, 2.676248550415039e-05, 3.1381845474243164e-05, 3.600120544433594e-05, 4.062056541442871e-05, 4.5239925384521484e-05, 4.985928535461426e-05, 5.447864532470703e-05, 5.9098005294799805e-05, 6.371736526489258e-05, 6.833672523498535e-05, 7.295608520507812e-05, 7.75754451751709e-05, 8.219480514526367e-05, 8.681416511535645e-05, 9.143352508544922e-05, 9.605288505554199e-05, 0.00010067224502563477, 0.00010529160499572754, 0.00010991096496582031, 0.00011453032493591309, 0.00011914968490600586, 0.00012376904487609863, 0.0001283884048461914, 0.00013300776481628418, 0.00013762712478637695, 0.00014224648475646973, 0.0001468658447265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 8.0, 7.0, 11.0, 21.0, 26.0, 33.0, 48.0, 86.0, 139.0, 222.0, 285.0, 501.0, 827.0, 1456.0, 2917.0, 6072.0, 14643.0, 39042.0, 120363.0, 350517.0, 335747.0, 112734.0, 36969.0, 13965.0, 5855.0, 2632.0, 1368.0, 771.0, 422.0, 283.0, 185.0, 127.0, 68.0, 58.0, 45.0, 23.0, 19.0, 13.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.30078125, -1.264617919921875, -1.22845458984375, -1.192291259765625, -1.1561279296875, -1.119964599609375, -1.08380126953125, -1.047637939453125, -1.011474609375, -0.975311279296875, -0.93914794921875, -0.902984619140625, -0.8668212890625, -0.830657958984375, -0.79449462890625, -0.758331298828125, -0.72216796875, -0.686004638671875, -0.64984130859375, -0.613677978515625, -0.5775146484375, -0.541351318359375, -0.50518798828125, -0.469024658203125, -0.432861328125, -0.396697998046875, -0.36053466796875, -0.324371337890625, -0.2882080078125, -0.252044677734375, -0.21588134765625, -0.179718017578125, -0.1435546875, -0.107391357421875, -0.07122802734375, -0.035064697265625, 0.0010986328125, 0.037261962890625, 0.07342529296875, 0.109588623046875, 0.145751953125, 0.181915283203125, 0.21807861328125, 0.254241943359375, 0.2904052734375, 0.326568603515625, 0.36273193359375, 0.398895263671875, 0.43505859375, 0.471221923828125, 0.50738525390625, 0.543548583984375, 0.5797119140625, 0.615875244140625, 0.65203857421875, 0.688201904296875, 0.724365234375, 0.760528564453125, 0.79669189453125, 0.832855224609375, 0.8690185546875, 0.905181884765625, 0.94134521484375, 0.977508544921875, 1.013671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 3.0, 7.0, 9.0, 17.0, 15.0, 19.0, 26.0, 31.0, 29.0, 25.0, 28.0, 37.0, 47.0, 50.0, 46.0, 61.0, 56.0, 55.0, 45.0, 54.0, 50.0, 46.0, 39.0, 29.0, 36.0, 21.0, 26.0, 15.0, 11.0, 9.0, 10.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.62646484375, -0.6099624633789062, -0.5934600830078125, -0.5769577026367188, -0.560455322265625, -0.5439529418945312, -0.5274505615234375, -0.5109481811523438, -0.49444580078125, -0.47794342041015625, -0.4614410400390625, -0.44493865966796875, -0.428436279296875, -0.41193389892578125, -0.3954315185546875, -0.37892913818359375, -0.3624267578125, -0.34592437744140625, -0.3294219970703125, -0.31291961669921875, -0.296417236328125, -0.27991485595703125, -0.2634124755859375, -0.24691009521484375, -0.23040771484375, -0.21390533447265625, -0.1974029541015625, -0.18090057373046875, -0.164398193359375, -0.14789581298828125, -0.1313934326171875, -0.11489105224609375, -0.098388671875, -0.08188629150390625, -0.0653839111328125, -0.04888153076171875, -0.032379150390625, -0.01587677001953125, 0.0006256103515625, 0.01712799072265625, 0.03363037109375, 0.05013275146484375, 0.0666351318359375, 0.08313751220703125, 0.099639892578125, 0.11614227294921875, 0.1326446533203125, 0.14914703369140625, 0.1656494140625, 0.18215179443359375, 0.1986541748046875, 0.21515655517578125, 0.231658935546875, 0.24816131591796875, 0.2646636962890625, 0.28116607666015625, 0.29766845703125, 0.31417083740234375, 0.3306732177734375, 0.34717559814453125, 0.363677978515625, 0.38018035888671875, 0.3966827392578125, 0.41318511962890625, 0.4296875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 12.0, 12.0, 27.0, 38.0, 63.0, 78.0, 103.0, 117.0, 133.0, 112.0, 85.0, 66.0, 45.0, 33.0, 22.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.11367416381836, -9.795899391174316, -9.478123664855957, -9.160348892211914, -8.842574119567871, -8.524798393249512, -8.207023620605469, -7.889248371124268, -7.571473121643066, -7.253697872161865, -6.935923099517822, -6.618147850036621, -6.30037260055542, -5.982597351074219, -5.664822578430176, -5.347047328948975, -5.029272556304932, -4.7114973068237305, -4.3937225341796875, -4.075947284698486, -3.758172035217285, -3.440397024154663, -3.122622013092041, -2.80484676361084, -2.4870717525482178, -2.1692967414855957, -1.8515214920043945, -1.5337464809417725, -1.2159713506698608, -0.8981962203979492, -0.5804212093353271, -0.262645959854126, 0.055129051208496094, 0.3729041516780853, 0.6906792521476746, 1.0084543228149414, 1.326229453086853, 1.6440045833587646, 1.9617795944213867, 2.279554843902588, 2.59732985496521, 2.915104866027832, 3.232880115509033, 3.5506551265716553, 3.8684301376342773, 4.1862053871154785, 4.50398063659668, 4.821755409240723, 5.139530658721924, 5.457305908203125, 5.775080680847168, 6.092855930328369, 6.41063117980957, 6.728405952453613, 7.0461812019348145, 7.363956451416016, 7.681731224060059, 7.99950647354126, 8.317281723022461, 8.635056495666504, 8.952831268310547, 9.270606994628906, 9.58838176727295, 9.906156539916992, 10.223932266235352]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 12.0, 14.0, 28.0, 20.0, 33.0, 38.0, 52.0, 45.0, 55.0, 59.0, 74.0, 75.0, 75.0, 55.0, 66.0, 73.0, 37.0, 47.0, 31.0, 18.0, 31.0, 22.0, 14.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21395206451416, -8.920344352722168, -8.62673568725586, -8.333127975463867, -8.039520263671875, -7.745912551879883, -7.452304363250732, -7.158696174621582, -6.86508846282959, -6.571480751037598, -6.277872562408447, -5.984264373779297, -5.690656661987305, -5.3970489501953125, -5.103440761566162, -4.809832572937012, -4.5162248611450195, -4.222617149353027, -3.929008960723877, -3.6354010105133057, -3.3417930603027344, -3.048185110092163, -2.754577159881592, -2.4609692096710205, -2.167361259460449, -1.873753309249878, -1.5801453590393066, -1.2865374088287354, -0.9929294586181641, -0.6993215084075928, -0.4057135581970215, -0.1121056079864502, 0.1815013885498047, 0.475109338760376, 0.7687172889709473, 1.0623252391815186, 1.3559331893920898, 1.6495411396026611, 1.9431490898132324, 2.2367570400238037, 2.530364990234375, 2.8239729404449463, 3.1175808906555176, 3.411188840866089, 3.70479679107666, 3.9984047412872314, 4.292012691497803, 4.585620880126953, 4.879228591918945, 5.1728363037109375, 5.466444492340088, 5.760052680969238, 6.0536603927612305, 6.347268104553223, 6.640876293182373, 6.934484481811523, 7.228092193603516, 7.521699905395508, 7.815308094024658, 8.108916282653809, 8.4025239944458, 8.696131706237793, 8.989740371704102, 9.283348083496094, 9.576955795288086]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 16.0, 17.0, 34.0, 59.0, 87.0, 194.0, 419.0, 1161.0, 4756.0, 43750.0, 3960593.0, 170305.0, 9949.0, 1874.0, 578.0, 232.0, 115.0, 56.0, 23.0, 17.0, 12.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.92431640625, -5.7822265625, -5.64013671875, -5.498046875, -5.35595703125, -5.2138671875, -5.07177734375, -4.9296875, -4.78759765625, -4.6455078125, -4.50341796875, -4.361328125, -4.21923828125, -4.0771484375, -3.93505859375, -3.79296875, -3.65087890625, -3.5087890625, -3.36669921875, -3.224609375, -3.08251953125, -2.9404296875, -2.79833984375, -2.65625, -2.51416015625, -2.3720703125, -2.22998046875, -2.087890625, -1.94580078125, -1.8037109375, -1.66162109375, -1.51953125, -1.37744140625, -1.2353515625, -1.09326171875, -0.951171875, -0.80908203125, -0.6669921875, -0.52490234375, -0.3828125, -0.24072265625, -0.0986328125, 0.04345703125, 0.185546875, 0.32763671875, 0.4697265625, 0.61181640625, 0.75390625, 0.89599609375, 1.0380859375, 1.18017578125, 1.322265625, 1.46435546875, 1.6064453125, 1.74853515625, 1.890625, 2.03271484375, 2.1748046875, 2.31689453125, 2.458984375, 2.60107421875, 2.7431640625, 2.88525390625, 3.02734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 8.0, 11.0, 31.0, 33.0, 57.0, 63.0, 93.0, 82.0, 104.0, 113.0, 107.0, 92.0, 64.0, 40.0, 38.0, 18.0, 16.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.457763671875, -0.4475383758544922, -0.4373130798339844, -0.42708778381347656, -0.41686248779296875, -0.40663719177246094, -0.3964118957519531, -0.3861865997314453, -0.3759613037109375, -0.3657360076904297, -0.3555107116699219, -0.34528541564941406, -0.33506011962890625, -0.32483482360839844, -0.3146095275878906, -0.3043842315673828, -0.294158935546875, -0.2839336395263672, -0.2737083435058594, -0.26348304748535156, -0.25325775146484375, -0.24303245544433594, -0.23280715942382812, -0.2225818634033203, -0.2123565673828125, -0.2021312713623047, -0.19190597534179688, -0.18168067932128906, -0.17145538330078125, -0.16123008728027344, -0.15100479125976562, -0.1407794952392578, -0.13055419921875, -0.12032890319824219, -0.11010360717773438, -0.09987831115722656, -0.08965301513671875, -0.07942771911621094, -0.06920242309570312, -0.05897712707519531, -0.0487518310546875, -0.03852653503417969, -0.028301239013671875, -0.018075942993164062, -0.00785064697265625, 0.0023746490478515625, 0.012599945068359375, 0.022825241088867188, 0.033050537109375, 0.04327583312988281, 0.053501129150390625, 0.06372642517089844, 0.07395172119140625, 0.08417701721191406, 0.09440231323242188, 0.10462760925292969, 0.1148529052734375, 0.1250782012939453, 0.13530349731445312, 0.14552879333496094, 0.15575408935546875, 0.16597938537597656, 0.17620468139648438, 0.1864299774169922, 0.1966552734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 12.0, 8.0, 24.0, 40.0, 45.0, 106.0, 184.0, 323.0, 767.0, 1828.0, 4728.0, 14167.0, 52838.0, 323812.0, 3399951.0, 319968.0, 52397.0, 14289.0, 4883.0, 1956.0, 886.0, 441.0, 246.0, 146.0, 96.0, 53.0, 31.0, 15.0, 12.0, 6.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.28143310546875, -2.2171630859375, -2.15289306640625, -2.088623046875, -2.02435302734375, -1.9600830078125, -1.89581298828125, -1.83154296875, -1.76727294921875, -1.7030029296875, -1.63873291015625, -1.574462890625, -1.51019287109375, -1.4459228515625, -1.38165283203125, -1.3173828125, -1.25311279296875, -1.1888427734375, -1.12457275390625, -1.060302734375, -0.99603271484375, -0.9317626953125, -0.86749267578125, -0.80322265625, -0.73895263671875, -0.6746826171875, -0.61041259765625, -0.546142578125, -0.48187255859375, -0.4176025390625, -0.35333251953125, -0.2890625, -0.22479248046875, -0.1605224609375, -0.09625244140625, -0.031982421875, 0.03228759765625, 0.0965576171875, 0.16082763671875, 0.22509765625, 0.28936767578125, 0.3536376953125, 0.41790771484375, 0.482177734375, 0.54644775390625, 0.6107177734375, 0.67498779296875, 0.7392578125, 0.80352783203125, 0.8677978515625, 0.93206787109375, 0.996337890625, 1.06060791015625, 1.1248779296875, 1.18914794921875, 1.25341796875, 1.31768798828125, 1.3819580078125, 1.44622802734375, 1.510498046875, 1.57476806640625, 1.6390380859375, 1.70330810546875, 1.767578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 23.0, 18.0, 27.0, 50.0, 49.0, 93.0, 138.0, 205.0, 367.0, 1341.0, 821.0, 317.0, 171.0, 123.0, 92.0, 57.0, 36.0, 21.0, 26.0, 15.0, 11.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2578125, -0.24703216552734375, -0.2362518310546875, -0.22547149658203125, -0.214691162109375, -0.20391082763671875, -0.1931304931640625, -0.18235015869140625, -0.17156982421875, -0.16078948974609375, -0.1500091552734375, -0.13922882080078125, -0.128448486328125, -0.11766815185546875, -0.1068878173828125, -0.09610748291015625, -0.0853271484375, -0.07454681396484375, -0.0637664794921875, -0.05298614501953125, -0.042205810546875, -0.03142547607421875, -0.0206451416015625, -0.00986480712890625, 0.00091552734375, 0.01169586181640625, 0.0224761962890625, 0.03325653076171875, 0.044036865234375, 0.05481719970703125, 0.0655975341796875, 0.07637786865234375, 0.087158203125, 0.09793853759765625, 0.1087188720703125, 0.11949920654296875, 0.130279541015625, 0.14105987548828125, 0.1518402099609375, 0.16262054443359375, 0.17340087890625, 0.18418121337890625, 0.1949615478515625, 0.20574188232421875, 0.216522216796875, 0.22730255126953125, 0.2380828857421875, 0.24886322021484375, 0.2596435546875, 0.27042388916015625, 0.2812042236328125, 0.29198455810546875, 0.302764892578125, 0.31354522705078125, 0.3243255615234375, 0.33510589599609375, 0.34588623046875, 0.35666656494140625, 0.3674468994140625, 0.37822723388671875, 0.389007568359375, 0.39978790283203125, 0.4105682373046875, 0.42134857177734375, 0.43212890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 15.0, 31.0, 71.0, 122.0, 153.0, 175.0, 148.0, 121.0, 70.0, 42.0, 21.0, 12.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.760511875152588, -1.6604740619659424, -1.5604362487792969, -1.4603984355926514, -1.3603606224060059, -1.2603228092193604, -1.1602851152420044, -1.0602473020553589, -0.9602094888687134, -0.8601716756820679, -0.7601338624954224, -0.6600961089134216, -0.5600582957267761, -0.4600204825401306, -0.3599827289581299, -0.2599449157714844, -0.15990710258483887, -0.05986930429935455, 0.04016849398612976, 0.14020627737045288, 0.2402440905570984, 0.3402819037437439, 0.44031965732574463, 0.5403574705123901, 0.6403952836990356, 0.7404330968856812, 0.8404709100723267, 0.9405086636543274, 1.0405464172363281, 1.1405842304229736, 1.2406220436096191, 1.3406598567962646, 1.4406976699829102, 1.5407354831695557, 1.6407732963562012, 1.7408111095428467, 1.8408489227294922, 1.9408867359161377, 2.040924549102783, 2.1409621238708496, 2.241000175476074, 2.3410379886627197, 2.4410758018493652, 2.5411136150360107, 2.6411514282226562, 2.7411892414093018, 2.8412270545959473, 2.9412646293640137, 3.041302442550659, 3.1413402557373047, 3.24137806892395, 3.3414158821105957, 3.441453695297241, 3.5414915084838867, 3.641529083251953, 3.7415671348571777, 3.841604709625244, 3.9416425228118896, 4.041680335998535, 4.141717910766602, 4.241755962371826, 4.341793537139893, 4.441831588745117, 4.541869163513184, 4.641907215118408]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 14.0, 12.0, 16.0, 19.0, 19.0, 22.0, 23.0, 23.0, 35.0, 27.0, 34.0, 44.0, 42.0, 51.0, 46.0, 32.0, 43.0, 45.0, 48.0, 37.0, 42.0, 30.0, 33.0, 41.0, 19.0, 19.0, 25.0, 24.0, 12.0, 16.0, 18.0, 11.0, 10.0, 14.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0349489450454712, -0.9999313950538635, -0.9649138450622559, -0.929896354675293, -0.8948788046836853, -0.8598612546920776, -0.82484370470047, -0.7898261547088623, -0.7548086643218994, -0.7197911143302917, -0.6847735643386841, -0.6497560739517212, -0.6147385239601135, -0.5797209739685059, -0.5447034239768982, -0.5096858739852905, -0.47466832399368286, -0.4396507740020752, -0.4046332538127899, -0.36961570382118225, -0.334598183631897, -0.2995806336402893, -0.26456308364868164, -0.22954554855823517, -0.1945280134677887, -0.15951047837734222, -0.12449293583631516, -0.08947539329528809, -0.054457858204841614, -0.01944032311439514, 0.015577226877212524, 0.050594761967659, 0.08561229705810547, 0.12062983214855194, 0.1556473672389984, 0.19066491723060608, 0.22568245232105255, 0.260699987411499, 0.2957175374031067, 0.33073508739471436, 0.36575260758399963, 0.4007701575756073, 0.4357876777648926, 0.47080522775650024, 0.5058227777481079, 0.5408402681350708, 0.5758578777313232, 0.6108753681182861, 0.6458929181098938, 0.6809104681015015, 0.7159280180931091, 0.7509455680847168, 0.7859630584716797, 0.8209806084632874, 0.855998158454895, 0.8910157084465027, 0.9260332584381104, 0.961050808429718, 0.9960683584213257, 1.0310858488082886, 1.066103458404541, 1.101120948791504, 1.1361384391784668, 1.1711560487747192, 1.2061735391616821]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 11.0, 9.0, 6.0, 21.0, 23.0, 55.0, 94.0, 184.0, 303.0, 749.0, 1811.0, 5218.0, 20265.0, 93451.0, 357751.0, 410528.0, 121821.0, 26005.0, 6487.0, 2121.0, 840.0, 367.0, 176.0, 91.0, 56.0, 40.0, 24.0, 13.0, 8.0, 7.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.07781982421875, -2.0130615234375, -1.94830322265625, -1.883544921875, -1.81878662109375, -1.7540283203125, -1.68927001953125, -1.62451171875, -1.55975341796875, -1.4949951171875, -1.43023681640625, -1.365478515625, -1.30072021484375, -1.2359619140625, -1.17120361328125, -1.1064453125, -1.04168701171875, -0.9769287109375, -0.91217041015625, -0.847412109375, -0.78265380859375, -0.7178955078125, -0.65313720703125, -0.58837890625, -0.52362060546875, -0.4588623046875, -0.39410400390625, -0.329345703125, -0.26458740234375, -0.1998291015625, -0.13507080078125, -0.0703125, -0.00555419921875, 0.0592041015625, 0.12396240234375, 0.188720703125, 0.25347900390625, 0.3182373046875, 0.38299560546875, 0.44775390625, 0.51251220703125, 0.5772705078125, 0.64202880859375, 0.706787109375, 0.77154541015625, 0.8363037109375, 0.90106201171875, 0.9658203125, 1.03057861328125, 1.0953369140625, 1.16009521484375, 1.224853515625, 1.28961181640625, 1.3543701171875, 1.41912841796875, 1.48388671875, 1.54864501953125, 1.6134033203125, 1.67816162109375, 1.742919921875, 1.80767822265625, 1.8724365234375, 1.93719482421875, 2.001953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 6.0, 14.0, 11.0, 24.0, 40.0, 59.0, 66.0, 83.0, 90.0, 116.0, 107.0, 94.0, 78.0, 64.0, 43.0, 28.0, 25.0, 24.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.435791015625, -0.4258403778076172, -0.4158897399902344, -0.40593910217285156, -0.39598846435546875, -0.38603782653808594, -0.3760871887207031, -0.3661365509033203, -0.3561859130859375, -0.3462352752685547, -0.3362846374511719, -0.32633399963378906, -0.31638336181640625, -0.30643272399902344, -0.2964820861816406, -0.2865314483642578, -0.276580810546875, -0.2666301727294922, -0.2566795349121094, -0.24672889709472656, -0.23677825927734375, -0.22682762145996094, -0.21687698364257812, -0.2069263458251953, -0.1969757080078125, -0.1870250701904297, -0.17707443237304688, -0.16712379455566406, -0.15717315673828125, -0.14722251892089844, -0.13727188110351562, -0.1273212432861328, -0.11737060546875, -0.10741996765136719, -0.09746932983398438, -0.08751869201660156, -0.07756805419921875, -0.06761741638183594, -0.057666778564453125, -0.04771614074707031, -0.0377655029296875, -0.027814865112304688, -0.017864227294921875, -0.007913589477539062, 0.00203704833984375, 0.011987686157226562, 0.021938323974609375, 0.03188896179199219, 0.041839599609375, 0.05179023742675781, 0.061740875244140625, 0.07169151306152344, 0.08164215087890625, 0.09159278869628906, 0.10154342651367188, 0.11149406433105469, 0.1214447021484375, 0.1313953399658203, 0.14134597778320312, 0.15129661560058594, 0.16124725341796875, 0.17119789123535156, 0.18114852905273438, 0.1910991668701172, 0.2010498046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 8.0, 10.0, 7.0, 12.0, 20.0, 28.0, 40.0, 54.0, 96.0, 128.0, 203.0, 286.0, 412.0, 561.0, 951.0, 1574.0, 3130.0, 6770.0, 17370.0, 48660.0, 129516.0, 265548.0, 297694.0, 167942.0, 65808.0, 23699.0, 8974.0, 3942.0, 1959.0, 1083.0, 721.0, 464.0, 275.0, 198.0, 132.0, 82.0, 59.0, 51.0, 34.0, 17.0, 12.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4658203125, -1.4241180419921875, -1.382415771484375, -1.3407135009765625, -1.29901123046875, -1.2573089599609375, -1.215606689453125, -1.1739044189453125, -1.1322021484375, -1.0904998779296875, -1.048797607421875, -1.0070953369140625, -0.96539306640625, -0.9236907958984375, -0.881988525390625, -0.8402862548828125, -0.798583984375, -0.7568817138671875, -0.715179443359375, -0.6734771728515625, -0.63177490234375, -0.5900726318359375, -0.548370361328125, -0.5066680908203125, -0.4649658203125, -0.4232635498046875, -0.381561279296875, -0.3398590087890625, -0.29815673828125, -0.2564544677734375, -0.214752197265625, -0.1730499267578125, -0.13134765625, -0.0896453857421875, -0.047943115234375, -0.0062408447265625, 0.03546142578125, 0.0771636962890625, 0.118865966796875, 0.1605682373046875, 0.2022705078125, 0.2439727783203125, 0.285675048828125, 0.3273773193359375, 0.36907958984375, 0.4107818603515625, 0.452484130859375, 0.4941864013671875, 0.535888671875, 0.5775909423828125, 0.619293212890625, 0.6609954833984375, 0.70269775390625, 0.7444000244140625, 0.786102294921875, 0.8278045654296875, 0.8695068359375, 0.9112091064453125, 0.952911376953125, 0.9946136474609375, 1.03631591796875, 1.0780181884765625, 1.119720458984375, 1.1614227294921875, 1.203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 14.0, 9.0, 12.0, 17.0, 22.0, 25.0, 31.0, 37.0, 39.0, 46.0, 46.0, 41.0, 46.0, 50.0, 57.0, 55.0, 44.0, 50.0, 52.0, 46.0, 36.0, 26.0, 32.0, 18.0, 27.0, 23.0, 20.0, 20.0, 14.0, 7.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.3271484375, -1.2929306030273438, -1.2587127685546875, -1.2244949340820312, -1.190277099609375, -1.1560592651367188, -1.1218414306640625, -1.0876235961914062, -1.05340576171875, -1.0191879272460938, -0.9849700927734375, -0.9507522583007812, -0.916534423828125, -0.8823165893554688, -0.8480987548828125, -0.8138809204101562, -0.7796630859375, -0.7454452514648438, -0.7112274169921875, -0.6770095825195312, -0.642791748046875, -0.6085739135742188, -0.5743560791015625, -0.5401382446289062, -0.50592041015625, -0.47170257568359375, -0.4374847412109375, -0.40326690673828125, -0.369049072265625, -0.33483123779296875, -0.3006134033203125, -0.26639556884765625, -0.232177734375, -0.19795989990234375, -0.1637420654296875, -0.12952423095703125, -0.095306396484375, -0.06108856201171875, -0.0268707275390625, 0.00734710693359375, 0.04156494140625, 0.07578277587890625, 0.1100006103515625, 0.14421844482421875, 0.178436279296875, 0.21265411376953125, 0.2468719482421875, 0.28108978271484375, 0.3153076171875, 0.34952545166015625, 0.3837432861328125, 0.41796112060546875, 0.452178955078125, 0.48639678955078125, 0.5206146240234375, 0.5548324584960938, 0.58905029296875, 0.6232681274414062, 0.6574859619140625, 0.6917037963867188, 0.725921630859375, 0.7601394653320312, 0.7943572998046875, 0.8285751342773438, 0.86279296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 9.0, 11.0, 15.0, 23.0, 38.0, 43.0, 59.0, 112.0, 156.0, 245.0, 392.0, 698.0, 1072.0, 1954.0, 3777.0, 7566.0, 16516.0, 38159.0, 91580.0, 200262.0, 296294.0, 212989.0, 99317.0, 42200.0, 17895.0, 8259.0, 4067.0, 1977.0, 1116.0, 619.0, 353.0, 260.0, 169.0, 93.0, 69.0, 63.0, 34.0, 25.0, 20.0, 13.0, 13.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6826400756835938, -0.6616668701171875, -0.6406936645507812, -0.619720458984375, -0.5987472534179688, -0.5777740478515625, -0.5568008422851562, -0.53582763671875, -0.5148544311523438, -0.4938812255859375, -0.47290802001953125, -0.451934814453125, -0.43096160888671875, -0.4099884033203125, -0.38901519775390625, -0.3680419921875, -0.34706878662109375, -0.3260955810546875, -0.30512237548828125, -0.284149169921875, -0.26317596435546875, -0.2422027587890625, -0.22122955322265625, -0.20025634765625, -0.17928314208984375, -0.1583099365234375, -0.13733673095703125, -0.116363525390625, -0.09539031982421875, -0.0744171142578125, -0.05344390869140625, -0.032470703125, -0.01149749755859375, 0.0094757080078125, 0.03044891357421875, 0.051422119140625, 0.07239532470703125, 0.0933685302734375, 0.11434173583984375, 0.13531494140625, 0.15628814697265625, 0.1772613525390625, 0.19823455810546875, 0.219207763671875, 0.24018096923828125, 0.2611541748046875, 0.28212738037109375, 0.3031005859375, 0.32407379150390625, 0.3450469970703125, 0.36602020263671875, 0.386993408203125, 0.40796661376953125, 0.4289398193359375, 0.44991302490234375, 0.47088623046875, 0.49185943603515625, 0.5128326416015625, 0.5338058471679688, 0.554779052734375, 0.5757522583007812, 0.5967254638671875, 0.6176986694335938, 0.638671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 16.0, 12.0, 24.0, 19.0, 22.0, 30.0, 45.0, 42.0, 42.0, 59.0, 57.0, 57.0, 83.0, 67.0, 49.0, 48.0, 49.0, 47.0, 35.0, 26.0, 22.0, 28.0, 17.0, 21.0, 10.0, 12.0, 9.0, 8.0, 2.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011900998651981354, -0.0001145191490650177, -0.00011002831161022186, -0.00010553747415542603, -0.00010104663670063019, -9.655579924583435e-05, -9.206496179103851e-05, -8.757412433624268e-05, -8.308328688144684e-05, -7.8592449426651e-05, -7.410161197185516e-05, -6.961077451705933e-05, -6.511993706226349e-05, -6.062909960746765e-05, -5.6138262152671814e-05, -5.1647424697875977e-05, -4.715658724308014e-05, -4.26657497882843e-05, -3.8174912333488464e-05, -3.368407487869263e-05, -2.919323742389679e-05, -2.4702399969100952e-05, -2.0211562514305115e-05, -1.5720725059509277e-05, -1.122988760471344e-05, -6.7390501499176025e-06, -2.248212695121765e-06, 2.2426247596740723e-06, 6.73346221446991e-06, 1.1224299669265747e-05, 1.5715137124061584e-05, 2.0205974578857422e-05, 2.469681203365326e-05, 2.9187649488449097e-05, 3.3678486943244934e-05, 3.816932439804077e-05, 4.266016185283661e-05, 4.7150999307632446e-05, 5.1641836762428284e-05, 5.613267421722412e-05, 6.062351167201996e-05, 6.51143491268158e-05, 6.960518658161163e-05, 7.409602403640747e-05, 7.858686149120331e-05, 8.307769894599915e-05, 8.756853640079498e-05, 9.205937385559082e-05, 9.655021131038666e-05, 0.0001010410487651825, 0.00010553188621997833, 0.00011002272367477417, 0.00011451356112957001, 0.00011900439858436584, 0.00012349523603916168, 0.00012798607349395752, 0.00013247691094875336, 0.0001369677484035492, 0.00014145858585834503, 0.00014594942331314087, 0.0001504402607679367, 0.00015493109822273254, 0.00015942193567752838, 0.00016391277313232422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 8.0, 3.0, 7.0, 4.0, 15.0, 11.0, 32.0, 35.0, 41.0, 73.0, 94.0, 155.0, 230.0, 359.0, 636.0, 1132.0, 2144.0, 4708.0, 11740.0, 33587.0, 107760.0, 317593.0, 364760.0, 136279.0, 41614.0, 14253.0, 5552.0, 2507.0, 1296.0, 712.0, 423.0, 258.0, 178.0, 118.0, 67.0, 51.0, 30.0, 23.0, 18.0, 13.0, 10.0, 6.0, 10.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88134765625, -0.8538894653320312, -0.8264312744140625, -0.7989730834960938, -0.771514892578125, -0.7440567016601562, -0.7165985107421875, -0.6891403198242188, -0.66168212890625, -0.6342239379882812, -0.6067657470703125, -0.5793075561523438, -0.551849365234375, -0.5243911743164062, -0.4969329833984375, -0.46947479248046875, -0.4420166015625, -0.41455841064453125, -0.3871002197265625, -0.35964202880859375, -0.332183837890625, -0.30472564697265625, -0.2772674560546875, -0.24980926513671875, -0.22235107421875, -0.19489288330078125, -0.1674346923828125, -0.13997650146484375, -0.112518310546875, -0.08506011962890625, -0.0576019287109375, -0.03014373779296875, -0.002685546875, 0.02477264404296875, 0.0522308349609375, 0.07968902587890625, 0.107147216796875, 0.13460540771484375, 0.1620635986328125, 0.18952178955078125, 0.21697998046875, 0.24443817138671875, 0.2718963623046875, 0.29935455322265625, 0.326812744140625, 0.35427093505859375, 0.3817291259765625, 0.40918731689453125, 0.4366455078125, 0.46410369873046875, 0.4915618896484375, 0.5190200805664062, 0.546478271484375, 0.5739364624023438, 0.6013946533203125, 0.6288528442382812, 0.65631103515625, 0.6837692260742188, 0.7112274169921875, 0.7386856079101562, 0.766143798828125, 0.7936019897460938, 0.8210601806640625, 0.8485183715820312, 0.8759765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 5.0, 6.0, 12.0, 9.0, 14.0, 21.0, 27.0, 30.0, 43.0, 46.0, 53.0, 60.0, 61.0, 70.0, 72.0, 65.0, 78.0, 63.0, 48.0, 52.0, 33.0, 19.0, 25.0, 17.0, 8.0, 15.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49560546875, -0.47869110107421875, -0.4617767333984375, -0.44486236572265625, -0.427947998046875, -0.41103363037109375, -0.3941192626953125, -0.37720489501953125, -0.36029052734375, -0.34337615966796875, -0.3264617919921875, -0.30954742431640625, -0.292633056640625, -0.27571868896484375, -0.2588043212890625, -0.24188995361328125, -0.2249755859375, -0.20806121826171875, -0.1911468505859375, -0.17423248291015625, -0.157318115234375, -0.14040374755859375, -0.1234893798828125, -0.10657501220703125, -0.08966064453125, -0.07274627685546875, -0.0558319091796875, -0.03891754150390625, -0.022003173828125, -0.00508880615234375, 0.0118255615234375, 0.02873992919921875, 0.045654296875, 0.06256866455078125, 0.0794830322265625, 0.09639739990234375, 0.113311767578125, 0.13022613525390625, 0.1471405029296875, 0.16405487060546875, 0.18096923828125, 0.19788360595703125, 0.2147979736328125, 0.23171234130859375, 0.248626708984375, 0.26554107666015625, 0.2824554443359375, 0.29936981201171875, 0.3162841796875, 0.33319854736328125, 0.3501129150390625, 0.36702728271484375, 0.383941650390625, 0.40085601806640625, 0.4177703857421875, 0.43468475341796875, 0.45159912109375, 0.46851348876953125, 0.4854278564453125, 0.5023422241210938, 0.519256591796875, 0.5361709594726562, 0.5530853271484375, 0.5699996948242188, 0.5869140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 4.0, 13.0, 13.0, 11.0, 22.0, 37.0, 58.0, 69.0, 84.0, 112.0, 101.0, 108.0, 96.0, 71.0, 59.0, 36.0, 31.0, 31.0, 7.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.084464073181152, -10.79800033569336, -10.511537551879883, -10.22507381439209, -9.938611030578613, -9.65214729309082, -9.365684509277344, -9.07922077178955, -8.792757987976074, -8.506294250488281, -8.219831466674805, -7.93336820602417, -7.646904945373535, -7.3604416847229, -7.073978424072266, -6.787514686584473, -6.501051425933838, -6.214588165283203, -5.928124904632568, -5.641661643981934, -5.355198383331299, -5.068735122680664, -4.782271385192871, -4.4958086013793945, -4.209344863891602, -3.922881603240967, -3.636418342590332, -3.3499550819396973, -3.0634918212890625, -2.7770285606384277, -2.490565061569214, -2.204101800918579, -1.9176383018493652, -1.6311750411987305, -1.3447117805480957, -1.0582484006881714, -0.7717851400375366, -0.48532187938690186, -0.19885849952697754, 0.08760476112365723, 0.374068021774292, 0.6605312824249268, 0.9469946026802063, 1.2334579229354858, 1.5199211835861206, 1.8063844442367554, 2.0928478240966797, 2.3793110847473145, 2.665774345397949, 2.952237606048584, 3.2387008666992188, 3.5251641273498535, 3.8116273880004883, 4.098090648651123, 4.384553909301758, 4.671017646789551, 4.957480430603027, 5.243943691253662, 5.530406951904297, 5.816870212554932, 6.103333473205566, 6.389796733856201, 6.676259994506836, 6.962723731994629, 7.249186992645264]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 6.0, 18.0, 5.0, 23.0, 26.0, 22.0, 35.0, 40.0, 38.0, 48.0, 65.0, 56.0, 53.0, 66.0, 48.0, 66.0, 50.0, 53.0, 49.0, 45.0, 32.0, 30.0, 29.0, 16.0, 14.0, 18.0, 13.0, 9.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735222339630127, -6.45862340927124, -6.182024002075195, -5.905425071716309, -5.628825664520264, -5.352226734161377, -5.075627326965332, -4.799028396606445, -4.522429466247559, -4.245830535888672, -3.969231128692627, -3.6926321983337402, -3.4160327911376953, -3.1394338607788086, -2.8628346920013428, -2.586235523223877, -2.309636116027832, -2.033036947250366, -1.7564377784729004, -1.4798387289047241, -1.2032395601272583, -0.9266403913497925, -0.6500413417816162, -0.3734421730041504, -0.09684300422668457, 0.17975613474845886, 0.4563552737236023, 0.7329543828964233, 1.0095535516738892, 1.286152720451355, 1.5627517700195312, 1.839350938796997, 2.115950584411621, 2.392549753189087, 2.6691489219665527, 2.9457478523254395, 3.2223472595214844, 3.498946189880371, 3.775545358657837, 4.052144527435303, 4.328743934631348, 4.605342864990234, 4.881942272186279, 5.158541202545166, 5.435140609741211, 5.711739540100098, 5.988338470458984, 6.264937877655029, 6.541536808013916, 6.818135738372803, 7.094735145568848, 7.371334075927734, 7.647933483123779, 7.924532413482666, 8.201131820678711, 8.477730751037598, 8.754329681396484, 9.030928611755371, 9.307527542114258, 9.584127426147461, 9.860726356506348, 10.137325286865234, 10.413924217224121, 10.690523147583008, 10.967123031616211]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 11.0, 8.0, 13.0, 14.0, 17.0, 28.0, 47.0, 56.0, 118.0, 221.0, 411.0, 728.0, 1486.0, 3269.0, 9278.0, 32233.0, 173451.0, 3631127.0, 278707.0, 43246.0, 11934.0, 4164.0, 1754.0, 853.0, 462.0, 239.0, 152.0, 80.0, 53.0, 36.0, 21.0, 13.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.8876953125, -1.837493896484375, -1.78729248046875, -1.737091064453125, -1.6868896484375, -1.636688232421875, -1.58648681640625, -1.536285400390625, -1.486083984375, -1.435882568359375, -1.38568115234375, -1.335479736328125, -1.2852783203125, -1.235076904296875, -1.18487548828125, -1.134674072265625, -1.08447265625, -1.034271240234375, -0.98406982421875, -0.933868408203125, -0.8836669921875, -0.833465576171875, -0.78326416015625, -0.733062744140625, -0.682861328125, -0.632659912109375, -0.58245849609375, -0.532257080078125, -0.4820556640625, -0.431854248046875, -0.38165283203125, -0.331451416015625, -0.28125, -0.231048583984375, -0.18084716796875, -0.130645751953125, -0.0804443359375, -0.030242919921875, 0.01995849609375, 0.070159912109375, 0.120361328125, 0.170562744140625, 0.22076416015625, 0.270965576171875, 0.3211669921875, 0.371368408203125, 0.42156982421875, 0.471771240234375, 0.52197265625, 0.572174072265625, 0.62237548828125, 0.672576904296875, 0.7227783203125, 0.772979736328125, 0.82318115234375, 0.873382568359375, 0.923583984375, 0.973785400390625, 1.02398681640625, 1.074188232421875, 1.1243896484375, 1.174591064453125, 1.22479248046875, 1.274993896484375, 1.3251953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 9.0, 17.0, 28.0, 47.0, 48.0, 66.0, 82.0, 91.0, 103.0, 88.0, 102.0, 65.0, 77.0, 46.0, 35.0, 31.0, 23.0, 14.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.473388671875, -0.4615516662597656, -0.44971466064453125, -0.4378776550292969, -0.4260406494140625, -0.4142036437988281, -0.40236663818359375, -0.3905296325683594, -0.378692626953125, -0.3668556213378906, -0.35501861572265625, -0.3431816101074219, -0.3313446044921875, -0.3195075988769531, -0.30767059326171875, -0.2958335876464844, -0.28399658203125, -0.2721595764160156, -0.26032257080078125, -0.24848556518554688, -0.2366485595703125, -0.22481155395507812, -0.21297454833984375, -0.20113754272460938, -0.189300537109375, -0.17746353149414062, -0.16562652587890625, -0.15378952026367188, -0.1419525146484375, -0.13011550903320312, -0.11827850341796875, -0.10644149780273438, -0.0946044921875, -0.08276748657226562, -0.07093048095703125, -0.059093475341796875, -0.0472564697265625, -0.035419464111328125, -0.02358245849609375, -0.011745452880859375, 9.1552734375e-05, 0.011928558349609375, 0.02376556396484375, 0.035602569580078125, 0.0474395751953125, 0.059276580810546875, 0.07111358642578125, 0.08295059204101562, 0.09478759765625, 0.10662460327148438, 0.11846160888671875, 0.13029861450195312, 0.1421356201171875, 0.15397262573242188, 0.16580963134765625, 0.17764663696289062, 0.189483642578125, 0.20132064819335938, 0.21315765380859375, 0.22499465942382812, 0.2368316650390625, 0.24866867065429688, 0.26050567626953125, 0.2723426818847656, 0.2841796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 12.0, 11.0, 26.0, 36.0, 38.0, 58.0, 83.0, 144.0, 217.0, 411.0, 727.0, 1496.0, 4060.0, 11595.0, 40769.0, 192457.0, 3141050.0, 672158.0, 92990.0, 23417.0, 7468.0, 2751.0, 1074.0, 467.0, 284.0, 164.0, 111.0, 62.0, 32.0, 35.0, 18.0, 15.0, 5.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.58203125, -1.5365447998046875, -1.491058349609375, -1.4455718994140625, -1.40008544921875, -1.3545989990234375, -1.309112548828125, -1.2636260986328125, -1.2181396484375, -1.1726531982421875, -1.127166748046875, -1.0816802978515625, -1.03619384765625, -0.9907073974609375, -0.945220947265625, -0.8997344970703125, -0.854248046875, -0.8087615966796875, -0.763275146484375, -0.7177886962890625, -0.67230224609375, -0.6268157958984375, -0.581329345703125, -0.5358428955078125, -0.4903564453125, -0.4448699951171875, -0.399383544921875, -0.3538970947265625, -0.30841064453125, -0.2629241943359375, -0.217437744140625, -0.1719512939453125, -0.12646484375, -0.0809783935546875, -0.035491943359375, 0.0099945068359375, 0.05548095703125, 0.1009674072265625, 0.146453857421875, 0.1919403076171875, 0.2374267578125, 0.2829132080078125, 0.328399658203125, 0.3738861083984375, 0.41937255859375, 0.4648590087890625, 0.510345458984375, 0.5558319091796875, 0.601318359375, 0.6468048095703125, 0.692291259765625, 0.7377777099609375, 0.78326416015625, 0.8287506103515625, 0.874237060546875, 0.9197235107421875, 0.9652099609375, 1.0106964111328125, 1.056182861328125, 1.1016693115234375, 1.14715576171875, 1.1926422119140625, 1.238128662109375, 1.2836151123046875, 1.3291015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 15.0, 12.0, 11.0, 27.0, 32.0, 65.0, 68.0, 147.0, 210.0, 516.0, 1794.0, 530.0, 222.0, 132.0, 93.0, 61.0, 29.0, 33.0, 25.0, 13.0, 10.0, 4.0, 10.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43310546875, -0.4205589294433594, -0.40801239013671875, -0.3954658508300781, -0.3829193115234375, -0.3703727722167969, -0.35782623291015625, -0.3452796936035156, -0.332733154296875, -0.3201866149902344, -0.30764007568359375, -0.2950935363769531, -0.2825469970703125, -0.2700004577636719, -0.25745391845703125, -0.24490737915039062, -0.23236083984375, -0.21981430053710938, -0.20726776123046875, -0.19472122192382812, -0.1821746826171875, -0.16962814331054688, -0.15708160400390625, -0.14453506469726562, -0.131988525390625, -0.11944198608398438, -0.10689544677734375, -0.09434890747070312, -0.0818023681640625, -0.06925582885742188, -0.05670928955078125, -0.044162750244140625, -0.0316162109375, -0.019069671630859375, -0.00652313232421875, 0.006023406982421875, 0.0185699462890625, 0.031116485595703125, 0.04366302490234375, 0.056209564208984375, 0.068756103515625, 0.08130264282226562, 0.09384918212890625, 0.10639572143554688, 0.1189422607421875, 0.13148880004882812, 0.14403533935546875, 0.15658187866210938, 0.16912841796875, 0.18167495727539062, 0.19422149658203125, 0.20676803588867188, 0.2193145751953125, 0.23186111450195312, 0.24440765380859375, 0.2569541931152344, 0.269500732421875, 0.2820472717285156, 0.29459381103515625, 0.3071403503417969, 0.3196868896484375, 0.3322334289550781, 0.34477996826171875, 0.3573265075683594, 0.369873046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 13.0, 17.0, 31.0, 51.0, 71.0, 88.0, 111.0, 122.0, 124.0, 107.0, 86.0, 64.0, 46.0, 23.0, 17.0, 12.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0657577514648438, -2.994230031967163, -2.9227023124694824, -2.851174831390381, -2.7796471118927, -2.7081193923950195, -2.636591672897339, -2.565063953399658, -2.4935364723205566, -2.422008752822876, -2.3504810333251953, -2.2789535522460938, -2.207425832748413, -2.1358981132507324, -2.0643703937530518, -1.992842674255371, -1.9213149547576904, -1.8497872352600098, -1.7782596349716187, -1.706731915473938, -1.6352043151855469, -1.5636765956878662, -1.4921488761901855, -1.4206211566925049, -1.3490935564041138, -1.277565836906433, -1.206038236618042, -1.1345105171203613, -1.0629827976226807, -0.9914551973342896, -0.9199274778366089, -0.848399817943573, -0.7768720388412476, -0.7053443789482117, -0.6338167190551758, -0.5622889995574951, -0.49076133966445923, -0.41923367977142334, -0.34770599007606506, -0.2761783003807068, -0.2046506404876709, -0.13312296569347382, -0.06159529089927673, 0.009932383894920349, 0.08146005868911743, 0.15298771858215332, 0.2245154082775116, 0.2960430979728699, 0.36757075786590576, 0.43909841775894165, 0.5106260776519775, 0.5821537971496582, 0.6536814570426941, 0.72520911693573, 0.7967368364334106, 0.8682644963264465, 0.9397921562194824, 1.011319875717163, 1.0828474760055542, 1.1543751955032349, 1.225902795791626, 1.2974305152893066, 1.3689582347869873, 1.440485954284668, 1.512013554573059]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 8.0, 3.0, 8.0, 8.0, 9.0, 12.0, 16.0, 12.0, 19.0, 30.0, 40.0, 29.0, 38.0, 31.0, 32.0, 38.0, 40.0, 32.0, 47.0, 51.0, 48.0, 32.0, 48.0, 35.0, 38.0, 34.0, 29.0, 37.0, 30.0, 24.0, 35.0, 19.0, 22.0, 11.0, 8.0, 10.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.2433825731277466, -1.2091513872146606, -1.1749200820922852, -1.1406888961791992, -1.1064577102661133, -1.0722265243530273, -1.0379952192306519, -1.003764033317566, -0.96953284740448, -0.9353016018867493, -0.9010704159736633, -0.8668391704559326, -0.8326079845428467, -0.798376739025116, -0.7641454935073853, -0.7299143075942993, -0.6956830620765686, -0.6614518165588379, -0.627220630645752, -0.5929893851280212, -0.5587581992149353, -0.5245269536972046, -0.49029573798179626, -0.45606452226638794, -0.4218333065509796, -0.3876020908355713, -0.35337087512016296, -0.31913965940475464, -0.2849084138870239, -0.250677227973938, -0.21644598245620728, -0.18221476674079895, -0.1479836106300354, -0.11375239491462708, -0.07952117174863815, -0.04528994858264923, -0.011058732867240906, 0.02317248284816742, 0.05740371346473694, 0.09163492918014526, 0.1258661448955536, 0.16009736061096191, 0.19432857632637024, 0.22855980694293976, 0.2627910375595093, 0.2970222234725952, 0.3312534689903259, 0.36548468470573425, 0.3997159004211426, 0.4339471161365509, 0.46817833185195923, 0.5024095773696899, 0.5366407632827759, 0.5708720088005066, 0.6051032543182373, 0.6393344402313232, 0.6735656261444092, 0.7077968716621399, 0.7420280575752258, 0.7762593030929565, 0.8104904890060425, 0.8447217345237732, 0.8789529800415039, 0.9131841659545898, 0.9474154114723206]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 11.0, 9.0, 30.0, 29.0, 40.0, 57.0, 101.0, 155.0, 221.0, 440.0, 813.0, 1441.0, 3167.0, 7267.0, 18004.0, 47327.0, 122795.0, 265715.0, 309451.0, 163321.0, 65186.0, 24654.0, 10005.0, 4079.0, 1919.0, 939.0, 517.0, 290.0, 178.0, 112.0, 77.0, 56.0, 38.0, 31.0, 21.0, 9.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1484375, -1.1103668212890625, -1.072296142578125, -1.0342254638671875, -0.99615478515625, -0.9580841064453125, -0.920013427734375, -0.8819427490234375, -0.8438720703125, -0.8058013916015625, -0.767730712890625, -0.7296600341796875, -0.69158935546875, -0.6535186767578125, -0.615447998046875, -0.5773773193359375, -0.539306640625, -0.5012359619140625, -0.463165283203125, -0.4250946044921875, -0.38702392578125, -0.3489532470703125, -0.310882568359375, -0.2728118896484375, -0.2347412109375, -0.1966705322265625, -0.158599853515625, -0.1205291748046875, -0.08245849609375, -0.0443878173828125, -0.006317138671875, 0.0317535400390625, 0.06982421875, 0.1078948974609375, 0.145965576171875, 0.1840362548828125, 0.22210693359375, 0.2601776123046875, 0.298248291015625, 0.3363189697265625, 0.3743896484375, 0.4124603271484375, 0.450531005859375, 0.4886016845703125, 0.52667236328125, 0.5647430419921875, 0.602813720703125, 0.6408843994140625, 0.678955078125, 0.7170257568359375, 0.755096435546875, 0.7931671142578125, 0.83123779296875, 0.8693084716796875, 0.907379150390625, 0.9454498291015625, 0.9835205078125, 1.0215911865234375, 1.059661865234375, 1.0977325439453125, 1.13580322265625, 1.1738739013671875, 1.211944580078125, 1.2500152587890625, 1.2880859375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 11.0, 17.0, 26.0, 35.0, 37.0, 52.0, 76.0, 92.0, 83.0, 113.0, 92.0, 76.0, 70.0, 64.0, 43.0, 40.0, 29.0, 17.0, 13.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45556640625, -0.4437446594238281, -0.43192291259765625, -0.4201011657714844, -0.4082794189453125, -0.3964576721191406, -0.38463592529296875, -0.3728141784667969, -0.360992431640625, -0.3491706848144531, -0.33734893798828125, -0.3255271911621094, -0.3137054443359375, -0.3018836975097656, -0.29006195068359375, -0.2782402038574219, -0.26641845703125, -0.2545967102050781, -0.24277496337890625, -0.23095321655273438, -0.2191314697265625, -0.20730972290039062, -0.19548797607421875, -0.18366622924804688, -0.171844482421875, -0.16002273559570312, -0.14820098876953125, -0.13637924194335938, -0.1245574951171875, -0.11273574829101562, -0.10091400146484375, -0.08909225463867188, -0.0772705078125, -0.06544876098632812, -0.05362701416015625, -0.041805267333984375, -0.0299835205078125, -0.018161773681640625, -0.00634002685546875, 0.005481719970703125, 0.017303466796875, 0.029125213623046875, 0.04094696044921875, 0.052768707275390625, 0.0645904541015625, 0.07641220092773438, 0.08823394775390625, 0.10005569458007812, 0.11187744140625, 0.12369918823242188, 0.13552093505859375, 0.14734268188476562, 0.1591644287109375, 0.17098617553710938, 0.18280792236328125, 0.19462966918945312, 0.206451416015625, 0.21827316284179688, 0.23009490966796875, 0.24191665649414062, 0.2537384033203125, 0.2655601501464844, 0.27738189697265625, 0.2892036437988281, 0.301025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 4.0, 12.0, 17.0, 18.0, 22.0, 43.0, 56.0, 81.0, 94.0, 157.0, 235.0, 300.0, 463.0, 731.0, 1150.0, 2007.0, 4575.0, 10963.0, 29697.0, 82619.0, 199344.0, 319909.0, 232738.0, 100845.0, 37450.0, 13506.0, 5347.0, 2418.0, 1337.0, 802.0, 488.0, 337.0, 223.0, 153.0, 131.0, 75.0, 50.0, 49.0, 23.0, 26.0, 17.0, 12.0, 7.0, 9.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154296875, -1.118896484375, -1.08349609375, -1.048095703125, -1.0126953125, -0.977294921875, -0.94189453125, -0.906494140625, -0.87109375, -0.835693359375, -0.80029296875, -0.764892578125, -0.7294921875, -0.694091796875, -0.65869140625, -0.623291015625, -0.587890625, -0.552490234375, -0.51708984375, -0.481689453125, -0.4462890625, -0.410888671875, -0.37548828125, -0.340087890625, -0.3046875, -0.269287109375, -0.23388671875, -0.198486328125, -0.1630859375, -0.127685546875, -0.09228515625, -0.056884765625, -0.021484375, 0.013916015625, 0.04931640625, 0.084716796875, 0.1201171875, 0.155517578125, 0.19091796875, 0.226318359375, 0.26171875, 0.297119140625, 0.33251953125, 0.367919921875, 0.4033203125, 0.438720703125, 0.47412109375, 0.509521484375, 0.544921875, 0.580322265625, 0.61572265625, 0.651123046875, 0.6865234375, 0.721923828125, 0.75732421875, 0.792724609375, 0.828125, 0.863525390625, 0.89892578125, 0.934326171875, 0.9697265625, 1.005126953125, 1.04052734375, 1.075927734375, 1.111328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 11.0, 11.0, 10.0, 15.0, 15.0, 21.0, 20.0, 24.0, 35.0, 38.0, 36.0, 42.0, 47.0, 54.0, 55.0, 45.0, 51.0, 48.0, 39.0, 43.0, 46.0, 36.0, 36.0, 22.0, 43.0, 19.0, 27.0, 14.0, 18.0, 16.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.109375, -1.0761566162109375, -1.042938232421875, -1.0097198486328125, -0.97650146484375, -0.9432830810546875, -0.910064697265625, -0.8768463134765625, -0.8436279296875, -0.8104095458984375, -0.777191162109375, -0.7439727783203125, -0.71075439453125, -0.6775360107421875, -0.644317626953125, -0.6110992431640625, -0.577880859375, -0.5446624755859375, -0.511444091796875, -0.4782257080078125, -0.44500732421875, -0.4117889404296875, -0.378570556640625, -0.3453521728515625, -0.3121337890625, -0.2789154052734375, -0.245697021484375, -0.2124786376953125, -0.17926025390625, -0.1460418701171875, -0.112823486328125, -0.0796051025390625, -0.04638671875, -0.0131683349609375, 0.020050048828125, 0.0532684326171875, 0.08648681640625, 0.1197052001953125, 0.152923583984375, 0.1861419677734375, 0.2193603515625, 0.2525787353515625, 0.285797119140625, 0.3190155029296875, 0.35223388671875, 0.3854522705078125, 0.418670654296875, 0.4518890380859375, 0.485107421875, 0.5183258056640625, 0.551544189453125, 0.5847625732421875, 0.61798095703125, 0.6511993408203125, 0.684417724609375, 0.7176361083984375, 0.7508544921875, 0.7840728759765625, 0.817291259765625, 0.8505096435546875, 0.88372802734375, 0.9169464111328125, 0.950164794921875, 0.9833831787109375, 1.0166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 19.0, 31.0, 30.0, 91.0, 112.0, 239.0, 509.0, 1114.0, 3215.0, 10869.0, 45209.0, 254707.0, 558564.0, 136373.0, 26598.0, 6961.0, 2186.0, 885.0, 338.0, 199.0, 92.0, 53.0, 40.0, 26.0, 12.0, 8.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9879302978515625, -0.955352783203125, -0.9227752685546875, -0.89019775390625, -0.8576202392578125, -0.825042724609375, -0.7924652099609375, -0.7598876953125, -0.7273101806640625, -0.694732666015625, -0.6621551513671875, -0.62957763671875, -0.5970001220703125, -0.564422607421875, -0.5318450927734375, -0.499267578125, -0.4666900634765625, -0.434112548828125, -0.4015350341796875, -0.36895751953125, -0.3363800048828125, -0.303802490234375, -0.2712249755859375, -0.2386474609375, -0.2060699462890625, -0.173492431640625, -0.1409149169921875, -0.10833740234375, -0.0757598876953125, -0.043182373046875, -0.0106048583984375, 0.02197265625, 0.0545501708984375, 0.087127685546875, 0.1197052001953125, 0.15228271484375, 0.1848602294921875, 0.217437744140625, 0.2500152587890625, 0.2825927734375, 0.3151702880859375, 0.347747802734375, 0.3803253173828125, 0.41290283203125, 0.4454803466796875, 0.478057861328125, 0.5106353759765625, 0.543212890625, 0.5757904052734375, 0.608367919921875, 0.6409454345703125, 0.67352294921875, 0.7061004638671875, 0.738677978515625, 0.7712554931640625, 0.8038330078125, 0.8364105224609375, 0.868988037109375, 0.9015655517578125, 0.93414306640625, 0.9667205810546875, 0.999298095703125, 1.0318756103515625, 1.064453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 8.0, 5.0, 9.0, 11.0, 17.0, 19.0, 22.0, 34.0, 33.0, 36.0, 57.0, 55.0, 72.0, 67.0, 79.0, 75.0, 60.0, 71.0, 54.0, 45.0, 40.0, 23.0, 25.0, 18.0, 18.0, 10.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001302957534790039, -0.00012613646686077118, -0.00012197718024253845, -0.00011781789362430573, -0.000113658607006073, -0.00010949932038784027, -0.00010534003376960754, -0.00010118074715137482, -9.702146053314209e-05, -9.286217391490936e-05, -8.870288729667664e-05, -8.454360067844391e-05, -8.038431406021118e-05, -7.622502744197845e-05, -7.206574082374573e-05, -6.7906454205513e-05, -6.374716758728027e-05, -5.9587880969047546e-05, -5.542859435081482e-05, -5.126930773258209e-05, -4.7110021114349365e-05, -4.295073449611664e-05, -3.879144787788391e-05, -3.4632161259651184e-05, -3.0472874641418457e-05, -2.631358802318573e-05, -2.2154301404953003e-05, -1.7995014786720276e-05, -1.3835728168487549e-05, -9.676441550254822e-06, -5.517154932022095e-06, -1.3578683137893677e-06, 2.8014183044433594e-06, 6.9607049226760864e-06, 1.1119991540908813e-05, 1.527927815914154e-05, 1.9438564777374268e-05, 2.3597851395606995e-05, 2.775713801383972e-05, 3.191642463207245e-05, 3.6075711250305176e-05, 4.02349978685379e-05, 4.439428448677063e-05, 4.855357110500336e-05, 5.2712857723236084e-05, 5.687214434146881e-05, 6.103143095970154e-05, 6.519071757793427e-05, 6.935000419616699e-05, 7.350929081439972e-05, 7.766857743263245e-05, 8.182786405086517e-05, 8.59871506690979e-05, 9.014643728733063e-05, 9.430572390556335e-05, 9.846501052379608e-05, 0.00010262429714202881, 0.00010678358376026154, 0.00011094287037849426, 0.00011510215699672699, 0.00011926144361495972, 0.00012342073023319244, 0.00012758001685142517, 0.0001317393034696579, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 5.0, 6.0, 16.0, 16.0, 18.0, 32.0, 60.0, 80.0, 84.0, 141.0, 212.0, 387.0, 656.0, 1281.0, 2669.0, 6773.0, 19184.0, 65370.0, 293193.0, 479973.0, 127062.0, 32880.0, 10489.0, 3983.0, 1774.0, 909.0, 470.0, 279.0, 156.0, 115.0, 63.0, 50.0, 50.0, 28.0, 18.0, 17.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8330078125, -0.805450439453125, -0.77789306640625, -0.750335693359375, -0.7227783203125, -0.695220947265625, -0.66766357421875, -0.640106201171875, -0.612548828125, -0.584991455078125, -0.55743408203125, -0.529876708984375, -0.5023193359375, -0.474761962890625, -0.44720458984375, -0.419647216796875, -0.39208984375, -0.364532470703125, -0.33697509765625, -0.309417724609375, -0.2818603515625, -0.254302978515625, -0.22674560546875, -0.199188232421875, -0.171630859375, -0.144073486328125, -0.11651611328125, -0.088958740234375, -0.0614013671875, -0.033843994140625, -0.00628662109375, 0.021270751953125, 0.048828125, 0.076385498046875, 0.10394287109375, 0.131500244140625, 0.1590576171875, 0.186614990234375, 0.21417236328125, 0.241729736328125, 0.269287109375, 0.296844482421875, 0.32440185546875, 0.351959228515625, 0.3795166015625, 0.407073974609375, 0.43463134765625, 0.462188720703125, 0.48974609375, 0.517303466796875, 0.54486083984375, 0.572418212890625, 0.5999755859375, 0.627532958984375, 0.65509033203125, 0.682647705078125, 0.710205078125, 0.737762451171875, 0.76531982421875, 0.792877197265625, 0.8204345703125, 0.847991943359375, 0.87554931640625, 0.903106689453125, 0.9306640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 17.0, 13.0, 23.0, 15.0, 24.0, 17.0, 36.0, 44.0, 48.0, 55.0, 86.0, 74.0, 72.0, 66.0, 65.0, 45.0, 48.0, 40.0, 36.0, 17.0, 24.0, 19.0, 12.0, 9.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.455078125, -0.4395904541015625, -0.424102783203125, -0.4086151123046875, -0.39312744140625, -0.3776397705078125, -0.362152099609375, -0.3466644287109375, -0.3311767578125, -0.3156890869140625, -0.300201416015625, -0.2847137451171875, -0.26922607421875, -0.2537384033203125, -0.238250732421875, -0.2227630615234375, -0.207275390625, -0.1917877197265625, -0.176300048828125, -0.1608123779296875, -0.14532470703125, -0.1298370361328125, -0.114349365234375, -0.0988616943359375, -0.0833740234375, -0.0678863525390625, -0.052398681640625, -0.0369110107421875, -0.02142333984375, -0.0059356689453125, 0.009552001953125, 0.0250396728515625, 0.04052734375, 0.0560150146484375, 0.071502685546875, 0.0869903564453125, 0.10247802734375, 0.1179656982421875, 0.133453369140625, 0.1489410400390625, 0.1644287109375, 0.1799163818359375, 0.195404052734375, 0.2108917236328125, 0.22637939453125, 0.2418670654296875, 0.257354736328125, 0.2728424072265625, 0.288330078125, 0.3038177490234375, 0.319305419921875, 0.3347930908203125, 0.35028076171875, 0.3657684326171875, 0.381256103515625, 0.3967437744140625, 0.4122314453125, 0.4277191162109375, 0.443206787109375, 0.4586944580078125, 0.47418212890625, 0.4896697998046875, 0.505157470703125, 0.5206451416015625, 0.5361328125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 6.0, 20.0, 47.0, 68.0, 98.0, 171.0, 183.0, 142.0, 102.0, 66.0, 42.0, 20.0, 7.0, 9.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.496323585510254, -6.120082378387451, -5.743841171264648, -5.367599964141846, -4.991358757019043, -4.61511754989624, -4.2388763427734375, -3.8626351356506348, -3.486393928527832, -3.1101527214050293, -2.7339115142822266, -2.357670307159424, -1.981429100036621, -1.6051878929138184, -1.2289466857910156, -0.8527054786682129, -0.47646427154541016, -0.10022306442260742, 0.2760181427001953, 0.652259349822998, 1.0285005569458008, 1.4047417640686035, 1.7809829711914062, 2.157224178314209, 2.5334653854370117, 2.9097065925598145, 3.285947799682617, 3.66218900680542, 4.038430213928223, 4.414671421051025, 4.790912628173828, 5.167153835296631, 5.54339599609375, 5.919637203216553, 6.2958784103393555, 6.672119617462158, 7.048360824584961, 7.424602031707764, 7.800843238830566, 8.177083969116211, 8.553325653076172, 8.929567337036133, 9.305808067321777, 9.682048797607422, 10.058290481567383, 10.434532165527344, 10.810772895812988, 11.187013626098633, 11.563255310058594, 11.939496994018555, 12.3157377243042, 12.691978454589844, 13.068220138549805, 13.444461822509766, 13.82070255279541, 14.196943283081055, 14.573184967041016, 14.949426651000977, 15.325667381286621, 15.701908111572266, 16.078149795532227, 16.454391479492188, 16.830631256103516, 17.206872940063477, 17.583114624023438]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 5.0, 16.0, 17.0, 13.0, 13.0, 28.0, 32.0, 28.0, 27.0, 40.0, 43.0, 47.0, 52.0, 49.0, 51.0, 61.0, 40.0, 55.0, 42.0, 59.0, 46.0, 36.0, 36.0, 21.0, 27.0, 16.0, 23.0, 12.0, 11.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.030461311340332, -5.819243907928467, -5.608026504516602, -5.396809101104736, -5.185591697692871, -4.974374771118164, -4.763157367706299, -4.551939964294434, -4.340722560882568, -4.129505157470703, -3.918287754058838, -3.7070705890655518, -3.4958531856536865, -3.2846357822418213, -3.073418617248535, -2.86220121383667, -2.6509838104248047, -2.4397664070129395, -2.228549003601074, -2.017331838607788, -1.8061144351959229, -1.5948970317840576, -1.383679747581482, -1.1724624633789062, -0.961245059967041, -0.7500277161598206, -0.5388103723526001, -0.32759302854537964, -0.11637568473815918, 0.09484171867370605, 0.30605900287628174, 0.5172762870788574, 0.7284936904907227, 0.9397110342979431, 1.1509283781051636, 1.3621456623077393, 1.5733630657196045, 1.7845804691314697, 1.9957977533340454, 2.207015037536621, 2.4182324409484863, 2.6294498443603516, 2.840667247772217, 3.051884412765503, 3.263101816177368, 3.4743192195892334, 3.6855363845825195, 3.8967537879943848, 4.10797119140625, 4.319188594818115, 4.5304059982299805, 4.741623401641846, 4.952840805053711, 5.164057731628418, 5.375275135040283, 5.586492538452148, 5.797709941864014, 6.008927345275879, 6.220144748687744, 6.431362152099609, 6.642579078674316, 6.85379695892334, 7.065013885498047, 7.276231288909912, 7.487448692321777]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 12.0, 17.0, 26.0, 65.0, 147.0, 309.0, 1054.0, 4010.0, 21851.0, 330096.0, 3776728.0, 49994.0, 7322.0, 1772.0, 517.0, 174.0, 85.0, 47.0, 23.0, 18.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.49359130859375, -2.4110107421875, -2.32843017578125, -2.245849609375, -2.16326904296875, -2.0806884765625, -1.99810791015625, -1.91552734375, -1.83294677734375, -1.7503662109375, -1.66778564453125, -1.585205078125, -1.50262451171875, -1.4200439453125, -1.33746337890625, -1.2548828125, -1.17230224609375, -1.0897216796875, -1.00714111328125, -0.924560546875, -0.84197998046875, -0.7593994140625, -0.67681884765625, -0.59423828125, -0.51165771484375, -0.4290771484375, -0.34649658203125, -0.263916015625, -0.18133544921875, -0.0987548828125, -0.01617431640625, 0.06640625, 0.14898681640625, 0.2315673828125, 0.31414794921875, 0.396728515625, 0.47930908203125, 0.5618896484375, 0.64447021484375, 0.72705078125, 0.80963134765625, 0.8922119140625, 0.97479248046875, 1.057373046875, 1.13995361328125, 1.2225341796875, 1.30511474609375, 1.3876953125, 1.47027587890625, 1.5528564453125, 1.63543701171875, 1.718017578125, 1.80059814453125, 1.8831787109375, 1.96575927734375, 2.04833984375, 2.13092041015625, 2.2135009765625, 2.29608154296875, 2.378662109375, 2.46124267578125, 2.5438232421875, 2.62640380859375, 2.708984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 9.0, 13.0, 28.0, 26.0, 51.0, 51.0, 55.0, 91.0, 72.0, 75.0, 91.0, 73.0, 77.0, 70.0, 45.0, 43.0, 38.0, 34.0, 16.0, 13.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.412841796875, -0.4014015197753906, -0.38996124267578125, -0.3785209655761719, -0.3670806884765625, -0.3556404113769531, -0.34420013427734375, -0.3327598571777344, -0.321319580078125, -0.3098793029785156, -0.29843902587890625, -0.2869987487792969, -0.2755584716796875, -0.2641181945800781, -0.25267791748046875, -0.24123764038085938, -0.22979736328125, -0.21835708618164062, -0.20691680908203125, -0.19547653198242188, -0.1840362548828125, -0.17259597778320312, -0.16115570068359375, -0.14971542358398438, -0.138275146484375, -0.12683486938476562, -0.11539459228515625, -0.10395431518554688, -0.0925140380859375, -0.08107376098632812, -0.06963348388671875, -0.058193206787109375, -0.0467529296875, -0.035312652587890625, -0.02387237548828125, -0.012432098388671875, -0.0009918212890625, 0.010448455810546875, 0.02188873291015625, 0.033329010009765625, 0.044769287109375, 0.056209564208984375, 0.06764984130859375, 0.07909011840820312, 0.0905303955078125, 0.10197067260742188, 0.11341094970703125, 0.12485122680664062, 0.13629150390625, 0.14773178100585938, 0.15917205810546875, 0.17061233520507812, 0.1820526123046875, 0.19349288940429688, 0.20493316650390625, 0.21637344360351562, 0.227813720703125, 0.23925399780273438, 0.25069427490234375, 0.2621345520019531, 0.2735748291015625, 0.2850151062011719, 0.29645538330078125, 0.3078956604003906, 0.3193359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 12.0, 8.0, 15.0, 32.0, 43.0, 60.0, 94.0, 117.0, 233.0, 418.0, 692.0, 1327.0, 2817.0, 6235.0, 15738.0, 47997.0, 204635.0, 3059717.0, 703659.0, 102845.0, 28857.0, 10402.0, 4233.0, 1943.0, 977.0, 497.0, 289.0, 140.0, 82.0, 67.0, 34.0, 21.0, 16.0, 7.0, 14.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.322418212890625, -1.28546142578125, -1.248504638671875, -1.2115478515625, -1.174591064453125, -1.13763427734375, -1.100677490234375, -1.063720703125, -1.026763916015625, -0.98980712890625, -0.952850341796875, -0.9158935546875, -0.878936767578125, -0.84197998046875, -0.805023193359375, -0.76806640625, -0.731109619140625, -0.69415283203125, -0.657196044921875, -0.6202392578125, -0.583282470703125, -0.54632568359375, -0.509368896484375, -0.472412109375, -0.435455322265625, -0.39849853515625, -0.361541748046875, -0.3245849609375, -0.287628173828125, -0.25067138671875, -0.213714599609375, -0.1767578125, -0.139801025390625, -0.10284423828125, -0.065887451171875, -0.0289306640625, 0.008026123046875, 0.04498291015625, 0.081939697265625, 0.118896484375, 0.155853271484375, 0.19281005859375, 0.229766845703125, 0.2667236328125, 0.303680419921875, 0.34063720703125, 0.377593994140625, 0.41455078125, 0.451507568359375, 0.48846435546875, 0.525421142578125, 0.5623779296875, 0.599334716796875, 0.63629150390625, 0.673248291015625, 0.710205078125, 0.747161865234375, 0.78411865234375, 0.821075439453125, 0.8580322265625, 0.894989013671875, 0.93194580078125, 0.968902587890625, 1.005859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 13.0, 8.0, 9.0, 19.0, 27.0, 40.0, 51.0, 79.0, 96.0, 200.0, 323.0, 1243.0, 1057.0, 356.0, 173.0, 99.0, 65.0, 44.0, 47.0, 28.0, 14.0, 14.0, 14.0, 14.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.406005859375, -0.39531707763671875, -0.3846282958984375, -0.37393951416015625, -0.363250732421875, -0.35256195068359375, -0.3418731689453125, -0.33118438720703125, -0.32049560546875, -0.30980682373046875, -0.2991180419921875, -0.28842926025390625, -0.277740478515625, -0.26705169677734375, -0.2563629150390625, -0.24567413330078125, -0.2349853515625, -0.22429656982421875, -0.2136077880859375, -0.20291900634765625, -0.192230224609375, -0.18154144287109375, -0.1708526611328125, -0.16016387939453125, -0.14947509765625, -0.13878631591796875, -0.1280975341796875, -0.11740875244140625, -0.106719970703125, -0.09603118896484375, -0.0853424072265625, -0.07465362548828125, -0.06396484375, -0.05327606201171875, -0.0425872802734375, -0.03189849853515625, -0.021209716796875, -0.01052093505859375, 0.0001678466796875, 0.01085662841796875, 0.02154541015625, 0.03223419189453125, 0.0429229736328125, 0.05361175537109375, 0.064300537109375, 0.07498931884765625, 0.0856781005859375, 0.09636688232421875, 0.1070556640625, 0.11774444580078125, 0.1284332275390625, 0.13912200927734375, 0.149810791015625, 0.16049957275390625, 0.1711883544921875, 0.18187713623046875, 0.19256591796875, 0.20325469970703125, 0.2139434814453125, 0.22463226318359375, 0.235321044921875, 0.24600982666015625, 0.2566986083984375, 0.26738739013671875, 0.278076171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 12.0, 21.0, 63.0, 110.0, 178.0, 198.0, 185.0, 127.0, 56.0, 22.0, 19.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951761245727539, -3.834469795227051, -3.7171785831451416, -3.5998871326446533, -3.482595682144165, -3.365304470062256, -3.2480130195617676, -3.1307215690612793, -3.013430118560791, -2.8961386680603027, -2.7788474559783936, -2.6615560054779053, -2.544264554977417, -2.426973342895508, -2.3096818923950195, -2.1923904418945312, -2.075099229812622, -1.9578078985214233, -1.840516448020935, -1.7232251167297363, -1.605933666229248, -1.4886423349380493, -1.3713510036468506, -1.2540595531463623, -1.1367682218551636, -1.0194768905639648, -0.9021854400634766, -0.7848941087722778, -0.6676027178764343, -0.5503113269805908, -0.4330199956893921, -0.3157286047935486, -0.19843721389770508, -0.08114583790302277, 0.036145538091659546, 0.15343689918518066, 0.27072829008102417, 0.3880196809768677, 0.5053110122680664, 0.6226024031639099, 0.7398937940597534, 0.8571851849555969, 0.9744765758514404, 1.0917679071426392, 1.209059238433838, 1.3263506889343262, 1.443642020225525, 1.5609333515167236, 1.678224802017212, 1.7955161333084106, 1.912807583808899, 2.0300989151000977, 2.147390365600586, 2.264681816101074, 2.3819730281829834, 2.4992644786834717, 2.616555690765381, 2.733847141265869, 2.8511383533477783, 2.9684298038482666, 3.085721254348755, 3.203012466430664, 3.3203039169311523, 3.4375953674316406, 3.554886817932129]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 4.0, 10.0, 10.0, 4.0, 11.0, 8.0, 10.0, 20.0, 16.0, 18.0, 26.0, 27.0, 36.0, 39.0, 46.0, 39.0, 39.0, 51.0, 53.0, 45.0, 29.0, 38.0, 48.0, 41.0, 44.0, 28.0, 31.0, 27.0, 27.0, 32.0, 16.0, 16.0, 16.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 5.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0928044319152832, -1.0589731931686401, -1.025141954421997, -0.991310715675354, -0.9574794769287109, -0.9236482381820679, -0.8898169994354248, -0.8559857606887817, -0.8221545219421387, -0.7883232831954956, -0.7544920444488525, -0.7206608057022095, -0.6868295669555664, -0.6529983282089233, -0.6191670894622803, -0.5853358507156372, -0.5515046715736389, -0.5176734328269958, -0.4838421940803528, -0.4500109553337097, -0.41617971658706665, -0.3823484778404236, -0.3485172688961029, -0.31468603014945984, -0.2808547914028168, -0.2470235526561737, -0.21319231390953064, -0.17936109006404877, -0.1455298513174057, -0.11169861257076263, -0.07786738872528076, -0.044036149978637695, -0.010204911231994629, 0.02362632378935814, 0.05745755881071091, 0.09128879010677338, 0.12512002885341644, 0.1589512676000595, 0.19278249144554138, 0.22661373019218445, 0.2604449689388275, 0.2942762076854706, 0.32810744643211365, 0.3619386553764343, 0.3957698941230774, 0.42960113286972046, 0.4634323716163635, 0.4972636103630066, 0.5310948491096497, 0.5649260878562927, 0.5987573266029358, 0.6325885653495789, 0.6664198040962219, 0.700251042842865, 0.7340822219848633, 0.7679134607315063, 0.8017446994781494, 0.8355759382247925, 0.8694071769714355, 0.9032384157180786, 0.9370696544647217, 0.9709008932113647, 1.0047321319580078, 1.0385633707046509, 1.072394609451294]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 16.0, 26.0, 36.0, 73.0, 135.0, 203.0, 391.0, 834.0, 2002.0, 5618.0, 19281.0, 81853.0, 311548.0, 428725.0, 148940.0, 34606.0, 9004.0, 2970.0, 1148.0, 510.0, 243.0, 150.0, 88.0, 52.0, 38.0, 9.0, 16.0, 11.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.5965576171875, -1.543701171875, -1.4908447265625, -1.43798828125, -1.3851318359375, -1.332275390625, -1.2794189453125, -1.2265625, -1.1737060546875, -1.120849609375, -1.0679931640625, -1.01513671875, -0.9622802734375, -0.909423828125, -0.8565673828125, -0.8037109375, -0.7508544921875, -0.697998046875, -0.6451416015625, -0.59228515625, -0.5394287109375, -0.486572265625, -0.4337158203125, -0.380859375, -0.3280029296875, -0.275146484375, -0.2222900390625, -0.16943359375, -0.1165771484375, -0.063720703125, -0.0108642578125, 0.0419921875, 0.0948486328125, 0.147705078125, 0.2005615234375, 0.25341796875, 0.3062744140625, 0.359130859375, 0.4119873046875, 0.46484375, 0.5177001953125, 0.570556640625, 0.6234130859375, 0.67626953125, 0.7291259765625, 0.781982421875, 0.8348388671875, 0.8876953125, 0.9405517578125, 0.993408203125, 1.0462646484375, 1.09912109375, 1.1519775390625, 1.204833984375, 1.2576904296875, 1.310546875, 1.3634033203125, 1.416259765625, 1.4691162109375, 1.52197265625, 1.5748291015625, 1.627685546875, 1.6805419921875, 1.7333984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 18.0, 22.0, 33.0, 42.0, 56.0, 57.0, 52.0, 89.0, 79.0, 77.0, 89.0, 69.0, 67.0, 54.0, 41.0, 39.0, 30.0, 26.0, 17.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.408447265625, -0.397186279296875, -0.38592529296875, -0.374664306640625, -0.3634033203125, -0.352142333984375, -0.34088134765625, -0.329620361328125, -0.318359375, -0.307098388671875, -0.29583740234375, -0.284576416015625, -0.2733154296875, -0.262054443359375, -0.25079345703125, -0.239532470703125, -0.228271484375, -0.217010498046875, -0.20574951171875, -0.194488525390625, -0.1832275390625, -0.171966552734375, -0.16070556640625, -0.149444580078125, -0.13818359375, -0.126922607421875, -0.11566162109375, -0.104400634765625, -0.0931396484375, -0.081878662109375, -0.07061767578125, -0.059356689453125, -0.048095703125, -0.036834716796875, -0.02557373046875, -0.014312744140625, -0.0030517578125, 0.008209228515625, 0.01947021484375, 0.030731201171875, 0.0419921875, 0.053253173828125, 0.06451416015625, 0.075775146484375, 0.0870361328125, 0.098297119140625, 0.10955810546875, 0.120819091796875, 0.132080078125, 0.143341064453125, 0.15460205078125, 0.165863037109375, 0.1771240234375, 0.188385009765625, 0.19964599609375, 0.210906982421875, 0.22216796875, 0.233428955078125, 0.24468994140625, 0.255950927734375, 0.2672119140625, 0.278472900390625, 0.28973388671875, 0.300994873046875, 0.312255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 9.0, 4.0, 8.0, 15.0, 21.0, 33.0, 33.0, 43.0, 84.0, 115.0, 173.0, 233.0, 321.0, 497.0, 829.0, 1471.0, 3216.0, 8242.0, 25598.0, 90615.0, 280873.0, 391167.0, 170648.0, 49454.0, 14550.0, 4966.0, 2302.0, 1112.0, 631.0, 395.0, 272.0, 178.0, 122.0, 88.0, 66.0, 50.0, 27.0, 24.0, 13.0, 16.0, 16.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4208984375, -1.379425048828125, -1.33795166015625, -1.296478271484375, -1.2550048828125, -1.213531494140625, -1.17205810546875, -1.130584716796875, -1.089111328125, -1.047637939453125, -1.00616455078125, -0.964691162109375, -0.9232177734375, -0.881744384765625, -0.84027099609375, -0.798797607421875, -0.75732421875, -0.715850830078125, -0.67437744140625, -0.632904052734375, -0.5914306640625, -0.549957275390625, -0.50848388671875, -0.467010498046875, -0.425537109375, -0.384063720703125, -0.34259033203125, -0.301116943359375, -0.2596435546875, -0.218170166015625, -0.17669677734375, -0.135223388671875, -0.09375, -0.052276611328125, -0.01080322265625, 0.030670166015625, 0.0721435546875, 0.113616943359375, 0.15509033203125, 0.196563720703125, 0.238037109375, 0.279510498046875, 0.32098388671875, 0.362457275390625, 0.4039306640625, 0.445404052734375, 0.48687744140625, 0.528350830078125, 0.56982421875, 0.611297607421875, 0.65277099609375, 0.694244384765625, 0.7357177734375, 0.777191162109375, 0.81866455078125, 0.860137939453125, 0.901611328125, 0.943084716796875, 0.98455810546875, 1.026031494140625, 1.0675048828125, 1.108978271484375, 1.15045166015625, 1.191925048828125, 1.2333984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 8.0, 6.0, 2.0, 7.0, 7.0, 11.0, 6.0, 12.0, 18.0, 9.0, 19.0, 28.0, 23.0, 32.0, 39.0, 27.0, 38.0, 39.0, 32.0, 38.0, 44.0, 42.0, 33.0, 31.0, 40.0, 31.0, 37.0, 32.0, 27.0, 48.0, 32.0, 25.0, 20.0, 24.0, 20.0, 18.0, 19.0, 16.0, 9.0, 2.0, 11.0, 6.0, 6.0, 7.0, 9.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.94873046875, -0.9200515747070312, -0.8913726806640625, -0.8626937866210938, -0.834014892578125, -0.8053359985351562, -0.7766571044921875, -0.7479782104492188, -0.71929931640625, -0.6906204223632812, -0.6619415283203125, -0.6332626342773438, -0.604583740234375, -0.5759048461914062, -0.5472259521484375, -0.5185470581054688, -0.4898681640625, -0.46118927001953125, -0.4325103759765625, -0.40383148193359375, -0.375152587890625, -0.34647369384765625, -0.3177947998046875, -0.28911590576171875, -0.26043701171875, -0.23175811767578125, -0.2030792236328125, -0.17440032958984375, -0.145721435546875, -0.11704254150390625, -0.0883636474609375, -0.05968475341796875, -0.031005859375, -0.00232696533203125, 0.0263519287109375, 0.05503082275390625, 0.083709716796875, 0.11238861083984375, 0.1410675048828125, 0.16974639892578125, 0.19842529296875, 0.22710418701171875, 0.2557830810546875, 0.28446197509765625, 0.313140869140625, 0.34181976318359375, 0.3704986572265625, 0.39917755126953125, 0.4278564453125, 0.45653533935546875, 0.4852142333984375, 0.5138931274414062, 0.542572021484375, 0.5712509155273438, 0.5999298095703125, 0.6286087036132812, 0.65728759765625, 0.6859664916992188, 0.7146453857421875, 0.7433242797851562, 0.772003173828125, 0.8006820678710938, 0.8293609619140625, 0.8580398559570312, 0.88671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 8.0, 9.0, 13.0, 15.0, 16.0, 29.0, 40.0, 80.0, 130.0, 264.0, 549.0, 1459.0, 3983.0, 14047.0, 85369.0, 706357.0, 203444.0, 23237.0, 5927.0, 1989.0, 772.0, 336.0, 154.0, 96.0, 69.0, 56.0, 26.0, 14.0, 15.0, 9.0, 11.0, 10.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.34906005859375, -1.3035888671875, -1.25811767578125, -1.212646484375, -1.16717529296875, -1.1217041015625, -1.07623291015625, -1.03076171875, -0.98529052734375, -0.9398193359375, -0.89434814453125, -0.848876953125, -0.80340576171875, -0.7579345703125, -0.71246337890625, -0.6669921875, -0.62152099609375, -0.5760498046875, -0.53057861328125, -0.485107421875, -0.43963623046875, -0.3941650390625, -0.34869384765625, -0.30322265625, -0.25775146484375, -0.2122802734375, -0.16680908203125, -0.121337890625, -0.07586669921875, -0.0303955078125, 0.01507568359375, 0.060546875, 0.10601806640625, 0.1514892578125, 0.19696044921875, 0.242431640625, 0.28790283203125, 0.3333740234375, 0.37884521484375, 0.42431640625, 0.46978759765625, 0.5152587890625, 0.56072998046875, 0.606201171875, 0.65167236328125, 0.6971435546875, 0.74261474609375, 0.7880859375, 0.83355712890625, 0.8790283203125, 0.92449951171875, 0.969970703125, 1.01544189453125, 1.0609130859375, 1.10638427734375, 1.15185546875, 1.19732666015625, 1.2427978515625, 1.28826904296875, 1.333740234375, 1.37921142578125, 1.4246826171875, 1.47015380859375, 1.515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 4.0, 12.0, 25.0, 13.0, 34.0, 40.0, 73.0, 71.0, 92.0, 111.0, 110.0, 88.0, 85.0, 52.0, 49.0, 36.0, 21.0, 13.0, 21.0, 7.0, 8.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001437664031982422, -0.0001380518078804016, -0.00013233721256256104, -0.00012662261724472046, -0.00012090802192687988, -0.0001151934266090393, -0.00010947883129119873, -0.00010376423597335815, -9.804964065551758e-05, -9.2335045337677e-05, -8.662045001983643e-05, -8.090585470199585e-05, -7.519125938415527e-05, -6.94766640663147e-05, -6.376206874847412e-05, -5.8047473430633545e-05, -5.233287811279297e-05, -4.661828279495239e-05, -4.0903687477111816e-05, -3.518909215927124e-05, -2.9474496841430664e-05, -2.3759901523590088e-05, -1.8045306205749512e-05, -1.2330710887908936e-05, -6.616115570068359e-06, -9.015202522277832e-07, 4.813075065612793e-06, 1.0527670383453369e-05, 1.6242265701293945e-05, 2.195686101913452e-05, 2.7671456336975098e-05, 3.3386051654815674e-05, 3.910064697265625e-05, 4.4815242290496826e-05, 5.05298376083374e-05, 5.624443292617798e-05, 6.195902824401855e-05, 6.767362356185913e-05, 7.338821887969971e-05, 7.910281419754028e-05, 8.481740951538086e-05, 9.053200483322144e-05, 9.624660015106201e-05, 0.00010196119546890259, 0.00010767579078674316, 0.00011339038610458374, 0.00011910498142242432, 0.0001248195767402649, 0.00013053417205810547, 0.00013624876737594604, 0.00014196336269378662, 0.0001476779580116272, 0.00015339255332946777, 0.00015910714864730835, 0.00016482174396514893, 0.0001705363392829895, 0.00017625093460083008, 0.00018196552991867065, 0.00018768012523651123, 0.0001933947205543518, 0.00019910931587219238, 0.00020482391119003296, 0.00021053850650787354, 0.0002162531018257141, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 2.0, 14.0, 20.0, 46.0, 30.0, 55.0, 120.0, 267.0, 650.0, 1746.0, 5854.0, 35612.0, 795009.0, 189977.0, 14078.0, 3157.0, 1025.0, 427.0, 184.0, 107.0, 66.0, 32.0, 17.0, 16.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8284454345703125, -1.757476806640625, -1.6865081787109375, -1.61553955078125, -1.5445709228515625, -1.473602294921875, -1.4026336669921875, -1.3316650390625, -1.2606964111328125, -1.189727783203125, -1.1187591552734375, -1.04779052734375, -0.9768218994140625, -0.905853271484375, -0.8348846435546875, -0.763916015625, -0.6929473876953125, -0.621978759765625, -0.5510101318359375, -0.48004150390625, -0.4090728759765625, -0.338104248046875, -0.2671356201171875, -0.1961669921875, -0.1251983642578125, -0.054229736328125, 0.0167388916015625, 0.08770751953125, 0.1586761474609375, 0.229644775390625, 0.3006134033203125, 0.37158203125, 0.4425506591796875, 0.513519287109375, 0.5844879150390625, 0.65545654296875, 0.7264251708984375, 0.797393798828125, 0.8683624267578125, 0.9393310546875, 1.0102996826171875, 1.081268310546875, 1.1522369384765625, 1.22320556640625, 1.2941741943359375, 1.365142822265625, 1.4361114501953125, 1.507080078125, 1.5780487060546875, 1.649017333984375, 1.7199859619140625, 1.79095458984375, 1.8619232177734375, 1.932891845703125, 2.0038604736328125, 2.0748291015625, 2.1457977294921875, 2.216766357421875, 2.2877349853515625, 2.35870361328125, 2.4296722412109375, 2.500640869140625, 2.5716094970703125, 2.642578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 7.0, 7.0, 27.0, 51.0, 55.0, 117.0, 145.0, 161.0, 140.0, 96.0, 49.0, 39.0, 36.0, 16.0, 11.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.94219970703125, -0.9078369140625, -0.87347412109375, -0.839111328125, -0.80474853515625, -0.7703857421875, -0.73602294921875, -0.70166015625, -0.66729736328125, -0.6329345703125, -0.59857177734375, -0.564208984375, -0.52984619140625, -0.4954833984375, -0.46112060546875, -0.4267578125, -0.39239501953125, -0.3580322265625, -0.32366943359375, -0.289306640625, -0.25494384765625, -0.2205810546875, -0.18621826171875, -0.15185546875, -0.11749267578125, -0.0831298828125, -0.04876708984375, -0.014404296875, 0.01995849609375, 0.0543212890625, 0.08868408203125, 0.123046875, 0.15740966796875, 0.1917724609375, 0.22613525390625, 0.260498046875, 0.29486083984375, 0.3292236328125, 0.36358642578125, 0.39794921875, 0.43231201171875, 0.4666748046875, 0.50103759765625, 0.535400390625, 0.56976318359375, 0.6041259765625, 0.63848876953125, 0.6728515625, 0.70721435546875, 0.7415771484375, 0.77593994140625, 0.810302734375, 0.84466552734375, 0.8790283203125, 0.91339111328125, 0.94775390625, 0.98211669921875, 1.0164794921875, 1.05084228515625, 1.085205078125, 1.11956787109375, 1.1539306640625, 1.18829345703125, 1.22265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 17.0, 31.0, 68.0, 95.0, 161.0, 153.0, 156.0, 153.0, 76.0, 43.0, 22.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.84821319580078, -18.425582885742188, -18.002952575683594, -17.580322265625, -17.157691955566406, -16.735061645507812, -16.31243133544922, -15.889801979064941, -15.467171669006348, -15.044541358947754, -14.62191104888916, -14.199280738830566, -13.776651382446289, -13.354021072387695, -12.931390762329102, -12.508760452270508, -12.086130142211914, -11.66349983215332, -11.240869522094727, -10.818239212036133, -10.395608901977539, -9.972978591918945, -9.550349235534668, -9.127718925476074, -8.70508861541748, -8.282458305358887, -7.859827995300293, -7.437198162078857, -7.014567852020264, -6.59193754196167, -6.169307708740234, -5.746677398681641, -5.324047088623047, -4.901416778564453, -4.478786468505859, -4.056156635284424, -3.63352632522583, -3.2108960151672363, -2.7882659435272217, -2.365635871887207, -1.9430055618286133, -1.520375370979309, -1.0977451801300049, -0.6751149892807007, -0.2524847984313965, 0.17014551162719727, 0.5927755832672119, 1.0154056549072266, 1.4380359649658203, 1.8606661558151245, 2.2832963466644287, 2.7059264183044434, 3.128556728363037, 3.551187038421631, 3.9738171100616455, 4.39644718170166, 4.819077491760254, 5.241707801818848, 5.664338111877441, 6.086967945098877, 6.509598255157471, 6.9322285652160645, 7.3548583984375, 7.777488708496094, 8.200119018554688]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 11.0, 12.0, 10.0, 10.0, 19.0, 17.0, 19.0, 16.0, 16.0, 33.0, 25.0, 30.0, 36.0, 37.0, 38.0, 34.0, 45.0, 35.0, 50.0, 37.0, 36.0, 55.0, 38.0, 35.0, 37.0, 40.0, 34.0, 21.0, 28.0, 29.0, 19.0, 15.0, 19.0, 12.0, 6.0, 9.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.233152866363525, -6.054147720336914, -5.875142574310303, -5.696137428283691, -5.51713228225708, -5.338127136230469, -5.159121990203857, -4.980116844177246, -4.801111698150635, -4.622106552124023, -4.443101406097412, -4.264096260070801, -4.0850911140441895, -3.906085968017578, -3.727080821990967, -3.5480756759643555, -3.369070291519165, -3.1900651454925537, -3.0110599994659424, -2.832054853439331, -2.6530497074127197, -2.4740445613861084, -2.295039176940918, -2.1160340309143066, -1.9370290040969849, -1.7580238580703735, -1.5790187120437622, -1.4000134468078613, -1.22100830078125, -1.0420031547546387, -0.8629980087280273, -0.683992862701416, -0.5049877166748047, -0.32598257064819336, -0.14697739481925964, 0.03202778100967407, 0.2110329270362854, 0.39003807306289673, 0.5690432786941528, 0.7480484247207642, 0.9270535707473755, 1.1060587167739868, 1.2850638628005981, 1.464069128036499, 1.6430742740631104, 1.8220794200897217, 2.001084566116333, 2.1800897121429443, 2.3590948581695557, 2.538100004196167, 2.7171051502227783, 2.8961102962493896, 3.075115442276001, 3.2541205883026123, 3.4331259727478027, 3.612131118774414, 3.7911362648010254, 3.9701414108276367, 4.149146556854248, 4.328151702880859, 4.507156848907471, 4.686161994934082, 4.865167140960693, 5.044172286987305, 5.223177433013916]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 4.0, 12.0, 7.0, 16.0, 26.0, 31.0, 51.0, 86.0, 137.0, 275.0, 554.0, 1214.0, 2846.0, 7906.0, 26393.0, 120730.0, 2762850.0, 1140700.0, 96234.0, 22386.0, 7031.0, 2532.0, 1097.0, 525.0, 274.0, 138.0, 85.0, 39.0, 30.0, 16.0, 16.0, 9.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2464447021484375, -1.204803466796875, -1.1631622314453125, -1.12152099609375, -1.0798797607421875, -1.038238525390625, -0.9965972900390625, -0.9549560546875, -0.9133148193359375, -0.871673583984375, -0.8300323486328125, -0.78839111328125, -0.7467498779296875, -0.705108642578125, -0.6634674072265625, -0.621826171875, -0.5801849365234375, -0.538543701171875, -0.4969024658203125, -0.45526123046875, -0.4136199951171875, -0.371978759765625, -0.3303375244140625, -0.2886962890625, -0.2470550537109375, -0.205413818359375, -0.1637725830078125, -0.12213134765625, -0.0804901123046875, -0.038848876953125, 0.0027923583984375, 0.04443359375, 0.0860748291015625, 0.127716064453125, 0.1693572998046875, 0.21099853515625, 0.2526397705078125, 0.294281005859375, 0.3359222412109375, 0.3775634765625, 0.4192047119140625, 0.460845947265625, 0.5024871826171875, 0.54412841796875, 0.5857696533203125, 0.627410888671875, 0.6690521240234375, 0.710693359375, 0.7523345947265625, 0.793975830078125, 0.8356170654296875, 0.87725830078125, 0.9188995361328125, 0.960540771484375, 1.0021820068359375, 1.0438232421875, 1.0854644775390625, 1.127105712890625, 1.1687469482421875, 1.21038818359375, 1.2520294189453125, 1.293670654296875, 1.3353118896484375, 1.376953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 22.0, 32.0, 52.0, 52.0, 64.0, 66.0, 79.0, 96.0, 85.0, 81.0, 75.0, 69.0, 42.0, 39.0, 33.0, 27.0, 20.0, 18.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424072265625, -0.4115715026855469, -0.39907073974609375, -0.3865699768066406, -0.3740692138671875, -0.3615684509277344, -0.34906768798828125, -0.3365669250488281, -0.324066162109375, -0.3115653991699219, -0.29906463623046875, -0.2865638732910156, -0.2740631103515625, -0.2615623474121094, -0.24906158447265625, -0.23656082153320312, -0.22406005859375, -0.21155929565429688, -0.19905853271484375, -0.18655776977539062, -0.1740570068359375, -0.16155624389648438, -0.14905548095703125, -0.13655471801757812, -0.124053955078125, -0.11155319213867188, -0.09905242919921875, -0.08655166625976562, -0.0740509033203125, -0.061550140380859375, -0.04904937744140625, -0.036548614501953125, -0.0240478515625, -0.011547088623046875, 0.00095367431640625, 0.013454437255859375, 0.0259552001953125, 0.038455963134765625, 0.05095672607421875, 0.06345748901367188, 0.075958251953125, 0.08845901489257812, 0.10095977783203125, 0.11346054077148438, 0.1259613037109375, 0.13846206665039062, 0.15096282958984375, 0.16346359252929688, 0.17596435546875, 0.18846511840820312, 0.20096588134765625, 0.21346664428710938, 0.2259674072265625, 0.23846817016601562, 0.25096893310546875, 0.2634696960449219, 0.275970458984375, 0.2884712219238281, 0.30097198486328125, 0.3134727478027344, 0.3259735107421875, 0.3384742736816406, 0.35097503662109375, 0.3634757995605469, 0.3759765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 7.0, 9.0, 9.0, 10.0, 14.0, 22.0, 26.0, 36.0, 51.0, 75.0, 130.0, 166.0, 292.0, 438.0, 975.0, 1872.0, 3891.0, 9496.0, 25246.0, 83669.0, 391900.0, 2925274.0, 587899.0, 110828.0, 31409.0, 11265.0, 4698.0, 2129.0, 1031.0, 534.0, 323.0, 193.0, 104.0, 95.0, 64.0, 24.0, 25.0, 10.0, 13.0, 11.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9555892944335938, -0.9243621826171875, -0.8931350708007812, -0.861907958984375, -0.8306808471679688, -0.7994537353515625, -0.7682266235351562, -0.73699951171875, -0.7057723999023438, -0.6745452880859375, -0.6433181762695312, -0.612091064453125, -0.5808639526367188, -0.5496368408203125, -0.5184097290039062, -0.4871826171875, -0.45595550537109375, -0.4247283935546875, -0.39350128173828125, -0.362274169921875, -0.33104705810546875, -0.2998199462890625, -0.26859283447265625, -0.23736572265625, -0.20613861083984375, -0.1749114990234375, -0.14368438720703125, -0.112457275390625, -0.08123016357421875, -0.0500030517578125, -0.01877593994140625, 0.012451171875, 0.04367828369140625, 0.0749053955078125, 0.10613250732421875, 0.137359619140625, 0.16858673095703125, 0.1998138427734375, 0.23104095458984375, 0.26226806640625, 0.29349517822265625, 0.3247222900390625, 0.35594940185546875, 0.387176513671875, 0.41840362548828125, 0.4496307373046875, 0.48085784912109375, 0.5120849609375, 0.5433120727539062, 0.5745391845703125, 0.6057662963867188, 0.636993408203125, 0.6682205200195312, 0.6994476318359375, 0.7306747436523438, 0.76190185546875, 0.7931289672851562, 0.8243560791015625, 0.8555831909179688, 0.886810302734375, 0.9180374145507812, 0.9492645263671875, 0.9804916381835938, 1.01171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 24.0, 16.0, 19.0, 36.0, 74.0, 82.0, 144.0, 223.0, 402.0, 990.0, 1021.0, 394.0, 243.0, 152.0, 70.0, 53.0, 33.0, 21.0, 14.0, 19.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5767669677734375, -0.560272216796875, -0.5437774658203125, -0.52728271484375, -0.5107879638671875, -0.494293212890625, -0.4777984619140625, -0.4613037109375, -0.4448089599609375, -0.428314208984375, -0.4118194580078125, -0.39532470703125, -0.3788299560546875, -0.362335205078125, -0.3458404541015625, -0.329345703125, -0.3128509521484375, -0.296356201171875, -0.2798614501953125, -0.26336669921875, -0.2468719482421875, -0.230377197265625, -0.2138824462890625, -0.1973876953125, -0.1808929443359375, -0.164398193359375, -0.1479034423828125, -0.13140869140625, -0.1149139404296875, -0.098419189453125, -0.0819244384765625, -0.0654296875, -0.0489349365234375, -0.032440185546875, -0.0159454345703125, 0.00054931640625, 0.0170440673828125, 0.033538818359375, 0.0500335693359375, 0.0665283203125, 0.0830230712890625, 0.099517822265625, 0.1160125732421875, 0.13250732421875, 0.1490020751953125, 0.165496826171875, 0.1819915771484375, 0.198486328125, 0.2149810791015625, 0.231475830078125, 0.2479705810546875, 0.26446533203125, 0.2809600830078125, 0.297454833984375, 0.3139495849609375, 0.3304443359375, 0.3469390869140625, 0.363433837890625, 0.3799285888671875, 0.39642333984375, 0.4129180908203125, 0.429412841796875, 0.4459075927734375, 0.46240234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 17.0, 27.0, 38.0, 57.0, 92.0, 86.0, 100.0, 111.0, 96.0, 97.0, 69.0, 55.0, 30.0, 34.0, 24.0, 20.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7610864639282227, -2.670240640640259, -2.579395055770874, -2.48854923248291, -2.3977034091949463, -2.3068578243255615, -2.2160120010375977, -2.125166416168213, -2.034320592880249, -1.9434748888015747, -1.8526290655136108, -1.7617833614349365, -1.6709376573562622, -1.580091953277588, -1.489246129989624, -1.3984004259109497, -1.3075546026229858, -1.2167088985443115, -1.1258630752563477, -1.0350173711776733, -0.944171667098999, -0.8533259034156799, -0.7624801397323608, -0.6716344356536865, -0.5807886719703674, -0.4899429380893707, -0.399097204208374, -0.30825144052505493, -0.21740570664405823, -0.12655997276306152, -0.03571420907974243, 0.055131494998931885, 0.14597725868225098, 0.23682299256324768, 0.3276687264442444, 0.4185144901275635, 0.5093601942062378, 0.6002059578895569, 0.691051721572876, 0.7818974256515503, 0.8727431893348694, 0.9635889530181885, 1.0544346570968628, 1.145280361175537, 1.236126184463501, 1.3269718885421753, 1.4178175926208496, 1.5086634159088135, 1.5995091199874878, 1.690354824066162, 1.781200647354126, 1.8720463514328003, 1.9628920555114746, 2.0537378787994385, 2.1445837020874023, 2.235429286956787, 2.326275110244751, 2.417120933532715, 2.5079665184020996, 2.5988123416900635, 2.6896581649780273, 2.780503749847412, 2.871349573135376, 2.96219539642334, 3.0530409812927246]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 11.0, 10.0, 13.0, 10.0, 20.0, 22.0, 26.0, 23.0, 36.0, 31.0, 42.0, 42.0, 47.0, 51.0, 36.0, 42.0, 36.0, 45.0, 51.0, 37.0, 47.0, 38.0, 33.0, 36.0, 31.0, 30.0, 30.0, 25.0, 17.0, 17.0, 12.0, 13.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6502515077590942, -1.5969529151916504, -1.543654203414917, -1.4903556108474731, -1.4370570182800293, -1.383758306503296, -1.330459713935852, -1.2771611213684082, -1.2238624095916748, -1.170563817024231, -1.1172651052474976, -1.0639665126800537, -1.0106678009033203, -0.9573692083358765, -0.9040706157684326, -0.850771963596344, -0.7974733114242554, -0.7441746592521667, -0.6908760070800781, -0.6375774145126343, -0.5842787623405457, -0.530980110168457, -0.4776814877986908, -0.42438286542892456, -0.37108421325683594, -0.3177855610847473, -0.2644869387149811, -0.21118830144405365, -0.15788966417312622, -0.1045910120010376, -0.05129238963127136, 0.002006232738494873, 0.05530500411987305, 0.10860364139080048, 0.1619022786617279, 0.21520091593265533, 0.26849955320358276, 0.3217982053756714, 0.3750968277454376, 0.42839545011520386, 0.4816941022872925, 0.5349927544593811, 0.5882914066314697, 0.6415899991989136, 0.6948886513710022, 0.7481873035430908, 0.8014858961105347, 0.8547845482826233, 0.9080832004547119, 0.9613818526268005, 1.0146805047988892, 1.067979097366333, 1.1212778091430664, 1.1745764017105103, 1.227874994277954, 1.2811737060546875, 1.3344722986221313, 1.3877708911895752, 1.4410696029663086, 1.4943681955337524, 1.5476667881011963, 1.6009654998779297, 1.6542640924453735, 1.7075626850128174, 1.7608613967895508]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 14.0, 19.0, 30.0, 55.0, 98.0, 119.0, 258.0, 508.0, 1075.0, 2449.0, 6559.0, 19363.0, 61498.0, 195086.0, 425434.0, 228441.0, 72372.0, 22356.0, 7528.0, 2755.0, 1224.0, 581.0, 289.0, 151.0, 102.0, 68.0, 34.0, 26.0, 10.0, 6.0, 18.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.5949859619140625, -1.544464111328125, -1.4939422607421875, -1.44342041015625, -1.3928985595703125, -1.342376708984375, -1.2918548583984375, -1.2413330078125, -1.1908111572265625, -1.140289306640625, -1.0897674560546875, -1.03924560546875, -0.9887237548828125, -0.938201904296875, -0.8876800537109375, -0.837158203125, -0.7866363525390625, -0.736114501953125, -0.6855926513671875, -0.63507080078125, -0.5845489501953125, -0.534027099609375, -0.4835052490234375, -0.4329833984375, -0.3824615478515625, -0.331939697265625, -0.2814178466796875, -0.23089599609375, -0.1803741455078125, -0.129852294921875, -0.0793304443359375, -0.02880859375, 0.0217132568359375, 0.072235107421875, 0.1227569580078125, 0.17327880859375, 0.2238006591796875, 0.274322509765625, 0.3248443603515625, 0.3753662109375, 0.4258880615234375, 0.476409912109375, 0.5269317626953125, 0.57745361328125, 0.6279754638671875, 0.678497314453125, 0.7290191650390625, 0.779541015625, 0.8300628662109375, 0.880584716796875, 0.9311065673828125, 0.98162841796875, 1.0321502685546875, 1.082672119140625, 1.1331939697265625, 1.1837158203125, 1.2342376708984375, 1.284759521484375, 1.3352813720703125, 1.38580322265625, 1.4363250732421875, 1.486846923828125, 1.5373687744140625, 1.587890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 7.0, 16.0, 22.0, 28.0, 58.0, 52.0, 58.0, 79.0, 70.0, 98.0, 99.0, 81.0, 60.0, 59.0, 54.0, 40.0, 38.0, 33.0, 13.0, 6.0, 13.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.3940162658691406, -0.38129425048828125, -0.3685722351074219, -0.3558502197265625, -0.3431282043457031, -0.33040618896484375, -0.3176841735839844, -0.304962158203125, -0.2922401428222656, -0.27951812744140625, -0.2667961120605469, -0.2540740966796875, -0.24135208129882812, -0.22863006591796875, -0.21590805053710938, -0.20318603515625, -0.19046401977539062, -0.17774200439453125, -0.16501998901367188, -0.1522979736328125, -0.13957595825195312, -0.12685394287109375, -0.11413192749023438, -0.101409912109375, -0.08868789672851562, -0.07596588134765625, -0.06324386596679688, -0.0505218505859375, -0.037799835205078125, -0.02507781982421875, -0.012355804443359375, 0.0003662109375, 0.013088226318359375, 0.02581024169921875, 0.038532257080078125, 0.0512542724609375, 0.06397628784179688, 0.07669830322265625, 0.08942031860351562, 0.102142333984375, 0.11486434936523438, 0.12758636474609375, 0.14030838012695312, 0.1530303955078125, 0.16575241088867188, 0.17847442626953125, 0.19119644165039062, 0.20391845703125, 0.21664047241210938, 0.22936248779296875, 0.24208450317382812, 0.2548065185546875, 0.2675285339355469, 0.28025054931640625, 0.2929725646972656, 0.305694580078125, 0.3184165954589844, 0.33113861083984375, 0.3438606262207031, 0.3565826416015625, 0.3693046569824219, 0.38202667236328125, 0.3947486877441406, 0.407470703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 16.0, 15.0, 24.0, 32.0, 52.0, 52.0, 104.0, 164.0, 264.0, 420.0, 749.0, 1283.0, 2579.0, 5942.0, 15007.0, 41684.0, 117838.0, 288027.0, 335637.0, 150840.0, 53997.0, 19329.0, 7430.0, 3259.0, 1616.0, 798.0, 499.0, 303.0, 182.0, 129.0, 81.0, 48.0, 39.0, 18.0, 16.0, 18.0, 6.0, 9.0, 11.0, 5.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.3837890625, -1.3474960327148438, -1.3112030029296875, -1.2749099731445312, -1.238616943359375, -1.2023239135742188, -1.1660308837890625, -1.1297378540039062, -1.09344482421875, -1.0571517944335938, -1.0208587646484375, -0.9845657348632812, -0.948272705078125, -0.9119796752929688, -0.8756866455078125, -0.8393936157226562, -0.8031005859375, -0.7668075561523438, -0.7305145263671875, -0.6942214965820312, -0.657928466796875, -0.6216354370117188, -0.5853424072265625, -0.5490493774414062, -0.51275634765625, -0.47646331787109375, -0.4401702880859375, -0.40387725830078125, -0.367584228515625, -0.33129119873046875, -0.2949981689453125, -0.25870513916015625, -0.222412109375, -0.18611907958984375, -0.1498260498046875, -0.11353302001953125, -0.077239990234375, -0.04094696044921875, -0.0046539306640625, 0.03163909912109375, 0.06793212890625, 0.10422515869140625, 0.1405181884765625, 0.17681121826171875, 0.213104248046875, 0.24939727783203125, 0.2856903076171875, 0.32198333740234375, 0.3582763671875, 0.39456939697265625, 0.4308624267578125, 0.46715545654296875, 0.503448486328125, 0.5397415161132812, 0.5760345458984375, 0.6123275756835938, 0.64862060546875, 0.6849136352539062, 0.7212066650390625, 0.7574996948242188, 0.793792724609375, 0.8300857543945312, 0.8663787841796875, 0.9026718139648438, 0.93896484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 14.0, 17.0, 14.0, 16.0, 16.0, 25.0, 27.0, 26.0, 31.0, 31.0, 38.0, 35.0, 45.0, 43.0, 43.0, 51.0, 46.0, 46.0, 37.0, 36.0, 50.0, 28.0, 26.0, 45.0, 25.0, 33.0, 23.0, 19.0, 22.0, 15.0, 13.0, 12.0, 5.0, 6.0, 3.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.98828125, -0.9542083740234375, -0.920135498046875, -0.8860626220703125, -0.85198974609375, -0.8179168701171875, -0.783843994140625, -0.7497711181640625, -0.7156982421875, -0.6816253662109375, -0.647552490234375, -0.6134796142578125, -0.57940673828125, -0.5453338623046875, -0.511260986328125, -0.4771881103515625, -0.443115234375, -0.4090423583984375, -0.374969482421875, -0.3408966064453125, -0.30682373046875, -0.2727508544921875, -0.238677978515625, -0.2046051025390625, -0.1705322265625, -0.1364593505859375, -0.102386474609375, -0.0683135986328125, -0.03424072265625, -0.0001678466796875, 0.033905029296875, 0.0679779052734375, 0.10205078125, 0.1361236572265625, 0.170196533203125, 0.2042694091796875, 0.23834228515625, 0.2724151611328125, 0.306488037109375, 0.3405609130859375, 0.3746337890625, 0.4087066650390625, 0.442779541015625, 0.4768524169921875, 0.51092529296875, 0.5449981689453125, 0.579071044921875, 0.6131439208984375, 0.647216796875, 0.6812896728515625, 0.715362548828125, 0.7494354248046875, 0.78350830078125, 0.8175811767578125, 0.851654052734375, 0.8857269287109375, 0.9197998046875, 0.9538726806640625, 0.987945556640625, 1.0220184326171875, 1.05609130859375, 1.0901641845703125, 1.124237060546875, 1.1583099365234375, 1.1923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 5.0, 22.0, 35.0, 27.0, 73.0, 130.0, 205.0, 423.0, 925.0, 2286.0, 6236.0, 20784.0, 93930.0, 473208.0, 362043.0, 64524.0, 15349.0, 4989.0, 1750.0, 765.0, 374.0, 187.0, 104.0, 54.0, 31.0, 31.0, 16.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.97503662109375, -0.9412841796875, -0.90753173828125, -0.873779296875, -0.84002685546875, -0.8062744140625, -0.77252197265625, -0.73876953125, -0.70501708984375, -0.6712646484375, -0.63751220703125, -0.603759765625, -0.57000732421875, -0.5362548828125, -0.50250244140625, -0.46875, -0.43499755859375, -0.4012451171875, -0.36749267578125, -0.333740234375, -0.29998779296875, -0.2662353515625, -0.23248291015625, -0.19873046875, -0.16497802734375, -0.1312255859375, -0.09747314453125, -0.063720703125, -0.02996826171875, 0.0037841796875, 0.03753662109375, 0.0712890625, 0.10504150390625, 0.1387939453125, 0.17254638671875, 0.206298828125, 0.24005126953125, 0.2738037109375, 0.30755615234375, 0.34130859375, 0.37506103515625, 0.4088134765625, 0.44256591796875, 0.476318359375, 0.51007080078125, 0.5438232421875, 0.57757568359375, 0.611328125, 0.64508056640625, 0.6788330078125, 0.71258544921875, 0.746337890625, 0.78009033203125, 0.8138427734375, 0.84759521484375, 0.88134765625, 0.91510009765625, 0.9488525390625, 0.98260498046875, 1.016357421875, 1.05010986328125, 1.0838623046875, 1.11761474609375, 1.1513671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 14.0, 10.0, 20.0, 18.0, 27.0, 44.0, 73.0, 70.0, 103.0, 127.0, 127.0, 89.0, 83.0, 53.0, 36.0, 27.0, 17.0, 15.0, 10.0, 11.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016808509826660156, -0.00016077235341072083, -0.0001534596085548401, -0.00014614686369895935, -0.0001388341188430786, -0.00013152137398719788, -0.00012420862913131714, -0.0001168958842754364, -0.00010958313941955566, -0.00010227039456367493, -9.495764970779419e-05, -8.764490485191345e-05, -8.033215999603271e-05, -7.301941514015198e-05, -6.570667028427124e-05, -5.83939254283905e-05, -5.1081180572509766e-05, -4.376843571662903e-05, -3.645569086074829e-05, -2.9142946004867554e-05, -2.1830201148986816e-05, -1.4517456293106079e-05, -7.204711437225342e-06, 1.0803341865539551e-07, 7.420778274536133e-06, 1.473352313041687e-05, 2.2046267986297607e-05, 2.9359012842178345e-05, 3.667175769805908e-05, 4.398450255393982e-05, 5.129724740982056e-05, 5.8609992265701294e-05, 6.592273712158203e-05, 7.323548197746277e-05, 8.05482268333435e-05, 8.786097168922424e-05, 9.517371654510498e-05, 0.00010248646140098572, 0.00010979920625686646, 0.00011711195111274719, 0.00012442469596862793, 0.00013173744082450867, 0.0001390501856803894, 0.00014636293053627014, 0.00015367567539215088, 0.00016098842024803162, 0.00016830116510391235, 0.0001756139099597931, 0.00018292665481567383, 0.00019023939967155457, 0.0001975521445274353, 0.00020486488938331604, 0.00021217763423919678, 0.00021949037909507751, 0.00022680312395095825, 0.000234115868806839, 0.00024142861366271973, 0.00024874135851860046, 0.0002560541033744812, 0.00026336684823036194, 0.0002706795930862427, 0.0002779923379421234, 0.00028530508279800415, 0.0002926178276538849, 0.0002999305725097656]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 9.0, 15.0, 12.0, 42.0, 55.0, 98.0, 152.0, 293.0, 614.0, 1493.0, 3805.0, 12170.0, 53153.0, 381581.0, 497527.0, 74301.0, 15310.0, 4731.0, 1688.0, 694.0, 356.0, 179.0, 115.0, 50.0, 28.0, 29.0, 11.0, 6.0, 5.0, 8.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1517181396484375, -1.116912841796875, -1.0821075439453125, -1.04730224609375, -1.0124969482421875, -0.977691650390625, -0.9428863525390625, -0.9080810546875, -0.8732757568359375, -0.838470458984375, -0.8036651611328125, -0.76885986328125, -0.7340545654296875, -0.699249267578125, -0.6644439697265625, -0.629638671875, -0.5948333740234375, -0.560028076171875, -0.5252227783203125, -0.49041748046875, -0.4556121826171875, -0.420806884765625, -0.3860015869140625, -0.3511962890625, -0.3163909912109375, -0.281585693359375, -0.2467803955078125, -0.21197509765625, -0.1771697998046875, -0.142364501953125, -0.1075592041015625, -0.07275390625, -0.0379486083984375, -0.003143310546875, 0.0316619873046875, 0.06646728515625, 0.1012725830078125, 0.136077880859375, 0.1708831787109375, 0.2056884765625, 0.2404937744140625, 0.275299072265625, 0.3101043701171875, 0.34490966796875, 0.3797149658203125, 0.414520263671875, 0.4493255615234375, 0.484130859375, 0.5189361572265625, 0.553741455078125, 0.5885467529296875, 0.62335205078125, 0.6581573486328125, 0.692962646484375, 0.7277679443359375, 0.7625732421875, 0.7973785400390625, 0.832183837890625, 0.8669891357421875, 0.90179443359375, 0.9365997314453125, 0.971405029296875, 1.0062103271484375, 1.041015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 10.0, 4.0, 9.0, 12.0, 17.0, 24.0, 26.0, 62.0, 76.0, 87.0, 108.0, 134.0, 124.0, 103.0, 67.0, 43.0, 31.0, 14.0, 16.0, 9.0, 9.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8366851806640625, -0.810089111328125, -0.7834930419921875, -0.75689697265625, -0.7303009033203125, -0.703704833984375, -0.6771087646484375, -0.6505126953125, -0.6239166259765625, -0.597320556640625, -0.5707244873046875, -0.54412841796875, -0.5175323486328125, -0.490936279296875, -0.4643402099609375, -0.437744140625, -0.4111480712890625, -0.384552001953125, -0.3579559326171875, -0.33135986328125, -0.3047637939453125, -0.278167724609375, -0.2515716552734375, -0.2249755859375, -0.1983795166015625, -0.171783447265625, -0.1451873779296875, -0.11859130859375, -0.0919952392578125, -0.065399169921875, -0.0388031005859375, -0.01220703125, 0.0143890380859375, 0.040985107421875, 0.0675811767578125, 0.09417724609375, 0.1207733154296875, 0.147369384765625, 0.1739654541015625, 0.2005615234375, 0.2271575927734375, 0.253753662109375, 0.2803497314453125, 0.30694580078125, 0.3335418701171875, 0.360137939453125, 0.3867340087890625, 0.413330078125, 0.4399261474609375, 0.466522216796875, 0.4931182861328125, 0.51971435546875, 0.5463104248046875, 0.572906494140625, 0.5995025634765625, 0.6260986328125, 0.6526947021484375, 0.679290771484375, 0.7058868408203125, 0.73248291015625, 0.7590789794921875, 0.785675048828125, 0.8122711181640625, 0.8388671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 18.0, 27.0, 65.0, 56.0, 77.0, 125.0, 129.0, 127.0, 104.0, 82.0, 65.0, 44.0, 23.0, 22.0, 10.0, 8.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.324390411376953, -8.015144348144531, -7.705897331237793, -7.396650791168213, -7.087404251098633, -6.778157711029053, -6.468911170959473, -6.159665107727051, -5.8504180908203125, -5.541171550750732, -5.231925010681152, -4.922678470611572, -4.613431930541992, -4.304185390472412, -3.994939088821411, -3.685692548751831, -3.37644624710083, -3.06719970703125, -2.75795316696167, -2.44870662689209, -2.1394600868225098, -1.8302136659622192, -1.5209672451019287, -1.2117207050323486, -0.9024741649627686, -0.5932276248931885, -0.2839811444282532, 0.02526533603668213, 0.3345118761062622, 0.6437584161758423, 0.9530048370361328, 1.262251377105713, 1.571497917175293, 1.880744457244873, 2.189990997314453, 2.499237537384033, 2.8084840774536133, 3.1177306175231934, 3.4269769191741943, 3.7362234592437744, 4.045470237731934, 4.354716777801514, 4.663963317871094, 4.973209857940674, 5.282456398010254, 5.591702938079834, 5.900949478149414, 6.210195541381836, 6.519442081451416, 6.828688621520996, 7.137935161590576, 7.447181701660156, 7.756428241729736, 8.065674781799316, 8.374920845031738, 8.684167861938477, 8.993413925170898, 9.30265998840332, 9.611907005310059, 9.92115306854248, 10.230400085449219, 10.53964614868164, 10.848893165588379, 11.1581392288208, 11.467386245727539]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 2.0, 11.0, 11.0, 14.0, 19.0, 17.0, 14.0, 25.0, 19.0, 21.0, 31.0, 32.0, 40.0, 39.0, 53.0, 35.0, 35.0, 43.0, 31.0, 41.0, 39.0, 41.0, 26.0, 29.0, 26.0, 28.0, 25.0, 33.0, 30.0, 21.0, 26.0, 14.0, 14.0, 11.0, 10.0, 9.0, 9.0, 6.0, 6.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.059335231781006, -4.904572010040283, -4.749809265136719, -4.595046043395996, -4.440282821655273, -4.285519599914551, -4.130756855010986, -3.9759936332702637, -3.82123064994812, -3.6664676666259766, -3.511704444885254, -3.3569414615631104, -3.202178478240967, -3.047415256500244, -2.8926522731781006, -2.737889289855957, -2.5831260681152344, -2.428363084793091, -2.273599863052368, -2.1188368797302246, -1.9640737771987915, -1.8093106746673584, -1.6545476913452148, -1.4997845888137817, -1.3450214862823486, -1.1902583837509155, -1.0354952812194824, -0.8807322978973389, -0.7259691953659058, -0.5712060928344727, -0.4164430499076843, -0.261680006980896, -0.10691690444946289, 0.04784616827964783, 0.20260924100875854, 0.35737231373786926, 0.51213538646698, 0.6668984889984131, 0.8216615319252014, 0.9764245748519897, 1.1311876773834229, 1.285950779914856, 1.440713882446289, 1.5954768657684326, 1.7502399682998657, 1.9050030708312988, 2.0597660541534424, 2.214529037475586, 2.3692922592163086, 2.524055242538452, 2.678818464279175, 2.8335814476013184, 2.988344669342041, 3.1431076526641846, 3.297870635986328, 3.452633857727051, 3.6073968410491943, 3.762159824371338, 3.9169230461120605, 4.071686267852783, 4.226449012756348, 4.38121223449707, 4.535975456237793, 4.690738201141357, 4.84550142288208]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 3.0, 7.0, 9.0, 8.0, 23.0, 32.0, 46.0, 74.0, 158.0, 276.0, 516.0, 1086.0, 2416.0, 5998.0, 16744.0, 56989.0, 315293.0, 3511877.0, 214503.0, 44924.0, 13968.0, 5047.0, 2169.0, 927.0, 524.0, 274.0, 137.0, 94.0, 58.0, 33.0, 15.0, 13.0, 14.0, 12.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9470443725585938, -0.9082489013671875, -0.8694534301757812, -0.830657958984375, -0.7918624877929688, -0.7530670166015625, -0.7142715454101562, -0.67547607421875, -0.6366806030273438, -0.5978851318359375, -0.5590896606445312, -0.520294189453125, -0.48149871826171875, -0.4427032470703125, -0.40390777587890625, -0.3651123046875, -0.32631683349609375, -0.2875213623046875, -0.24872589111328125, -0.209930419921875, -0.17113494873046875, -0.1323394775390625, -0.09354400634765625, -0.05474853515625, -0.01595306396484375, 0.0228424072265625, 0.06163787841796875, 0.100433349609375, 0.13922882080078125, 0.1780242919921875, 0.21681976318359375, 0.255615234375, 0.29441070556640625, 0.3332061767578125, 0.37200164794921875, 0.410797119140625, 0.44959259033203125, 0.4883880615234375, 0.5271835327148438, 0.56597900390625, 0.6047744750976562, 0.6435699462890625, 0.6823654174804688, 0.721160888671875, 0.7599563598632812, 0.7987518310546875, 0.8375473022460938, 0.8763427734375, 0.9151382446289062, 0.9539337158203125, 0.9927291870117188, 1.031524658203125, 1.0703201293945312, 1.1091156005859375, 1.1479110717773438, 1.18670654296875, 1.2255020141601562, 1.2642974853515625, 1.3030929565429688, 1.341888427734375, 1.3806838989257812, 1.4194793701171875, 1.4582748413085938, 1.4970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 10.0, 7.0, 8.0, 14.0, 22.0, 22.0, 34.0, 46.0, 42.0, 54.0, 65.0, 67.0, 67.0, 71.0, 89.0, 74.0, 63.0, 55.0, 45.0, 34.0, 31.0, 24.0, 18.0, 13.0, 12.0, 10.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39013671875, -0.3784217834472656, -0.36670684814453125, -0.3549919128417969, -0.3432769775390625, -0.3315620422363281, -0.31984710693359375, -0.3081321716308594, -0.296417236328125, -0.2847023010253906, -0.27298736572265625, -0.2612724304199219, -0.2495574951171875, -0.23784255981445312, -0.22612762451171875, -0.21441268920898438, -0.20269775390625, -0.19098281860351562, -0.17926788330078125, -0.16755294799804688, -0.1558380126953125, -0.14412307739257812, -0.13240814208984375, -0.12069320678710938, -0.108978271484375, -0.09726333618164062, -0.08554840087890625, -0.07383346557617188, -0.0621185302734375, -0.050403594970703125, -0.03868865966796875, -0.026973724365234375, -0.0152587890625, -0.003543853759765625, 0.00817108154296875, 0.019886016845703125, 0.0316009521484375, 0.043315887451171875, 0.05503082275390625, 0.06674575805664062, 0.078460693359375, 0.09017562866210938, 0.10189056396484375, 0.11360549926757812, 0.1253204345703125, 0.13703536987304688, 0.14875030517578125, 0.16046524047851562, 0.17218017578125, 0.18389511108398438, 0.19561004638671875, 0.20732498168945312, 0.2190399169921875, 0.23075485229492188, 0.24246978759765625, 0.2541847229003906, 0.265899658203125, 0.2776145935058594, 0.28932952880859375, 0.3010444641113281, 0.3127593994140625, 0.3244743347167969, 0.33618927001953125, 0.3479042053222656, 0.359619140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 12.0, 18.0, 25.0, 30.0, 77.0, 113.0, 196.0, 369.0, 773.0, 1527.0, 3310.0, 7469.0, 18576.0, 50107.0, 159304.0, 892943.0, 2680766.0, 259315.0, 74246.0, 26175.0, 10322.0, 4446.0, 2060.0, 1018.0, 481.0, 208.0, 152.0, 79.0, 55.0, 36.0, 21.0, 14.0, 12.0, 11.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.857421875, -0.829010009765625, -0.80059814453125, -0.772186279296875, -0.7437744140625, -0.715362548828125, -0.68695068359375, -0.658538818359375, -0.630126953125, -0.601715087890625, -0.57330322265625, -0.544891357421875, -0.5164794921875, -0.488067626953125, -0.45965576171875, -0.431243896484375, -0.40283203125, -0.374420166015625, -0.34600830078125, -0.317596435546875, -0.2891845703125, -0.260772705078125, -0.23236083984375, -0.203948974609375, -0.175537109375, -0.147125244140625, -0.11871337890625, -0.090301513671875, -0.0618896484375, -0.033477783203125, -0.00506591796875, 0.023345947265625, 0.0517578125, 0.080169677734375, 0.10858154296875, 0.136993408203125, 0.1654052734375, 0.193817138671875, 0.22222900390625, 0.250640869140625, 0.279052734375, 0.307464599609375, 0.33587646484375, 0.364288330078125, 0.3927001953125, 0.421112060546875, 0.44952392578125, 0.477935791015625, 0.50634765625, 0.534759521484375, 0.56317138671875, 0.591583251953125, 0.6199951171875, 0.648406982421875, 0.67681884765625, 0.705230712890625, 0.733642578125, 0.762054443359375, 0.79046630859375, 0.818878173828125, 0.8472900390625, 0.875701904296875, 0.90411376953125, 0.932525634765625, 0.9609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 7.0, 12.0, 16.0, 27.0, 30.0, 29.0, 69.0, 68.0, 97.0, 171.0, 262.0, 580.0, 1406.0, 521.0, 235.0, 158.0, 113.0, 63.0, 42.0, 41.0, 21.0, 26.0, 19.0, 17.0, 9.0, 7.0, 3.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3662300109863281, -0.35379791259765625, -0.3413658142089844, -0.3289337158203125, -0.3165016174316406, -0.30406951904296875, -0.2916374206542969, -0.279205322265625, -0.2667732238769531, -0.25434112548828125, -0.24190902709960938, -0.2294769287109375, -0.21704483032226562, -0.20461273193359375, -0.19218063354492188, -0.17974853515625, -0.16731643676757812, -0.15488433837890625, -0.14245223999023438, -0.1300201416015625, -0.11758804321289062, -0.10515594482421875, -0.09272384643554688, -0.080291748046875, -0.06785964965820312, -0.05542755126953125, -0.042995452880859375, -0.0305633544921875, -0.018131256103515625, -0.00569915771484375, 0.006732940673828125, 0.0191650390625, 0.031597137451171875, 0.04402923583984375, 0.056461334228515625, 0.0688934326171875, 0.08132553100585938, 0.09375762939453125, 0.10618972778320312, 0.118621826171875, 0.13105392456054688, 0.14348602294921875, 0.15591812133789062, 0.1683502197265625, 0.18078231811523438, 0.19321441650390625, 0.20564651489257812, 0.21807861328125, 0.23051071166992188, 0.24294281005859375, 0.2553749084472656, 0.2678070068359375, 0.2802391052246094, 0.29267120361328125, 0.3051033020019531, 0.317535400390625, 0.3299674987792969, 0.34239959716796875, 0.3548316955566406, 0.3672637939453125, 0.3796958923339844, 0.39212799072265625, 0.4045600891113281, 0.4169921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 14.0, 16.0, 25.0, 30.0, 42.0, 62.0, 60.0, 83.0, 92.0, 98.0, 103.0, 88.0, 68.0, 73.0, 47.0, 29.0, 17.0, 14.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4498510360717773, -2.374814510345459, -2.2997779846191406, -2.2247414588928223, -2.149704933166504, -2.0746684074401855, -1.9996318817138672, -1.9245953559875488, -1.8495588302612305, -1.774522304534912, -1.6994857788085938, -1.6244492530822754, -1.549412727355957, -1.4743762016296387, -1.3993396759033203, -1.324303150177002, -1.2492666244506836, -1.1742300987243652, -1.0991935729980469, -1.0241570472717285, -0.9491205215454102, -0.8740839958190918, -0.7990474700927734, -0.7240109443664551, -0.6489744186401367, -0.5739378929138184, -0.4989013671875, -0.42386484146118164, -0.3488283157348633, -0.2737917900085449, -0.19875526428222656, -0.1237187385559082, -0.048682451248168945, 0.026354074478149414, 0.10139060020446777, 0.17642712593078613, 0.2514636516571045, 0.32650017738342285, 0.4015367031097412, 0.47657322883605957, 0.5516097545623779, 0.6266462802886963, 0.7016828060150146, 0.776719331741333, 0.8517558574676514, 0.9267923831939697, 1.001828908920288, 1.0768654346466064, 1.1519019603729248, 1.2269384860992432, 1.3019750118255615, 1.3770115375518799, 1.4520480632781982, 1.5270845890045166, 1.602121114730835, 1.6771576404571533, 1.7521941661834717, 1.82723069190979, 1.9022672176361084, 1.9773037433624268, 2.052340269088745, 2.1273767948150635, 2.202413320541382, 2.2774498462677, 2.3524863719940186]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 13.0, 5.0, 7.0, 12.0, 10.0, 16.0, 13.0, 19.0, 18.0, 27.0, 33.0, 24.0, 36.0, 32.0, 30.0, 40.0, 45.0, 39.0, 52.0, 46.0, 45.0, 45.0, 50.0, 35.0, 29.0, 27.0, 34.0, 22.0, 19.0, 29.0, 23.0, 18.0, 23.0, 18.0, 19.0, 6.0, 9.0, 6.0, 4.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3644435405731201, -1.3231252431869507, -1.2818069458007812, -1.2404887676239014, -1.199170470237732, -1.1578521728515625, -1.116533875465393, -1.0752155780792236, -1.0338973999023438, -0.9925791025161743, -0.9512608647346497, -0.9099425673484802, -0.8686243295669556, -0.8273060321807861, -0.7859877347946167, -0.7446694374084473, -0.7033511400222778, -0.6620328426361084, -0.6207146048545837, -0.5793963074684143, -0.5380780696868896, -0.4967597723007202, -0.4554414749145508, -0.41412320733070374, -0.3728049397468567, -0.33148667216300964, -0.2901684045791626, -0.24885010719299316, -0.20753183960914612, -0.16621357202529907, -0.12489528954029083, -0.08357700705528259, -0.042258620262145996, -0.0009403452277183533, 0.04037792980670929, 0.08169620484113693, 0.12301447987556458, 0.16433274745941162, 0.20565102994441986, 0.2469693124294281, 0.28828758001327515, 0.3296058475971222, 0.37092411518096924, 0.41224241256713867, 0.4535606801509857, 0.49487894773483276, 0.5361972451210022, 0.5775154829025269, 0.6188337802886963, 0.6601520776748657, 0.7014703154563904, 0.7427886128425598, 0.7841068506240845, 0.8254251480102539, 0.8667434453964233, 0.9080617427825928, 0.9493799805641174, 0.9906982779502869, 1.0320165157318115, 1.073334813117981, 1.1146531105041504, 1.1559712886810303, 1.1972895860671997, 1.2386078834533691, 1.2799261808395386]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 7.0, 7.0, 13.0, 20.0, 23.0, 30.0, 61.0, 92.0, 124.0, 214.0, 356.0, 557.0, 1096.0, 2158.0, 4201.0, 8716.0, 18418.0, 40188.0, 91917.0, 209367.0, 325266.0, 191761.0, 83820.0, 36816.0, 16735.0, 8271.0, 3788.0, 2058.0, 1001.0, 589.0, 345.0, 204.0, 108.0, 63.0, 44.0, 38.0, 26.0, 22.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.12420654296875, -1.0872802734375, -1.05035400390625, -1.013427734375, -0.97650146484375, -0.9395751953125, -0.90264892578125, -0.86572265625, -0.82879638671875, -0.7918701171875, -0.75494384765625, -0.718017578125, -0.68109130859375, -0.6441650390625, -0.60723876953125, -0.5703125, -0.53338623046875, -0.4964599609375, -0.45953369140625, -0.422607421875, -0.38568115234375, -0.3487548828125, -0.31182861328125, -0.27490234375, -0.23797607421875, -0.2010498046875, -0.16412353515625, -0.127197265625, -0.09027099609375, -0.0533447265625, -0.01641845703125, 0.0205078125, 0.05743408203125, 0.0943603515625, 0.13128662109375, 0.168212890625, 0.20513916015625, 0.2420654296875, 0.27899169921875, 0.31591796875, 0.35284423828125, 0.3897705078125, 0.42669677734375, 0.463623046875, 0.50054931640625, 0.5374755859375, 0.57440185546875, 0.611328125, 0.64825439453125, 0.6851806640625, 0.72210693359375, 0.759033203125, 0.79595947265625, 0.8328857421875, 0.86981201171875, 0.90673828125, 0.94366455078125, 0.9805908203125, 1.01751708984375, 1.054443359375, 1.09136962890625, 1.1282958984375, 1.16522216796875, 1.2021484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 10.0, 19.0, 22.0, 31.0, 50.0, 37.0, 62.0, 63.0, 71.0, 71.0, 74.0, 86.0, 66.0, 69.0, 48.0, 53.0, 34.0, 43.0, 23.0, 15.0, 16.0, 4.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4079780578613281, -0.39579010009765625, -0.3836021423339844, -0.3714141845703125, -0.3592262268066406, -0.34703826904296875, -0.3348503112792969, -0.322662353515625, -0.3104743957519531, -0.29828643798828125, -0.2860984802246094, -0.2739105224609375, -0.2617225646972656, -0.24953460693359375, -0.23734664916992188, -0.22515869140625, -0.21297073364257812, -0.20078277587890625, -0.18859481811523438, -0.1764068603515625, -0.16421890258789062, -0.15203094482421875, -0.13984298706054688, -0.127655029296875, -0.11546707153320312, -0.10327911376953125, -0.09109115600585938, -0.0789031982421875, -0.06671524047851562, -0.05452728271484375, -0.042339324951171875, -0.0301513671875, -0.017963409423828125, -0.00577545166015625, 0.006412506103515625, 0.0186004638671875, 0.030788421630859375, 0.04297637939453125, 0.055164337158203125, 0.067352294921875, 0.07954025268554688, 0.09172821044921875, 0.10391616821289062, 0.1161041259765625, 0.12829208374023438, 0.14048004150390625, 0.15266799926757812, 0.16485595703125, 0.17704391479492188, 0.18923187255859375, 0.20141983032226562, 0.2136077880859375, 0.22579574584960938, 0.23798370361328125, 0.2501716613769531, 0.262359619140625, 0.2745475769042969, 0.28673553466796875, 0.2989234924316406, 0.3111114501953125, 0.3232994079589844, 0.33548736572265625, 0.3476753234863281, 0.35986328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 15.0, 17.0, 32.0, 21.0, 35.0, 58.0, 77.0, 117.0, 173.0, 224.0, 368.0, 617.0, 1223.0, 3453.0, 13886.0, 76766.0, 397048.0, 442812.0, 88678.0, 15834.0, 3844.0, 1310.0, 650.0, 398.0, 273.0, 171.0, 129.0, 106.0, 67.0, 38.0, 31.0, 15.0, 16.0, 20.0, 8.0, 3.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.07574462890625, -2.0147705078125, -1.95379638671875, -1.892822265625, -1.83184814453125, -1.7708740234375, -1.70989990234375, -1.64892578125, -1.58795166015625, -1.5269775390625, -1.46600341796875, -1.405029296875, -1.34405517578125, -1.2830810546875, -1.22210693359375, -1.1611328125, -1.10015869140625, -1.0391845703125, -0.97821044921875, -0.917236328125, -0.85626220703125, -0.7952880859375, -0.73431396484375, -0.67333984375, -0.61236572265625, -0.5513916015625, -0.49041748046875, -0.429443359375, -0.36846923828125, -0.3074951171875, -0.24652099609375, -0.185546875, -0.12457275390625, -0.0635986328125, -0.00262451171875, 0.058349609375, 0.11932373046875, 0.1802978515625, 0.24127197265625, 0.30224609375, 0.36322021484375, 0.4241943359375, 0.48516845703125, 0.546142578125, 0.60711669921875, 0.6680908203125, 0.72906494140625, 0.7900390625, 0.85101318359375, 0.9119873046875, 0.97296142578125, 1.033935546875, 1.09490966796875, 1.1558837890625, 1.21685791015625, 1.27783203125, 1.33880615234375, 1.3997802734375, 1.46075439453125, 1.521728515625, 1.58270263671875, 1.6436767578125, 1.70465087890625, 1.765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 9.0, 9.0, 19.0, 7.0, 15.0, 17.0, 23.0, 29.0, 31.0, 28.0, 37.0, 44.0, 31.0, 44.0, 50.0, 44.0, 49.0, 49.0, 54.0, 47.0, 36.0, 42.0, 33.0, 31.0, 28.0, 24.0, 27.0, 20.0, 21.0, 16.0, 14.0, 17.0, 13.0, 6.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.2421875, -1.20428466796875, -1.1663818359375, -1.12847900390625, -1.090576171875, -1.05267333984375, -1.0147705078125, -0.97686767578125, -0.93896484375, -0.90106201171875, -0.8631591796875, -0.82525634765625, -0.787353515625, -0.74945068359375, -0.7115478515625, -0.67364501953125, -0.6357421875, -0.59783935546875, -0.5599365234375, -0.52203369140625, -0.484130859375, -0.44622802734375, -0.4083251953125, -0.37042236328125, -0.33251953125, -0.29461669921875, -0.2567138671875, -0.21881103515625, -0.180908203125, -0.14300537109375, -0.1051025390625, -0.06719970703125, -0.029296875, 0.00860595703125, 0.0465087890625, 0.08441162109375, 0.122314453125, 0.16021728515625, 0.1981201171875, 0.23602294921875, 0.27392578125, 0.31182861328125, 0.3497314453125, 0.38763427734375, 0.425537109375, 0.46343994140625, 0.5013427734375, 0.53924560546875, 0.5771484375, 0.61505126953125, 0.6529541015625, 0.69085693359375, 0.728759765625, 0.76666259765625, 0.8045654296875, 0.84246826171875, 0.88037109375, 0.91827392578125, 0.9561767578125, 0.99407958984375, 1.031982421875, 1.06988525390625, 1.1077880859375, 1.14569091796875, 1.18359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 13.0, 21.0, 35.0, 56.0, 92.0, 143.0, 242.0, 431.0, 832.0, 1758.0, 4427.0, 18077.0, 482936.0, 512293.0, 18921.0, 4583.0, 1774.0, 877.0, 403.0, 247.0, 153.0, 87.0, 52.0, 18.0, 21.0, 16.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.6451416015625, -2.553955078125, -2.4627685546875, -2.37158203125, -2.2803955078125, -2.189208984375, -2.0980224609375, -2.0068359375, -1.9156494140625, -1.824462890625, -1.7332763671875, -1.64208984375, -1.5509033203125, -1.459716796875, -1.3685302734375, -1.27734375, -1.1861572265625, -1.094970703125, -1.0037841796875, -0.91259765625, -0.8214111328125, -0.730224609375, -0.6390380859375, -0.5478515625, -0.4566650390625, -0.365478515625, -0.2742919921875, -0.18310546875, -0.0919189453125, -0.000732421875, 0.0904541015625, 0.181640625, 0.2728271484375, 0.364013671875, 0.4552001953125, 0.54638671875, 0.6375732421875, 0.728759765625, 0.8199462890625, 0.9111328125, 1.0023193359375, 1.093505859375, 1.1846923828125, 1.27587890625, 1.3670654296875, 1.458251953125, 1.5494384765625, 1.640625, 1.7318115234375, 1.822998046875, 1.9141845703125, 2.00537109375, 2.0965576171875, 2.187744140625, 2.2789306640625, 2.3701171875, 2.4613037109375, 2.552490234375, 2.6436767578125, 2.73486328125, 2.8260498046875, 2.917236328125, 3.0084228515625, 3.099609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 10.0, 27.0, 40.0, 68.0, 111.0, 156.0, 177.0, 128.0, 99.0, 58.0, 29.0, 28.0, 15.0, 9.0, 6.0, 10.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004487037658691406, -0.00043727457523345947, -0.0004258453845977783, -0.00041441619396209717, -0.000402987003326416, -0.00039155781269073486, -0.0003801286220550537, -0.00036869943141937256, -0.0003572702407836914, -0.00034584105014801025, -0.0003344118595123291, -0.00032298266887664795, -0.0003115534782409668, -0.00030012428760528564, -0.0002886950969696045, -0.00027726590633392334, -0.0002658367156982422, -0.00025440752506256104, -0.00024297833442687988, -0.00023154914379119873, -0.00022011995315551758, -0.00020869076251983643, -0.00019726157188415527, -0.00018583238124847412, -0.00017440319061279297, -0.00016297399997711182, -0.00015154480934143066, -0.0001401156187057495, -0.00012868642807006836, -0.00011725723743438721, -0.00010582804679870605, -9.43988561630249e-05, -8.296966552734375e-05, -7.15404748916626e-05, -6.0111284255981445e-05, -4.868209362030029e-05, -3.725290298461914e-05, -2.5823712348937988e-05, -1.4394521713256836e-05, -2.9653310775756836e-06, 8.463859558105469e-06, 1.989305019378662e-05, 3.1322240829467773e-05, 4.2751431465148926e-05, 5.418062210083008e-05, 6.560981273651123e-05, 7.703900337219238e-05, 8.846819400787354e-05, 9.989738464355469e-05, 0.00011132657527923584, 0.000122755765914917, 0.00013418495655059814, 0.0001456141471862793, 0.00015704333782196045, 0.0001684725284576416, 0.00017990171909332275, 0.0001913309097290039, 0.00020276010036468506, 0.0002141892910003662, 0.00022561848163604736, 0.00023704767227172852, 0.00024847686290740967, 0.0002599060535430908, 0.00027133524417877197, 0.0002827644348144531]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 10.0, 14.0, 20.0, 35.0, 47.0, 89.0, 157.0, 291.0, 640.0, 1532.0, 4580.0, 21287.0, 842596.0, 162510.0, 9732.0, 2885.0, 1111.0, 466.0, 209.0, 117.0, 75.0, 40.0, 27.0, 19.0, 10.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.23858642578125, -3.1334228515625, -3.02825927734375, -2.923095703125, -2.81793212890625, -2.7127685546875, -2.60760498046875, -2.50244140625, -2.39727783203125, -2.2921142578125, -2.18695068359375, -2.081787109375, -1.97662353515625, -1.8714599609375, -1.76629638671875, -1.6611328125, -1.55596923828125, -1.4508056640625, -1.34564208984375, -1.240478515625, -1.13531494140625, -1.0301513671875, -0.92498779296875, -0.81982421875, -0.71466064453125, -0.6094970703125, -0.50433349609375, -0.399169921875, -0.29400634765625, -0.1888427734375, -0.08367919921875, 0.021484375, 0.12664794921875, 0.2318115234375, 0.33697509765625, 0.442138671875, 0.54730224609375, 0.6524658203125, 0.75762939453125, 0.86279296875, 0.96795654296875, 1.0731201171875, 1.17828369140625, 1.283447265625, 1.38861083984375, 1.4937744140625, 1.59893798828125, 1.7041015625, 1.80926513671875, 1.9144287109375, 2.01959228515625, 2.124755859375, 2.22991943359375, 2.3350830078125, 2.44024658203125, 2.54541015625, 2.65057373046875, 2.7557373046875, 2.86090087890625, 2.966064453125, 3.07122802734375, 3.1763916015625, 3.28155517578125, 3.38671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 15.0, 19.0, 34.0, 64.0, 151.0, 294.0, 219.0, 98.0, 42.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7978515625, -1.7308502197265625, -1.663848876953125, -1.5968475341796875, -1.52984619140625, -1.4628448486328125, -1.395843505859375, -1.3288421630859375, -1.2618408203125, -1.1948394775390625, -1.127838134765625, -1.0608367919921875, -0.99383544921875, -0.9268341064453125, -0.859832763671875, -0.7928314208984375, -0.725830078125, -0.6588287353515625, -0.591827392578125, -0.5248260498046875, -0.45782470703125, -0.3908233642578125, -0.323822021484375, -0.2568206787109375, -0.1898193359375, -0.1228179931640625, -0.055816650390625, 0.0111846923828125, 0.07818603515625, 0.1451873779296875, 0.212188720703125, 0.2791900634765625, 0.34619140625, 0.4131927490234375, 0.480194091796875, 0.5471954345703125, 0.61419677734375, 0.6811981201171875, 0.748199462890625, 0.8152008056640625, 0.8822021484375, 0.9492034912109375, 1.016204833984375, 1.0832061767578125, 1.15020751953125, 1.2172088623046875, 1.284210205078125, 1.3512115478515625, 1.418212890625, 1.4852142333984375, 1.552215576171875, 1.6192169189453125, 1.68621826171875, 1.7532196044921875, 1.820220947265625, 1.8872222900390625, 1.9542236328125, 2.0212249755859375, 2.088226318359375, 2.1552276611328125, 2.22222900390625, 2.2892303466796875, 2.356231689453125, 2.4232330322265625, 2.490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 12.0, 32.0, 126.0, 277.0, 294.0, 175.0, 63.0, 22.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.672521591186523, -10.712645530700684, -9.752769470214844, -8.79289436340332, -7.8330183029174805, -6.873142242431641, -5.913266658782959, -4.953391075134277, -3.9935150146484375, -3.0336391925811768, -2.073763370513916, -1.1138875484466553, -0.15401172637939453, 0.8058643341064453, 1.765739917755127, 2.7256155014038086, 3.6854915618896484, 4.645367622375488, 5.60524320602417, 6.565118789672852, 7.524994850158691, 8.484870910644531, 9.444746017456055, 10.404622077941895, 11.364498138427734, 12.324374198913574, 13.284250259399414, 14.244125366210938, 15.204001426696777, 16.163877487182617, 17.12375259399414, 18.083629608154297, 19.043502807617188, 20.00337791442871, 20.963254928588867, 21.92313003540039, 22.883007049560547, 23.84288215637207, 24.802757263183594, 25.76263427734375, 26.722509384155273, 27.682384490966797, 28.642261505126953, 29.602136611938477, 30.56201171875, 31.521888732910156, 32.48176574707031, 33.4416389465332, 34.40151596069336, 35.361392974853516, 36.321266174316406, 37.28114318847656, 38.24102020263672, 39.200897216796875, 40.160770416259766, 41.12064743041992, 42.08052062988281, 43.04039764404297, 44.00027084350586, 44.960147857666016, 45.92002487182617, 46.87989807128906, 47.83977508544922, 48.799652099609375, 49.75952911376953]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 7.0, 7.0, 14.0, 5.0, 9.0, 14.0, 9.0, 18.0, 30.0, 19.0, 19.0, 26.0, 28.0, 29.0, 32.0, 34.0, 30.0, 44.0, 46.0, 41.0, 55.0, 39.0, 36.0, 32.0, 37.0, 29.0, 42.0, 34.0, 22.0, 18.0, 29.0, 19.0, 22.0, 18.0, 19.0, 17.0, 10.0, 16.0, 5.0, 4.0, 8.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-6.79135274887085, -6.589838981628418, -6.3883256912231445, -6.186811923980713, -5.985298156738281, -5.783784866333008, -5.582271099090576, -5.3807573318481445, -5.179244041442871, -4.9777302742004395, -4.776216983795166, -4.574703216552734, -4.373189449310303, -4.171675682067871, -3.9701623916625977, -3.768648624420166, -3.5671348571777344, -3.365621328353882, -3.16410756111145, -2.9625940322875977, -2.761080265045166, -2.5595667362213135, -2.358053207397461, -2.1565394401550293, -1.9550259113311768, -1.7535122632980347, -1.5519986152648926, -1.35048508644104, -1.148971438407898, -0.9474577903747559, -0.7459442615509033, -0.5444306135177612, -0.34291744232177734, -0.14140382409095764, 0.06010979413986206, 0.2616233825683594, 0.46313703060150146, 0.6646506786346436, 0.8661642074584961, 1.0676778554916382, 1.2691915035247803, 1.4707051515579224, 1.6722187995910645, 1.873732328414917, 2.0752458572387695, 2.276759624481201, 2.4782731533050537, 2.6797866821289062, 2.881300449371338, 3.0828139781951904, 3.284327745437622, 3.4858412742614746, 3.6873550415039062, 3.888868570327759, 4.090382099151611, 4.291895866394043, 4.493409156799316, 4.694922924041748, 4.8964362144470215, 5.097949981689453, 5.299463748931885, 5.500977516174316, 5.70249080657959, 5.9040045738220215, 6.105518341064453]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 3.0, 10.0, 5.0, 14.0, 26.0, 32.0, 71.0, 100.0, 147.0, 246.0, 477.0, 1005.0, 2201.0, 5469.0, 14679.0, 46922.0, 227562.0, 3466818.0, 340122.0, 59454.0, 17431.0, 6459.0, 2537.0, 1111.0, 553.0, 316.0, 182.0, 129.0, 75.0, 47.0, 24.0, 14.0, 17.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.362152099609375, -1.31903076171875, -1.275909423828125, -1.2327880859375, -1.189666748046875, -1.14654541015625, -1.103424072265625, -1.060302734375, -1.017181396484375, -0.97406005859375, -0.930938720703125, -0.8878173828125, -0.844696044921875, -0.80157470703125, -0.758453369140625, -0.71533203125, -0.672210693359375, -0.62908935546875, -0.585968017578125, -0.5428466796875, -0.499725341796875, -0.45660400390625, -0.413482666015625, -0.370361328125, -0.327239990234375, -0.28411865234375, -0.240997314453125, -0.1978759765625, -0.154754638671875, -0.11163330078125, -0.068511962890625, -0.025390625, 0.017730712890625, 0.06085205078125, 0.103973388671875, 0.1470947265625, 0.190216064453125, 0.23333740234375, 0.276458740234375, 0.319580078125, 0.362701416015625, 0.40582275390625, 0.448944091796875, 0.4920654296875, 0.535186767578125, 0.57830810546875, 0.621429443359375, 0.66455078125, 0.707672119140625, 0.75079345703125, 0.793914794921875, 0.8370361328125, 0.880157470703125, 0.92327880859375, 0.966400146484375, 1.009521484375, 1.052642822265625, 1.09576416015625, 1.138885498046875, 1.1820068359375, 1.225128173828125, 1.26824951171875, 1.311370849609375, 1.3544921875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 12.0, 12.0, 18.0, 22.0, 28.0, 35.0, 43.0, 55.0, 44.0, 56.0, 66.0, 53.0, 70.0, 64.0, 70.0, 67.0, 44.0, 51.0, 34.0, 29.0, 32.0, 19.0, 19.0, 11.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.409423828125, -0.3974647521972656, -0.38550567626953125, -0.3735466003417969, -0.3615875244140625, -0.3496284484863281, -0.33766937255859375, -0.3257102966308594, -0.313751220703125, -0.3017921447753906, -0.28983306884765625, -0.2778739929199219, -0.2659149169921875, -0.2539558410644531, -0.24199676513671875, -0.23003768920898438, -0.21807861328125, -0.20611953735351562, -0.19416046142578125, -0.18220138549804688, -0.1702423095703125, -0.15828323364257812, -0.14632415771484375, -0.13436508178710938, -0.122406005859375, -0.11044692993164062, -0.09848785400390625, -0.08652877807617188, -0.0745697021484375, -0.06261062622070312, -0.05065155029296875, -0.038692474365234375, -0.0267333984375, -0.014774322509765625, -0.00281524658203125, 0.009143829345703125, 0.0211029052734375, 0.033061981201171875, 0.04502105712890625, 0.056980133056640625, 0.068939208984375, 0.08089828491210938, 0.09285736083984375, 0.10481643676757812, 0.1167755126953125, 0.12873458862304688, 0.14069366455078125, 0.15265274047851562, 0.16461181640625, 0.17657089233398438, 0.18852996826171875, 0.20048904418945312, 0.2124481201171875, 0.22440719604492188, 0.23636627197265625, 0.24832534790039062, 0.260284423828125, 0.2722434997558594, 0.28420257568359375, 0.2961616516113281, 0.3081207275390625, 0.3200798034667969, 0.33203887939453125, 0.3439979553222656, 0.35595703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 6.0, 3.0, 9.0, 6.0, 15.0, 27.0, 27.0, 64.0, 118.0, 146.0, 237.0, 347.0, 637.0, 1164.0, 1984.0, 3851.0, 7989.0, 17536.0, 42512.0, 119679.0, 457261.0, 2796205.0, 531670.0, 131289.0, 46145.0, 18210.0, 8217.0, 3883.0, 2113.0, 1194.0, 679.0, 393.0, 236.0, 148.0, 97.0, 65.0, 41.0, 19.0, 12.0, 13.0, 16.0, 13.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.013671875, -0.9866714477539062, -0.9596710205078125, -0.9326705932617188, -0.905670166015625, -0.8786697387695312, -0.8516693115234375, -0.8246688842773438, -0.79766845703125, -0.7706680297851562, -0.7436676025390625, -0.7166671752929688, -0.689666748046875, -0.6626663208007812, -0.6356658935546875, -0.6086654663085938, -0.5816650390625, -0.5546646118164062, -0.5276641845703125, -0.5006637573242188, -0.473663330078125, -0.44666290283203125, -0.4196624755859375, -0.39266204833984375, -0.36566162109375, -0.33866119384765625, -0.3116607666015625, -0.28466033935546875, -0.257659912109375, -0.23065948486328125, -0.2036590576171875, -0.17665863037109375, -0.149658203125, -0.12265777587890625, -0.0956573486328125, -0.06865692138671875, -0.041656494140625, -0.01465606689453125, 0.0123443603515625, 0.03934478759765625, 0.06634521484375, 0.09334564208984375, 0.1203460693359375, 0.14734649658203125, 0.174346923828125, 0.20134735107421875, 0.2283477783203125, 0.25534820556640625, 0.2823486328125, 0.30934906005859375, 0.3363494873046875, 0.36334991455078125, 0.390350341796875, 0.41735076904296875, 0.4443511962890625, 0.47135162353515625, 0.49835205078125, 0.5253524780273438, 0.5523529052734375, 0.5793533325195312, 0.606353759765625, 0.6333541870117188, 0.6603546142578125, 0.6873550415039062, 0.71435546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 9.0, 10.0, 15.0, 14.0, 29.0, 35.0, 47.0, 85.0, 103.0, 128.0, 241.0, 440.0, 1115.0, 846.0, 323.0, 194.0, 116.0, 81.0, 64.0, 54.0, 30.0, 22.0, 15.0, 12.0, 8.0, 2.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5226783752441406, -0.5067825317382812, -0.4908866882324219, -0.4749908447265625, -0.4590950012207031, -0.44319915771484375, -0.4273033142089844, -0.411407470703125, -0.3955116271972656, -0.37961578369140625, -0.3637199401855469, -0.3478240966796875, -0.3319282531738281, -0.31603240966796875, -0.3001365661621094, -0.28424072265625, -0.2683448791503906, -0.25244903564453125, -0.23655319213867188, -0.2206573486328125, -0.20476150512695312, -0.18886566162109375, -0.17296981811523438, -0.157073974609375, -0.14117813110351562, -0.12528228759765625, -0.10938644409179688, -0.0934906005859375, -0.07759475708007812, -0.06169891357421875, -0.045803070068359375, -0.0299072265625, -0.014011383056640625, 0.00188446044921875, 0.017780303955078125, 0.0336761474609375, 0.049571990966796875, 0.06546783447265625, 0.08136367797851562, 0.097259521484375, 0.11315536499023438, 0.12905120849609375, 0.14494705200195312, 0.1608428955078125, 0.17673873901367188, 0.19263458251953125, 0.20853042602539062, 0.22442626953125, 0.24032211303710938, 0.25621795654296875, 0.2721138000488281, 0.2880096435546875, 0.3039054870605469, 0.31980133056640625, 0.3356971740722656, 0.351593017578125, 0.3674888610839844, 0.38338470458984375, 0.3992805480957031, 0.4151763916015625, 0.4310722351074219, 0.44696807861328125, 0.4628639221191406, 0.478759765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 12.0, 47.0, 156.0, 243.0, 255.0, 181.0, 83.0, 19.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.820655822753906, -14.526803016662598, -14.232950210571289, -13.93909740447998, -13.645244598388672, -13.351391792297363, -13.057538986206055, -12.763686180114746, -12.469833374023438, -12.175980567932129, -11.88212776184082, -11.588274955749512, -11.294422149658203, -11.000569343566895, -10.706716537475586, -10.412863731384277, -10.119010925292969, -9.82515811920166, -9.531305313110352, -9.237452507019043, -8.943599700927734, -8.649746894836426, -8.355894088745117, -8.062041282653809, -7.7681884765625, -7.474335670471191, -7.180482864379883, -6.886630058288574, -6.592777252197266, -6.298924446105957, -6.005071640014648, -5.71121883392334, -5.417365074157715, -5.123512268066406, -4.829659461975098, -4.535806655883789, -4.2419538497924805, -3.948101043701172, -3.6542482376098633, -3.3603954315185547, -3.066542625427246, -2.7726898193359375, -2.478837013244629, -2.1849842071533203, -1.8911314010620117, -1.5972785949707031, -1.3034257888793945, -1.009572982788086, -0.7157201766967773, -0.42186737060546875, -0.12801456451416016, 0.16583824157714844, 0.45969104766845703, 0.7535438537597656, 1.0473966598510742, 1.3412494659423828, 1.6351022720336914, 1.928955078125, 2.2228078842163086, 2.516660690307617, 2.810513496398926, 3.1043663024902344, 3.398219108581543, 3.6920719146728516, 3.98592472076416]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 14.0, 5.0, 8.0, 9.0, 19.0, 15.0, 20.0, 21.0, 24.0, 26.0, 35.0, 27.0, 39.0, 45.0, 32.0, 38.0, 37.0, 43.0, 53.0, 46.0, 47.0, 47.0, 23.0, 40.0, 40.0, 30.0, 30.0, 29.0, 20.0, 17.0, 24.0, 15.0, 20.0, 14.0, 9.0, 9.0, 6.0, 11.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.092529535293579, -2.0316882133483887, -1.9708471298217773, -1.9100059270858765, -1.8491647243499756, -1.7883235216140747, -1.7274823188781738, -1.6666409969329834, -1.605799913406372, -1.5449587106704712, -1.4841175079345703, -1.4232763051986694, -1.3624351024627686, -1.3015938997268677, -1.2407526969909668, -1.1799113750457764, -1.1190701723098755, -1.0582289695739746, -0.9973877668380737, -0.9365465641021729, -0.875705361366272, -0.8148641586303711, -0.7540228962898254, -0.6931816935539246, -0.6323404908180237, -0.5714992880821228, -0.5106580853462219, -0.44981685280799866, -0.3889756500720978, -0.3281344473361969, -0.26729321479797363, -0.20645201206207275, -0.14561092853546143, -0.08476971834897995, -0.023928508162498474, 0.0369127094745636, 0.09775391221046448, 0.15859511494636536, 0.21943634748458862, 0.2802775502204895, 0.3411187529563904, 0.40195995569229126, 0.46280115842819214, 0.5236424207687378, 0.5844836235046387, 0.6453248262405396, 0.7061660289764404, 0.7670072317123413, 0.8278484344482422, 0.8886896371841431, 0.949530839920044, 1.0103720426559448, 1.0712132453918457, 1.1320544481277466, 1.1928956508636475, 1.253736972808838, 1.3145780563354492, 1.37541925907135, 1.436260461807251, 1.4971016645431519, 1.5579428672790527, 1.6187840700149536, 1.6796252727508545, 1.740466594696045, 1.8013077974319458]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 12.0, 13.0, 26.0, 34.0, 56.0, 98.0, 139.0, 257.0, 428.0, 827.0, 1517.0, 3171.0, 6606.0, 14770.0, 35278.0, 96595.0, 444745.0, 317777.0, 74395.0, 28385.0, 12191.0, 5553.0, 2650.0, 1307.0, 754.0, 394.0, 209.0, 121.0, 69.0, 59.0, 39.0, 19.0, 14.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.372406005859375, -1.32489013671875, -1.277374267578125, -1.2298583984375, -1.182342529296875, -1.13482666015625, -1.087310791015625, -1.039794921875, -0.992279052734375, -0.94476318359375, -0.897247314453125, -0.8497314453125, -0.802215576171875, -0.75469970703125, -0.707183837890625, -0.65966796875, -0.612152099609375, -0.56463623046875, -0.517120361328125, -0.4696044921875, -0.422088623046875, -0.37457275390625, -0.327056884765625, -0.279541015625, -0.232025146484375, -0.18450927734375, -0.136993408203125, -0.0894775390625, -0.041961669921875, 0.00555419921875, 0.053070068359375, 0.1005859375, 0.148101806640625, 0.19561767578125, 0.243133544921875, 0.2906494140625, 0.338165283203125, 0.38568115234375, 0.433197021484375, 0.480712890625, 0.528228759765625, 0.57574462890625, 0.623260498046875, 0.6707763671875, 0.718292236328125, 0.76580810546875, 0.813323974609375, 0.86083984375, 0.908355712890625, 0.95587158203125, 1.003387451171875, 1.0509033203125, 1.098419189453125, 1.14593505859375, 1.193450927734375, 1.240966796875, 1.288482666015625, 1.33599853515625, 1.383514404296875, 1.4310302734375, 1.478546142578125, 1.52606201171875, 1.573577880859375, 1.62109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 13.0, 15.0, 17.0, 27.0, 33.0, 39.0, 50.0, 44.0, 60.0, 60.0, 63.0, 55.0, 65.0, 76.0, 77.0, 60.0, 54.0, 39.0, 43.0, 24.0, 23.0, 19.0, 12.0, 8.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46044921875, -0.4475860595703125, -0.434722900390625, -0.4218597412109375, -0.40899658203125, -0.3961334228515625, -0.383270263671875, -0.3704071044921875, -0.3575439453125, -0.3446807861328125, -0.331817626953125, -0.3189544677734375, -0.30609130859375, -0.2932281494140625, -0.280364990234375, -0.2675018310546875, -0.254638671875, -0.2417755126953125, -0.228912353515625, -0.2160491943359375, -0.20318603515625, -0.1903228759765625, -0.177459716796875, -0.1645965576171875, -0.1517333984375, -0.1388702392578125, -0.126007080078125, -0.1131439208984375, -0.10028076171875, -0.0874176025390625, -0.074554443359375, -0.0616912841796875, -0.048828125, -0.0359649658203125, -0.023101806640625, -0.0102386474609375, 0.00262451171875, 0.0154876708984375, 0.028350830078125, 0.0412139892578125, 0.0540771484375, 0.0669403076171875, 0.079803466796875, 0.0926666259765625, 0.10552978515625, 0.1183929443359375, 0.131256103515625, 0.1441192626953125, 0.156982421875, 0.1698455810546875, 0.182708740234375, 0.1955718994140625, 0.20843505859375, 0.2212982177734375, 0.234161376953125, 0.2470245361328125, 0.2598876953125, 0.2727508544921875, 0.285614013671875, 0.2984771728515625, 0.31134033203125, 0.3242034912109375, 0.337066650390625, 0.3499298095703125, 0.36279296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 4.0, 4.0, 15.0, 12.0, 19.0, 30.0, 28.0, 51.0, 59.0, 83.0, 95.0, 158.0, 205.0, 308.0, 446.0, 693.0, 1294.0, 2940.0, 8385.0, 27760.0, 110392.0, 635274.0, 197587.0, 42405.0, 12120.0, 4105.0, 1636.0, 816.0, 469.0, 323.0, 203.0, 168.0, 105.0, 71.0, 58.0, 56.0, 41.0, 35.0, 25.0, 12.0, 16.0, 11.0, 4.0, 4.0, 4.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6806182861328125, -1.621978759765625, -1.5633392333984375, -1.50469970703125, -1.4460601806640625, -1.387420654296875, -1.3287811279296875, -1.2701416015625, -1.2115020751953125, -1.152862548828125, -1.0942230224609375, -1.03558349609375, -0.9769439697265625, -0.918304443359375, -0.8596649169921875, -0.801025390625, -0.7423858642578125, -0.683746337890625, -0.6251068115234375, -0.56646728515625, -0.5078277587890625, -0.449188232421875, -0.3905487060546875, -0.3319091796875, -0.2732696533203125, -0.214630126953125, -0.1559906005859375, -0.09735107421875, -0.0387115478515625, 0.019927978515625, 0.0785675048828125, 0.13720703125, 0.1958465576171875, 0.254486083984375, 0.3131256103515625, 0.37176513671875, 0.4304046630859375, 0.489044189453125, 0.5476837158203125, 0.6063232421875, 0.6649627685546875, 0.723602294921875, 0.7822418212890625, 0.84088134765625, 0.8995208740234375, 0.958160400390625, 1.0167999267578125, 1.075439453125, 1.1340789794921875, 1.192718505859375, 1.2513580322265625, 1.30999755859375, 1.3686370849609375, 1.427276611328125, 1.4859161376953125, 1.5445556640625, 1.6031951904296875, 1.661834716796875, 1.7204742431640625, 1.77911376953125, 1.8377532958984375, 1.896392822265625, 1.9550323486328125, 2.013671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 10.0, 11.0, 28.0, 25.0, 23.0, 27.0, 39.0, 45.0, 32.0, 62.0, 57.0, 54.0, 57.0, 51.0, 57.0, 61.0, 57.0, 43.0, 50.0, 29.0, 27.0, 40.0, 18.0, 21.0, 11.0, 9.0, 7.0, 14.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.704010009765625, -1.65118408203125, -1.598358154296875, -1.5455322265625, -1.492706298828125, -1.43988037109375, -1.387054443359375, -1.334228515625, -1.281402587890625, -1.22857666015625, -1.175750732421875, -1.1229248046875, -1.070098876953125, -1.01727294921875, -0.964447021484375, -0.91162109375, -0.858795166015625, -0.80596923828125, -0.753143310546875, -0.7003173828125, -0.647491455078125, -0.59466552734375, -0.541839599609375, -0.489013671875, -0.436187744140625, -0.38336181640625, -0.330535888671875, -0.2777099609375, -0.224884033203125, -0.17205810546875, -0.119232177734375, -0.06640625, -0.013580322265625, 0.03924560546875, 0.092071533203125, 0.1448974609375, 0.197723388671875, 0.25054931640625, 0.303375244140625, 0.356201171875, 0.409027099609375, 0.46185302734375, 0.514678955078125, 0.5675048828125, 0.620330810546875, 0.67315673828125, 0.725982666015625, 0.77880859375, 0.831634521484375, 0.88446044921875, 0.937286376953125, 0.9901123046875, 1.042938232421875, 1.09576416015625, 1.148590087890625, 1.201416015625, 1.254241943359375, 1.30706787109375, 1.359893798828125, 1.4127197265625, 1.465545654296875, 1.51837158203125, 1.571197509765625, 1.6240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 15.0, 27.0, 35.0, 43.0, 72.0, 98.0, 186.0, 382.0, 840.0, 2029.0, 5551.0, 18430.0, 79011.0, 715881.0, 181053.0, 31135.0, 8615.0, 2914.0, 1084.0, 485.0, 256.0, 146.0, 92.0, 56.0, 29.0, 23.0, 19.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.4112396240234375, -1.369354248046875, -1.3274688720703125, -1.28558349609375, -1.2436981201171875, -1.201812744140625, -1.1599273681640625, -1.1180419921875, -1.0761566162109375, -1.034271240234375, -0.9923858642578125, -0.95050048828125, -0.9086151123046875, -0.866729736328125, -0.8248443603515625, -0.782958984375, -0.7410736083984375, -0.699188232421875, -0.6573028564453125, -0.61541748046875, -0.5735321044921875, -0.531646728515625, -0.4897613525390625, -0.4478759765625, -0.4059906005859375, -0.364105224609375, -0.3222198486328125, -0.28033447265625, -0.2384490966796875, -0.196563720703125, -0.1546783447265625, -0.11279296875, -0.0709075927734375, -0.029022216796875, 0.0128631591796875, 0.05474853515625, 0.0966339111328125, 0.138519287109375, 0.1804046630859375, 0.2222900390625, 0.2641754150390625, 0.306060791015625, 0.3479461669921875, 0.38983154296875, 0.4317169189453125, 0.473602294921875, 0.5154876708984375, 0.557373046875, 0.5992584228515625, 0.641143798828125, 0.6830291748046875, 0.72491455078125, 0.7667999267578125, 0.808685302734375, 0.8505706787109375, 0.8924560546875, 0.9343414306640625, 0.976226806640625, 1.0181121826171875, 1.05999755859375, 1.1018829345703125, 1.143768310546875, 1.1856536865234375, 1.2275390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 12.0, 21.0, 31.0, 57.0, 125.0, 233.0, 207.0, 97.0, 47.0, 32.0, 25.0, 15.0, 13.0, 9.0, 8.0, 11.0, 5.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003001689910888672, -0.0002904273569583893, -0.0002806857228279114, -0.00027094408869743347, -0.00026120245456695557, -0.00025146082043647766, -0.00024171918630599976, -0.00023197755217552185, -0.00022223591804504395, -0.00021249428391456604, -0.00020275264978408813, -0.00019301101565361023, -0.00018326938152313232, -0.00017352774739265442, -0.00016378611326217651, -0.0001540444791316986, -0.0001443028450012207, -0.0001345612108707428, -0.0001248195767402649, -0.00011507794260978699, -0.00010533630847930908, -9.559467434883118e-05, -8.585304021835327e-05, -7.611140608787537e-05, -6.636977195739746e-05, -5.6628137826919556e-05, -4.688650369644165e-05, -3.7144869565963745e-05, -2.740323543548584e-05, -1.7661601305007935e-05, -7.91996717453003e-06, 1.821666955947876e-06, 1.1563301086425781e-05, 2.1304935216903687e-05, 3.104656934738159e-05, 4.07882034778595e-05, 5.05298376083374e-05, 6.027147173881531e-05, 7.001310586929321e-05, 7.975473999977112e-05, 8.949637413024902e-05, 9.923800826072693e-05, 0.00010897964239120483, 0.00011872127652168274, 0.00012846291065216064, 0.00013820454478263855, 0.00014794617891311646, 0.00015768781304359436, 0.00016742944717407227, 0.00017717108130455017, 0.00018691271543502808, 0.00019665434956550598, 0.0002063959836959839, 0.0002161376178264618, 0.0002258792519569397, 0.0002356208860874176, 0.0002453625202178955, 0.0002551041543483734, 0.0002648457884788513, 0.0002745874226093292, 0.00028432905673980713, 0.00029407069087028503, 0.00030381232500076294, 0.00031355395913124084, 0.00032329559326171875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 14.0, 12.0, 16.0, 21.0, 26.0, 33.0, 43.0, 62.0, 108.0, 167.0, 243.0, 429.0, 927.0, 1973.0, 4974.0, 14891.0, 59297.0, 734772.0, 187072.0, 28598.0, 8622.0, 3202.0, 1349.0, 690.0, 333.0, 208.0, 120.0, 102.0, 59.0, 43.0, 41.0, 28.0, 16.0, 15.0, 8.0, 7.0, 4.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.599609375, -1.5535888671875, -1.507568359375, -1.4615478515625, -1.41552734375, -1.3695068359375, -1.323486328125, -1.2774658203125, -1.2314453125, -1.1854248046875, -1.139404296875, -1.0933837890625, -1.04736328125, -1.0013427734375, -0.955322265625, -0.9093017578125, -0.86328125, -0.8172607421875, -0.771240234375, -0.7252197265625, -0.67919921875, -0.6331787109375, -0.587158203125, -0.5411376953125, -0.4951171875, -0.4490966796875, -0.403076171875, -0.3570556640625, -0.31103515625, -0.2650146484375, -0.218994140625, -0.1729736328125, -0.126953125, -0.0809326171875, -0.034912109375, 0.0111083984375, 0.05712890625, 0.1031494140625, 0.149169921875, 0.1951904296875, 0.2412109375, 0.2872314453125, 0.333251953125, 0.3792724609375, 0.42529296875, 0.4713134765625, 0.517333984375, 0.5633544921875, 0.609375, 0.6553955078125, 0.701416015625, 0.7474365234375, 0.79345703125, 0.8394775390625, 0.885498046875, 0.9315185546875, 0.9775390625, 1.0235595703125, 1.069580078125, 1.1156005859375, 1.16162109375, 1.2076416015625, 1.253662109375, 1.2996826171875, 1.345703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 4.0, 6.0, 3.0, 9.0, 9.0, 10.0, 14.0, 22.0, 30.0, 44.0, 94.0, 143.0, 203.0, 156.0, 77.0, 46.0, 28.0, 20.0, 21.0, 7.0, 5.0, 10.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.0643768310546875, -1.028167724609375, -0.9919586181640625, -0.95574951171875, -0.9195404052734375, -0.883331298828125, -0.8471221923828125, -0.8109130859375, -0.7747039794921875, -0.738494873046875, -0.7022857666015625, -0.66607666015625, -0.6298675537109375, -0.593658447265625, -0.5574493408203125, -0.521240234375, -0.4850311279296875, -0.448822021484375, -0.4126129150390625, -0.37640380859375, -0.3401947021484375, -0.303985595703125, -0.2677764892578125, -0.2315673828125, -0.1953582763671875, -0.159149169921875, -0.1229400634765625, -0.08673095703125, -0.0505218505859375, -0.014312744140625, 0.0218963623046875, 0.05810546875, 0.0943145751953125, 0.130523681640625, 0.1667327880859375, 0.20294189453125, 0.2391510009765625, 0.275360107421875, 0.3115692138671875, 0.3477783203125, 0.3839874267578125, 0.420196533203125, 0.4564056396484375, 0.49261474609375, 0.5288238525390625, 0.565032958984375, 0.6012420654296875, 0.637451171875, 0.6736602783203125, 0.709869384765625, 0.7460784912109375, 0.78228759765625, 0.8184967041015625, 0.854705810546875, 0.8909149169921875, 0.9271240234375, 0.9633331298828125, 0.999542236328125, 1.0357513427734375, 1.07196044921875, 1.1081695556640625, 1.144378662109375, 1.1805877685546875, 1.216796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 20.0, 33.0, 66.0, 124.0, 166.0, 184.0, 173.0, 103.0, 69.0, 25.0, 13.0, 9.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.543813705444336, -21.04570770263672, -20.5476016998291, -20.049495697021484, -19.5513916015625, -19.053285598754883, -18.555179595947266, -18.05707359313965, -17.55896759033203, -17.060861587524414, -16.562755584716797, -16.064651489257812, -15.566544532775879, -15.068439483642578, -14.570333480834961, -14.072227478027344, -13.574122428894043, -13.076016426086426, -12.577911376953125, -12.079805374145508, -11.58169937133789, -11.083593368530273, -10.585488319396973, -10.087382316589355, -9.589277267456055, -9.091171264648438, -8.593066215515137, -8.09496021270752, -7.596854209899902, -7.098748683929443, -6.600643157958984, -6.102537155151367, -5.60443115234375, -5.106325626373291, -4.608219623565674, -4.110114097595215, -3.6120083332061768, -3.1139025688171387, -2.6157970428466797, -2.1176912784576416, -1.6195855140686035, -1.1214797496795654, -0.6233741044998169, -0.12526845932006836, 0.3728373050689697, 0.8709430694580078, 1.3690485954284668, 1.8671543598175049, 2.365260124206543, 2.863365888595581, 3.361471652984619, 3.859577178955078, 4.357683181762695, 4.855788707733154, 5.353894233703613, 5.8520002365112305, 6.3501057624816895, 6.848211288452148, 7.346317291259766, 7.844422817230225, 8.342528343200684, 8.8406343460083, 9.338739395141602, 9.836845397949219, 10.334951400756836]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 14.0, 14.0, 14.0, 19.0, 32.0, 22.0, 28.0, 22.0, 33.0, 43.0, 40.0, 37.0, 43.0, 43.0, 48.0, 36.0, 48.0, 41.0, 45.0, 40.0, 44.0, 37.0, 27.0, 32.0, 28.0, 24.0, 14.0, 28.0, 11.0, 10.0, 9.0, 9.0, 9.0, 7.0, 6.0, 5.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.527933120727539, -7.322896480560303, -7.117860317230225, -6.912823677062988, -6.70778751373291, -6.502750873565674, -6.2977142333984375, -6.092678070068359, -5.887641429901123, -5.682604789733887, -5.477568626403809, -5.272531986236572, -5.067495346069336, -4.862459182739258, -4.6574225425720215, -4.452385902404785, -4.247349739074707, -4.042313098907471, -3.8372769355773926, -3.6322402954101562, -3.427203893661499, -3.222167491912842, -3.0171308517456055, -2.8120944499969482, -2.607058048248291, -2.402021646499634, -2.1969852447509766, -1.9919486045837402, -1.786912202835083, -1.5818758010864258, -1.376839280128479, -1.1718027591705322, -0.966766357421875, -0.761729896068573, -0.556693434715271, -0.351656973361969, -0.146620512008667, 0.058415889739990234, 0.263452410697937, 0.4684889316558838, 0.673525333404541, 0.878561794757843, 1.083598256111145, 1.2886347770690918, 1.493671178817749, 1.6987075805664062, 1.903744101524353, 2.1087806224823, 2.313817024230957, 2.5188534259796143, 2.7238898277282715, 2.928926467895508, 3.133962869644165, 3.3389992713928223, 3.5440359115600586, 3.749072313308716, 3.954108715057373, 4.159145355224609, 4.3641815185546875, 4.569218158721924, 4.77425479888916, 4.979290962219238, 5.184327602386475, 5.389364242553711, 5.594400405883789]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 15.0, 13.0, 47.0, 96.0, 201.0, 488.0, 1273.0, 3573.0, 12315.0, 57025.0, 1141640.0, 2892339.0, 66154.0, 13223.0, 3715.0, 1271.0, 489.0, 218.0, 81.0, 46.0, 20.0, 13.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.40594482421875, -2.3372802734375, -2.26861572265625, -2.199951171875, -2.13128662109375, -2.0626220703125, -1.99395751953125, -1.92529296875, -1.85662841796875, -1.7879638671875, -1.71929931640625, -1.650634765625, -1.58197021484375, -1.5133056640625, -1.44464111328125, -1.3759765625, -1.30731201171875, -1.2386474609375, -1.16998291015625, -1.101318359375, -1.03265380859375, -0.9639892578125, -0.89532470703125, -0.82666015625, -0.75799560546875, -0.6893310546875, -0.62066650390625, -0.552001953125, -0.48333740234375, -0.4146728515625, -0.34600830078125, -0.27734375, -0.20867919921875, -0.1400146484375, -0.07135009765625, -0.002685546875, 0.06597900390625, 0.1346435546875, 0.20330810546875, 0.27197265625, 0.34063720703125, 0.4093017578125, 0.47796630859375, 0.546630859375, 0.61529541015625, 0.6839599609375, 0.75262451171875, 0.8212890625, 0.88995361328125, 0.9586181640625, 1.02728271484375, 1.095947265625, 1.16461181640625, 1.2332763671875, 1.30194091796875, 1.37060546875, 1.43927001953125, 1.5079345703125, 1.57659912109375, 1.645263671875, 1.71392822265625, 1.7825927734375, 1.85125732421875, 1.919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 9.0, 11.0, 9.0, 10.0, 12.0, 14.0, 26.0, 27.0, 26.0, 37.0, 40.0, 45.0, 56.0, 64.0, 73.0, 56.0, 72.0, 68.0, 51.0, 54.0, 70.0, 43.0, 24.0, 29.0, 15.0, 18.0, 18.0, 8.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4408988952636719, -0.42769622802734375, -0.4144935607910156, -0.4012908935546875, -0.3880882263183594, -0.37488555908203125, -0.3616828918457031, -0.348480224609375, -0.3352775573730469, -0.32207489013671875, -0.3088722229003906, -0.2956695556640625, -0.2824668884277344, -0.26926422119140625, -0.2560615539550781, -0.24285888671875, -0.22965621948242188, -0.21645355224609375, -0.20325088500976562, -0.1900482177734375, -0.17684555053710938, -0.16364288330078125, -0.15044021606445312, -0.137237548828125, -0.12403488159179688, -0.11083221435546875, -0.09762954711914062, -0.0844268798828125, -0.07122421264648438, -0.05802154541015625, -0.044818878173828125, -0.0316162109375, -0.018413543701171875, -0.00521087646484375, 0.007991790771484375, 0.0211944580078125, 0.034397125244140625, 0.04759979248046875, 0.060802459716796875, 0.074005126953125, 0.08720779418945312, 0.10041046142578125, 0.11361312866210938, 0.1268157958984375, 0.14001846313476562, 0.15322113037109375, 0.16642379760742188, 0.17962646484375, 0.19282913208007812, 0.20603179931640625, 0.21923446655273438, 0.2324371337890625, 0.24563980102539062, 0.25884246826171875, 0.2720451354980469, 0.285247802734375, 0.2984504699707031, 0.31165313720703125, 0.3248558044433594, 0.3380584716796875, 0.3512611389160156, 0.36446380615234375, 0.3776664733886719, 0.390869140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 9.0, 5.0, 17.0, 18.0, 25.0, 49.0, 61.0, 121.0, 188.0, 285.0, 489.0, 898.0, 1633.0, 3085.0, 6387.0, 14074.0, 35264.0, 111072.0, 626908.0, 3025797.0, 259365.0, 65611.0, 23283.0, 9799.0, 4622.0, 2281.0, 1213.0, 636.0, 391.0, 240.0, 161.0, 87.0, 79.0, 46.0, 32.0, 22.0, 11.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2275390625, -1.1927490234375, -1.157958984375, -1.1231689453125, -1.08837890625, -1.0535888671875, -1.018798828125, -0.9840087890625, -0.94921875, -0.9144287109375, -0.879638671875, -0.8448486328125, -0.81005859375, -0.7752685546875, -0.740478515625, -0.7056884765625, -0.6708984375, -0.6361083984375, -0.601318359375, -0.5665283203125, -0.53173828125, -0.4969482421875, -0.462158203125, -0.4273681640625, -0.392578125, -0.3577880859375, -0.322998046875, -0.2882080078125, -0.25341796875, -0.2186279296875, -0.183837890625, -0.1490478515625, -0.1142578125, -0.0794677734375, -0.044677734375, -0.0098876953125, 0.02490234375, 0.0596923828125, 0.094482421875, 0.1292724609375, 0.1640625, 0.1988525390625, 0.233642578125, 0.2684326171875, 0.30322265625, 0.3380126953125, 0.372802734375, 0.4075927734375, 0.4423828125, 0.4771728515625, 0.511962890625, 0.5467529296875, 0.58154296875, 0.6163330078125, 0.651123046875, 0.6859130859375, 0.720703125, 0.7554931640625, 0.790283203125, 0.8250732421875, 0.85986328125, 0.8946533203125, 0.929443359375, 0.9642333984375, 0.9990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 10.0, 7.0, 12.0, 23.0, 28.0, 33.0, 49.0, 72.0, 96.0, 185.0, 370.0, 1096.0, 1165.0, 351.0, 182.0, 115.0, 78.0, 51.0, 32.0, 30.0, 22.0, 15.0, 5.0, 12.0, 2.0, 1.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5250930786132812, -0.5086822509765625, -0.49227142333984375, -0.475860595703125, -0.45944976806640625, -0.4430389404296875, -0.42662811279296875, -0.41021728515625, -0.39380645751953125, -0.3773956298828125, -0.36098480224609375, -0.344573974609375, -0.32816314697265625, -0.3117523193359375, -0.29534149169921875, -0.2789306640625, -0.26251983642578125, -0.2461090087890625, -0.22969818115234375, -0.213287353515625, -0.19687652587890625, -0.1804656982421875, -0.16405487060546875, -0.14764404296875, -0.13123321533203125, -0.1148223876953125, -0.09841156005859375, -0.082000732421875, -0.06558990478515625, -0.0491790771484375, -0.03276824951171875, -0.016357421875, 5.340576171875e-05, 0.0164642333984375, 0.03287506103515625, 0.049285888671875, 0.06569671630859375, 0.0821075439453125, 0.09851837158203125, 0.11492919921875, 0.13134002685546875, 0.1477508544921875, 0.16416168212890625, 0.180572509765625, 0.19698333740234375, 0.2133941650390625, 0.22980499267578125, 0.2462158203125, 0.26262664794921875, 0.2790374755859375, 0.29544830322265625, 0.311859130859375, 0.32826995849609375, 0.3446807861328125, 0.36109161376953125, 0.37750244140625, 0.39391326904296875, 0.4103240966796875, 0.42673492431640625, 0.443145751953125, 0.45955657958984375, 0.4759674072265625, 0.49237823486328125, 0.5087890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 15.0, 26.0, 48.0, 97.0, 127.0, 169.0, 162.0, 167.0, 86.0, 57.0, 23.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.354272842407227, -6.191716194152832, -6.029159069061279, -5.866602420806885, -5.704045295715332, -5.5414886474609375, -5.378931999206543, -5.216375350952148, -5.053818225860596, -4.891261577606201, -4.728704452514648, -4.566147804260254, -4.403591156005859, -4.241034030914307, -4.078477382659912, -3.9159204959869385, -3.753363609313965, -3.590806722640991, -3.4282498359680176, -3.265693187713623, -3.1031363010406494, -2.940579414367676, -2.7780227661132812, -2.6154658794403076, -2.452908992767334, -2.2903521060943604, -2.1277952194213867, -1.9652385711669922, -1.8026816844940186, -1.640124797821045, -1.4775680303573608, -1.3150112628936768, -1.1524543762207031, -0.9898975491523743, -0.8273407220840454, -0.6647838950157166, -0.5022270679473877, -0.33967024087905884, -0.17711341381072998, -0.014556646347045898, 0.14800024032592773, 0.3105570673942566, 0.47311389446258545, 0.6356707215309143, 0.7982275485992432, 0.960784375667572, 1.1233412027359009, 1.285897970199585, 1.4484548568725586, 1.6110117435455322, 1.7735685110092163, 1.9361252784729004, 2.098682165145874, 2.2612390518188477, 2.423795700073242, 2.586352586746216, 2.7489094734191895, 2.911466360092163, 3.0740232467651367, 3.2365798950195312, 3.399136781692505, 3.5616936683654785, 3.724250316619873, 3.8868072032928467, 4.04936408996582]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 10.0, 12.0, 14.0, 17.0, 23.0, 19.0, 33.0, 25.0, 38.0, 36.0, 49.0, 41.0, 59.0, 51.0, 45.0, 54.0, 51.0, 53.0, 45.0, 44.0, 32.0, 35.0, 33.0, 32.0, 24.0, 18.0, 31.0, 15.0, 12.0, 11.0, 7.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13521671295166, -2.0713541507720947, -2.00749135017395, -1.9436287879943848, -1.8797661066055298, -1.8159034252166748, -1.7520408630371094, -1.6881781816482544, -1.6243155002593994, -1.5604528188705444, -1.4965901374816895, -1.432727575302124, -1.368864893913269, -1.305002212524414, -1.2411396503448486, -1.1772769689559937, -1.1134142875671387, -1.0495516061782837, -0.9856889843940735, -0.9218263626098633, -0.8579636812210083, -0.7941009998321533, -0.7302383780479431, -0.6663757562637329, -0.6025130748748779, -0.538650393486023, -0.47478777170181274, -0.41092512011528015, -0.34706246852874756, -0.28319981694221497, -0.21933716535568237, -0.15547451376914978, -0.09161186218261719, -0.027749210596084595, 0.036113440990448, 0.09997609257698059, 0.16383874416351318, 0.22770139575004578, 0.29156404733657837, 0.35542669892311096, 0.41928935050964355, 0.48315200209617615, 0.5470146536827087, 0.610877275466919, 0.6747399568557739, 0.7386026382446289, 0.8024652600288391, 0.8663278818130493, 0.9301905632019043, 0.9940532445907593, 1.0579159259796143, 1.1217784881591797, 1.1856411695480347, 1.2495038509368896, 1.313366413116455, 1.37722909450531, 1.441091775894165, 1.50495445728302, 1.568817138671875, 1.6326797008514404, 1.6965423822402954, 1.7604050636291504, 1.8242676258087158, 1.8881303071975708, 1.9519929885864258]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 10.0, 10.0, 14.0, 22.0, 44.0, 52.0, 84.0, 127.0, 249.0, 416.0, 908.0, 1891.0, 4366.0, 10730.0, 28220.0, 84275.0, 369976.0, 404376.0, 92468.0, 29843.0, 11755.0, 4770.0, 1965.0, 918.0, 465.0, 243.0, 123.0, 74.0, 51.0, 37.0, 18.0, 10.0, 8.0, 9.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4453125, -1.4028472900390625, -1.360382080078125, -1.3179168701171875, -1.27545166015625, -1.2329864501953125, -1.190521240234375, -1.1480560302734375, -1.1055908203125, -1.0631256103515625, -1.020660400390625, -0.9781951904296875, -0.93572998046875, -0.8932647705078125, -0.850799560546875, -0.8083343505859375, -0.765869140625, -0.7234039306640625, -0.680938720703125, -0.6384735107421875, -0.59600830078125, -0.5535430908203125, -0.511077880859375, -0.4686126708984375, -0.4261474609375, -0.3836822509765625, -0.341217041015625, -0.2987518310546875, -0.25628662109375, -0.2138214111328125, -0.171356201171875, -0.1288909912109375, -0.08642578125, -0.0439605712890625, -0.001495361328125, 0.0409698486328125, 0.08343505859375, 0.1259002685546875, 0.168365478515625, 0.2108306884765625, 0.2532958984375, 0.2957611083984375, 0.338226318359375, 0.3806915283203125, 0.42315673828125, 0.4656219482421875, 0.508087158203125, 0.5505523681640625, 0.593017578125, 0.6354827880859375, 0.677947998046875, 0.7204132080078125, 0.76287841796875, 0.8053436279296875, 0.847808837890625, 0.8902740478515625, 0.9327392578125, 0.9752044677734375, 1.017669677734375, 1.0601348876953125, 1.10260009765625, 1.1450653076171875, 1.187530517578125, 1.2299957275390625, 1.2724609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 13.0, 9.0, 14.0, 14.0, 20.0, 26.0, 29.0, 38.0, 36.0, 49.0, 50.0, 62.0, 48.0, 56.0, 60.0, 53.0, 63.0, 63.0, 53.0, 45.0, 55.0, 31.0, 26.0, 21.0, 13.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4296875, -0.4169807434082031, -0.40427398681640625, -0.3915672302246094, -0.3788604736328125, -0.3661537170410156, -0.35344696044921875, -0.3407402038574219, -0.328033447265625, -0.3153266906738281, -0.30261993408203125, -0.2899131774902344, -0.2772064208984375, -0.2644996643066406, -0.25179290771484375, -0.23908615112304688, -0.22637939453125, -0.21367263793945312, -0.20096588134765625, -0.18825912475585938, -0.1755523681640625, -0.16284561157226562, -0.15013885498046875, -0.13743209838867188, -0.124725341796875, -0.11201858520507812, -0.09931182861328125, -0.08660507202148438, -0.0738983154296875, -0.061191558837890625, -0.04848480224609375, -0.035778045654296875, -0.0230712890625, -0.010364532470703125, 0.00234222412109375, 0.015048980712890625, 0.0277557373046875, 0.040462493896484375, 0.05316925048828125, 0.06587600708007812, 0.078582763671875, 0.09128952026367188, 0.10399627685546875, 0.11670303344726562, 0.1294097900390625, 0.14211654663085938, 0.15482330322265625, 0.16753005981445312, 0.18023681640625, 0.19294357299804688, 0.20565032958984375, 0.21835708618164062, 0.2310638427734375, 0.24377059936523438, 0.25647735595703125, 0.2691841125488281, 0.281890869140625, 0.2945976257324219, 0.30730438232421875, 0.3200111389160156, 0.3327178955078125, 0.3454246520996094, 0.35813140869140625, 0.3708381652832031, 0.383544921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 10.0, 8.0, 15.0, 18.0, 29.0, 26.0, 49.0, 75.0, 146.0, 205.0, 369.0, 703.0, 1710.0, 4500.0, 11882.0, 35192.0, 129111.0, 614057.0, 182773.0, 43539.0, 14674.0, 5349.0, 2076.0, 918.0, 433.0, 260.0, 146.0, 92.0, 59.0, 31.0, 28.0, 23.0, 16.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.4430694580078125, -1.395904541015625, -1.3487396240234375, -1.30157470703125, -1.2544097900390625, -1.207244873046875, -1.1600799560546875, -1.1129150390625, -1.0657501220703125, -1.018585205078125, -0.9714202880859375, -0.92425537109375, -0.8770904541015625, -0.829925537109375, -0.7827606201171875, -0.735595703125, -0.6884307861328125, -0.641265869140625, -0.5941009521484375, -0.54693603515625, -0.4997711181640625, -0.452606201171875, -0.4054412841796875, -0.3582763671875, -0.3111114501953125, -0.263946533203125, -0.2167816162109375, -0.16961669921875, -0.1224517822265625, -0.075286865234375, -0.0281219482421875, 0.01904296875, 0.0662078857421875, 0.113372802734375, 0.1605377197265625, 0.20770263671875, 0.2548675537109375, 0.302032470703125, 0.3491973876953125, 0.3963623046875, 0.4435272216796875, 0.490692138671875, 0.5378570556640625, 0.58502197265625, 0.6321868896484375, 0.679351806640625, 0.7265167236328125, 0.773681640625, 0.8208465576171875, 0.868011474609375, 0.9151763916015625, 0.96234130859375, 1.0095062255859375, 1.056671142578125, 1.1038360595703125, 1.1510009765625, 1.1981658935546875, 1.245330810546875, 1.2924957275390625, 1.33966064453125, 1.3868255615234375, 1.433990478515625, 1.4811553955078125, 1.5283203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 14.0, 10.0, 14.0, 16.0, 17.0, 29.0, 29.0, 34.0, 32.0, 38.0, 44.0, 49.0, 54.0, 45.0, 56.0, 52.0, 63.0, 50.0, 50.0, 31.0, 38.0, 44.0, 37.0, 26.0, 14.0, 26.0, 13.0, 15.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4169921875, -1.368865966796875, -1.32073974609375, -1.272613525390625, -1.2244873046875, -1.176361083984375, -1.12823486328125, -1.080108642578125, -1.031982421875, -0.983856201171875, -0.93572998046875, -0.887603759765625, -0.8394775390625, -0.791351318359375, -0.74322509765625, -0.695098876953125, -0.64697265625, -0.598846435546875, -0.55072021484375, -0.502593994140625, -0.4544677734375, -0.406341552734375, -0.35821533203125, -0.310089111328125, -0.261962890625, -0.213836669921875, -0.16571044921875, -0.117584228515625, -0.0694580078125, -0.021331787109375, 0.02679443359375, 0.074920654296875, 0.123046875, 0.171173095703125, 0.21929931640625, 0.267425537109375, 0.3155517578125, 0.363677978515625, 0.41180419921875, 0.459930419921875, 0.508056640625, 0.556182861328125, 0.60430908203125, 0.652435302734375, 0.7005615234375, 0.748687744140625, 0.79681396484375, 0.844940185546875, 0.89306640625, 0.941192626953125, 0.98931884765625, 1.037445068359375, 1.0855712890625, 1.133697509765625, 1.18182373046875, 1.229949951171875, 1.278076171875, 1.326202392578125, 1.37432861328125, 1.422454833984375, 1.4705810546875, 1.518707275390625, 1.56683349609375, 1.614959716796875, 1.6630859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 11.0, 12.0, 21.0, 31.0, 40.0, 50.0, 98.0, 159.0, 276.0, 499.0, 986.0, 2035.0, 4663.0, 11299.0, 28805.0, 76492.0, 338593.0, 433286.0, 93536.0, 33933.0, 13383.0, 5411.0, 2426.0, 1131.0, 576.0, 311.0, 187.0, 107.0, 70.0, 55.0, 27.0, 21.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5955886840820312, -0.5764312744140625, -0.5572738647460938, -0.538116455078125, -0.5189590454101562, -0.4998016357421875, -0.48064422607421875, -0.46148681640625, -0.44232940673828125, -0.4231719970703125, -0.40401458740234375, -0.384857177734375, -0.36569976806640625, -0.3465423583984375, -0.32738494873046875, -0.3082275390625, -0.28907012939453125, -0.2699127197265625, -0.25075531005859375, -0.231597900390625, -0.21244049072265625, -0.1932830810546875, -0.17412567138671875, -0.15496826171875, -0.13581085205078125, -0.1166534423828125, -0.09749603271484375, -0.078338623046875, -0.05918121337890625, -0.0400238037109375, -0.02086639404296875, -0.001708984375, 0.01744842529296875, 0.0366058349609375, 0.05576324462890625, 0.074920654296875, 0.09407806396484375, 0.1132354736328125, 0.13239288330078125, 0.15155029296875, 0.17070770263671875, 0.1898651123046875, 0.20902252197265625, 0.228179931640625, 0.24733734130859375, 0.2664947509765625, 0.28565216064453125, 0.3048095703125, 0.32396697998046875, 0.3431243896484375, 0.36228179931640625, 0.381439208984375, 0.40059661865234375, 0.4197540283203125, 0.43891143798828125, 0.45806884765625, 0.47722625732421875, 0.4963836669921875, 0.5155410766601562, 0.534698486328125, 0.5538558959960938, 0.5730133056640625, 0.5921707153320312, 0.611328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 5.0, 19.0, 23.0, 19.0, 58.0, 80.0, 176.0, 198.0, 158.0, 74.0, 45.0, 25.0, 18.0, 16.0, 11.0, 10.0, 7.0, 4.0, 4.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0003178119659423828, -0.00031048431992530823, -0.00030315667390823364, -0.00029582902789115906, -0.00028850138187408447, -0.0002811737358570099, -0.0002738460898399353, -0.0002665184438228607, -0.00025919079780578613, -0.00025186315178871155, -0.00024453550577163696, -0.00023720785975456238, -0.0002298802137374878, -0.0002225525677204132, -0.00021522492170333862, -0.00020789727568626404, -0.00020056962966918945, -0.00019324198365211487, -0.00018591433763504028, -0.0001785866916179657, -0.0001712590456008911, -0.00016393139958381653, -0.00015660375356674194, -0.00014927610754966736, -0.00014194846153259277, -0.0001346208155155182, -0.0001272931694984436, -0.00011996552348136902, -0.00011263787746429443, -0.00010531023144721985, -9.798258543014526e-05, -9.065493941307068e-05, -8.33272933959961e-05, -7.599964737892151e-05, -6.867200136184692e-05, -6.134435534477234e-05, -5.4016709327697754e-05, -4.668906331062317e-05, -3.9361417293548584e-05, -3.2033771276474e-05, -2.4706125259399414e-05, -1.737847924232483e-05, -1.0050833225250244e-05, -2.723187208175659e-06, 4.604458808898926e-06, 1.193210482597351e-05, 1.9259750843048096e-05, 2.658739686012268e-05, 3.3915042877197266e-05, 4.124268889427185e-05, 4.8570334911346436e-05, 5.589798092842102e-05, 6.32256269454956e-05, 7.055327296257019e-05, 7.788091897964478e-05, 8.520856499671936e-05, 9.253621101379395e-05, 9.986385703086853e-05, 0.00010719150304794312, 0.0001145191490650177, 0.00012184679508209229, 0.00012917444109916687, 0.00013650208711624146, 0.00014382973313331604, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 11.0, 7.0, 12.0, 29.0, 31.0, 43.0, 92.0, 140.0, 228.0, 461.0, 943.0, 2054.0, 5184.0, 14995.0, 54239.0, 346883.0, 519158.0, 73733.0, 19299.0, 6216.0, 2411.0, 1129.0, 556.0, 259.0, 175.0, 89.0, 55.0, 36.0, 30.0, 13.0, 20.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6221389770507812, -0.5963287353515625, -0.5705184936523438, -0.544708251953125, -0.5188980102539062, -0.4930877685546875, -0.46727752685546875, -0.44146728515625, -0.41565704345703125, -0.3898468017578125, -0.36403656005859375, -0.338226318359375, -0.31241607666015625, -0.2866058349609375, -0.26079559326171875, -0.2349853515625, -0.20917510986328125, -0.1833648681640625, -0.15755462646484375, -0.131744384765625, -0.10593414306640625, -0.0801239013671875, -0.05431365966796875, -0.02850341796875, -0.00269317626953125, 0.0231170654296875, 0.04892730712890625, 0.074737548828125, 0.10054779052734375, 0.1263580322265625, 0.15216827392578125, 0.177978515625, 0.20378875732421875, 0.2295989990234375, 0.25540924072265625, 0.281219482421875, 0.30702972412109375, 0.3328399658203125, 0.35865020751953125, 0.38446044921875, 0.41027069091796875, 0.4360809326171875, 0.46189117431640625, 0.487701416015625, 0.5135116577148438, 0.5393218994140625, 0.5651321411132812, 0.5909423828125, 0.6167526245117188, 0.6425628662109375, 0.6683731079101562, 0.694183349609375, 0.7199935913085938, 0.7458038330078125, 0.7716140747070312, 0.79742431640625, 0.8232345581054688, 0.8490447998046875, 0.8748550415039062, 0.900665283203125, 0.9264755249023438, 0.9522857666015625, 0.9780960083007812, 1.00390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 7.0, 7.0, 13.0, 24.0, 21.0, 28.0, 51.0, 68.0, 88.0, 113.0, 125.0, 113.0, 97.0, 63.0, 43.0, 30.0, 14.0, 20.0, 15.0, 7.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.556640625, -0.5356292724609375, -0.514617919921875, -0.4936065673828125, -0.47259521484375, -0.4515838623046875, -0.430572509765625, -0.4095611572265625, -0.3885498046875, -0.3675384521484375, -0.346527099609375, -0.3255157470703125, -0.30450439453125, -0.2834930419921875, -0.262481689453125, -0.2414703369140625, -0.220458984375, -0.1994476318359375, -0.178436279296875, -0.1574249267578125, -0.13641357421875, -0.1154022216796875, -0.094390869140625, -0.0733795166015625, -0.0523681640625, -0.0313568115234375, -0.010345458984375, 0.0106658935546875, 0.03167724609375, 0.0526885986328125, 0.073699951171875, 0.0947113037109375, 0.11572265625, 0.1367340087890625, 0.157745361328125, 0.1787567138671875, 0.19976806640625, 0.2207794189453125, 0.241790771484375, 0.2628021240234375, 0.2838134765625, 0.3048248291015625, 0.325836181640625, 0.3468475341796875, 0.36785888671875, 0.3888702392578125, 0.409881591796875, 0.4308929443359375, 0.451904296875, 0.4729156494140625, 0.493927001953125, 0.5149383544921875, 0.53594970703125, 0.5569610595703125, 0.577972412109375, 0.5989837646484375, 0.6199951171875, 0.6410064697265625, 0.662017822265625, 0.6830291748046875, 0.70404052734375, 0.7250518798828125, 0.746063232421875, 0.7670745849609375, 0.7880859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 11.0, 17.0, 79.0, 220.0, 286.0, 226.0, 115.0, 41.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.3907470703125, -37.66062545776367, -36.93050765991211, -36.20038604736328, -35.47026443481445, -34.74014663696289, -34.01002502441406, -33.279903411865234, -32.549781799316406, -31.81966209411621, -31.089540481567383, -30.359420776367188, -29.62929916381836, -28.899179458618164, -28.16905975341797, -27.43893814086914, -26.708820343017578, -25.978700637817383, -25.248579025268555, -24.51845932006836, -23.78833770751953, -23.058218002319336, -22.32809829711914, -21.597976684570312, -20.867856979370117, -20.137737274169922, -19.407615661621094, -18.6774959564209, -17.947376251220703, -17.217254638671875, -16.48713493347168, -15.757014274597168, -15.026893615722656, -14.296772956848145, -13.566652297973633, -12.836532592773438, -12.106411933898926, -11.376291275024414, -10.646171569824219, -9.916050910949707, -9.185930252075195, -8.455809593200684, -7.72568941116333, -6.995569229125977, -6.265448570251465, -5.535327911376953, -4.8052077293396, -4.075087547302246, -3.3449668884277344, -2.6148464679718018, -1.8847260475158691, -1.1546056270599365, -0.4244852066040039, 0.3056352138519287, 1.0357556343078613, 1.7658758163452148, 2.4959964752197266, 3.226116895675659, 3.956237316131592, 4.686357498168945, 5.416478157043457, 6.146598815917969, 6.876718997955322, 7.606839179992676, 8.336959838867188]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 6.0, 8.0, 10.0, 5.0, 13.0, 8.0, 15.0, 22.0, 22.0, 23.0, 19.0, 23.0, 30.0, 30.0, 29.0, 36.0, 44.0, 45.0, 33.0, 42.0, 44.0, 47.0, 37.0, 39.0, 32.0, 35.0, 33.0, 37.0, 28.0, 27.0, 16.0, 23.0, 19.0, 21.0, 11.0, 20.0, 15.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.060344696044922, -4.887916564941406, -4.715488433837891, -4.543060302734375, -4.370632171630859, -4.198204040527344, -4.025775909423828, -3.8533477783203125, -3.680919647216797, -3.5084915161132812, -3.3360633850097656, -3.16363525390625, -2.9912071228027344, -2.8187789916992188, -2.646350860595703, -2.4739227294921875, -2.301494598388672, -2.1290664672851562, -1.9566383361816406, -1.784210205078125, -1.6117820739746094, -1.4393539428710938, -1.2669258117675781, -1.0944976806640625, -0.9220695495605469, -0.7496414184570312, -0.5772132873535156, -0.40478515625, -0.23235702514648438, -0.05992889404296875, 0.11249923706054688, 0.2849273681640625, 0.4573554992675781, 0.6297836303710938, 0.8022117614746094, 0.974639892578125, 1.1470680236816406, 1.3194961547851562, 1.4919242858886719, 1.6643524169921875, 1.8367805480957031, 2.0092086791992188, 2.1816368103027344, 2.35406494140625, 2.5264930725097656, 2.6989212036132812, 2.871349334716797, 3.0437774658203125, 3.216205596923828, 3.3886337280273438, 3.5610618591308594, 3.733489990234375, 3.9059181213378906, 4.078346252441406, 4.250774383544922, 4.4232025146484375, 4.595630645751953, 4.768058776855469, 4.940486907958984, 5.1129150390625, 5.285343170166016, 5.457771301269531, 5.630199432373047, 5.8026275634765625, 5.975055694580078]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 11.0, 15.0, 22.0, 35.0, 62.0, 83.0, 137.0, 226.0, 361.0, 639.0, 1129.0, 2221.0, 4752.0, 10287.0, 26569.0, 81039.0, 446291.0, 3335660.0, 200636.0, 51006.0, 18125.0, 7501.0, 3472.0, 1730.0, 925.0, 492.0, 294.0, 186.0, 133.0, 84.0, 45.0, 25.0, 17.0, 14.0, 13.0, 11.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2220916748046875, -1.175628662109375, -1.1291656494140625, -1.08270263671875, -1.0362396240234375, -0.989776611328125, -0.9433135986328125, -0.8968505859375, -0.8503875732421875, -0.803924560546875, -0.7574615478515625, -0.71099853515625, -0.6645355224609375, -0.618072509765625, -0.5716094970703125, -0.525146484375, -0.4786834716796875, -0.432220458984375, -0.3857574462890625, -0.33929443359375, -0.2928314208984375, -0.246368408203125, -0.1999053955078125, -0.1534423828125, -0.1069793701171875, -0.060516357421875, -0.0140533447265625, 0.03240966796875, 0.0788726806640625, 0.125335693359375, 0.1717987060546875, 0.21826171875, 0.2647247314453125, 0.311187744140625, 0.3576507568359375, 0.40411376953125, 0.4505767822265625, 0.497039794921875, 0.5435028076171875, 0.5899658203125, 0.6364288330078125, 0.682891845703125, 0.7293548583984375, 0.77581787109375, 0.8222808837890625, 0.868743896484375, 0.9152069091796875, 0.961669921875, 1.0081329345703125, 1.054595947265625, 1.1010589599609375, 1.14752197265625, 1.1939849853515625, 1.240447998046875, 1.2869110107421875, 1.3333740234375, 1.3798370361328125, 1.426300048828125, 1.4727630615234375, 1.51922607421875, 1.5656890869140625, 1.612152099609375, 1.6586151123046875, 1.705078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 3.0, 6.0, 7.0, 5.0, 16.0, 12.0, 17.0, 22.0, 37.0, 24.0, 26.0, 30.0, 47.0, 55.0, 62.0, 62.0, 71.0, 61.0, 62.0, 53.0, 57.0, 51.0, 32.0, 41.0, 34.0, 31.0, 22.0, 8.0, 10.0, 12.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4658203125, -0.4527626037597656, -0.43970489501953125, -0.4266471862792969, -0.4135894775390625, -0.4005317687988281, -0.38747406005859375, -0.3744163513183594, -0.361358642578125, -0.3483009338378906, -0.33524322509765625, -0.3221855163574219, -0.3091278076171875, -0.2960700988769531, -0.28301239013671875, -0.2699546813964844, -0.25689697265625, -0.24383926391601562, -0.23078155517578125, -0.21772384643554688, -0.2046661376953125, -0.19160842895507812, -0.17855072021484375, -0.16549301147460938, -0.152435302734375, -0.13937759399414062, -0.12631988525390625, -0.11326217651367188, -0.1002044677734375, -0.08714675903320312, -0.07408905029296875, -0.061031341552734375, -0.0479736328125, -0.034915924072265625, -0.02185821533203125, -0.008800506591796875, 0.0042572021484375, 0.017314910888671875, 0.03037261962890625, 0.043430328369140625, 0.056488037109375, 0.06954574584960938, 0.08260345458984375, 0.09566116333007812, 0.1087188720703125, 0.12177658081054688, 0.13483428955078125, 0.14789199829101562, 0.16094970703125, 0.17400741577148438, 0.18706512451171875, 0.20012283325195312, 0.2131805419921875, 0.22623825073242188, 0.23929595947265625, 0.2523536682128906, 0.265411376953125, 0.2784690856933594, 0.29152679443359375, 0.3045845031738281, 0.3176422119140625, 0.3306999206542969, 0.34375762939453125, 0.3568153381347656, 0.369873046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 11.0, 9.0, 20.0, 36.0, 49.0, 47.0, 94.0, 119.0, 184.0, 297.0, 506.0, 726.0, 1169.0, 2048.0, 3841.0, 7595.0, 15257.0, 35040.0, 89827.0, 306289.0, 2993406.0, 526895.0, 125003.0, 45787.0, 19981.0, 9166.0, 4690.0, 2399.0, 1433.0, 828.0, 496.0, 315.0, 225.0, 136.0, 93.0, 91.0, 38.0, 39.0, 29.0, 23.0, 21.0, 6.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.158203125, -1.121612548828125, -1.08502197265625, -1.048431396484375, -1.0118408203125, -0.975250244140625, -0.93865966796875, -0.902069091796875, -0.865478515625, -0.828887939453125, -0.79229736328125, -0.755706787109375, -0.7191162109375, -0.682525634765625, -0.64593505859375, -0.609344482421875, -0.57275390625, -0.536163330078125, -0.49957275390625, -0.462982177734375, -0.4263916015625, -0.389801025390625, -0.35321044921875, -0.316619873046875, -0.280029296875, -0.243438720703125, -0.20684814453125, -0.170257568359375, -0.1336669921875, -0.097076416015625, -0.06048583984375, -0.023895263671875, 0.0126953125, 0.049285888671875, 0.08587646484375, 0.122467041015625, 0.1590576171875, 0.195648193359375, 0.23223876953125, 0.268829345703125, 0.305419921875, 0.342010498046875, 0.37860107421875, 0.415191650390625, 0.4517822265625, 0.488372802734375, 0.52496337890625, 0.561553955078125, 0.59814453125, 0.634735107421875, 0.67132568359375, 0.707916259765625, 0.7445068359375, 0.781097412109375, 0.81768798828125, 0.854278564453125, 0.890869140625, 0.927459716796875, 0.96405029296875, 1.000640869140625, 1.0372314453125, 1.073822021484375, 1.11041259765625, 1.147003173828125, 1.18359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 9.0, 17.0, 16.0, 39.0, 39.0, 65.0, 91.0, 159.0, 317.0, 1510.0, 1043.0, 293.0, 167.0, 82.0, 64.0, 39.0, 30.0, 20.0, 14.0, 10.0, 12.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.67236328125, -0.64990234375, -0.62744140625, -0.60498046875, -0.58251953125, -0.56005859375, -0.53759765625, -0.51513671875, -0.49267578125, -0.47021484375, -0.44775390625, -0.42529296875, -0.40283203125, -0.38037109375, -0.35791015625, -0.33544921875, -0.31298828125, -0.29052734375, -0.26806640625, -0.24560546875, -0.22314453125, -0.20068359375, -0.17822265625, -0.15576171875, -0.13330078125, -0.11083984375, -0.08837890625, -0.06591796875, -0.04345703125, -0.02099609375, 0.00146484375, 0.02392578125, 0.04638671875, 0.06884765625, 0.09130859375, 0.11376953125, 0.13623046875, 0.15869140625, 0.18115234375, 0.20361328125, 0.22607421875, 0.24853515625, 0.27099609375, 0.29345703125, 0.31591796875, 0.33837890625, 0.36083984375, 0.38330078125, 0.40576171875, 0.42822265625, 0.45068359375, 0.47314453125, 0.49560546875, 0.51806640625, 0.54052734375, 0.56298828125, 0.58544921875, 0.60791015625, 0.63037109375, 0.65283203125, 0.67529296875, 0.69775390625, 0.72021484375, 0.74267578125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 10.0, 20.0, 50.0, 107.0, 140.0, 195.0, 176.0, 140.0, 83.0, 45.0, 18.0, 6.0, 9.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.638930320739746, -7.436737537384033, -7.23454475402832, -7.032351970672607, -6.8301591873168945, -6.627966403961182, -6.425773620605469, -6.223580360412598, -6.021388053894043, -5.81919527053833, -5.617002487182617, -5.414809703826904, -5.212616920471191, -5.0104241371154785, -4.808231353759766, -4.6060380935668945, -4.403845310211182, -4.201652526855469, -3.999459743499756, -3.797266960144043, -3.59507417678833, -3.392881393432617, -3.190688371658325, -2.9884955883026123, -2.7863028049468994, -2.5841100215911865, -2.3819172382354736, -2.1797242164611816, -1.9775315523147583, -1.7753387689590454, -1.573145866394043, -1.37095308303833, -1.1687607765197754, -0.9665679931640625, -0.7643751502037048, -0.5621823072433472, -0.3599895238876343, -0.1577967405319214, 0.044396162033081055, 0.24658894538879395, 0.44878172874450684, 0.6509745121002197, 0.8531673550605774, 1.055360198020935, 1.257552981376648, 1.4597457647323608, 1.6619386672973633, 1.8641314506530762, 2.066324234008789, 2.268517017364502, 2.470709800720215, 2.6729025840759277, 2.8750953674316406, 3.0772881507873535, 3.2794811725616455, 3.4816739559173584, 3.6838667392730713, 3.886059522628784, 4.088252544403076, 4.290445327758789, 4.492638111114502, 4.694830894470215, 4.897023677825928, 5.099216461181641, 5.3014092445373535]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 14.0, 11.0, 12.0, 12.0, 8.0, 12.0, 17.0, 20.0, 21.0, 21.0, 26.0, 34.0, 50.0, 29.0, 41.0, 29.0, 49.0, 43.0, 55.0, 44.0, 34.0, 34.0, 40.0, 35.0, 49.0, 32.0, 37.0, 19.0, 24.0, 23.0, 23.0, 20.0, 13.0, 13.0, 12.0, 5.0, 4.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9029884338378906, -1.8425865173339844, -1.7821846008300781, -1.7217828035354614, -1.6613808870315552, -1.600978970527649, -1.5405771732330322, -1.480175256729126, -1.4197733402252197, -1.3593714237213135, -1.2989695072174072, -1.2385677099227905, -1.1781657934188843, -1.117763876914978, -1.0573620796203613, -0.9969601631164551, -0.9365582466125488, -0.8761563301086426, -0.8157544732093811, -0.7553526163101196, -0.6949506998062134, -0.6345487833023071, -0.5741469264030457, -0.5137450695037842, -0.45334315299987793, -0.39294126629829407, -0.3325393795967102, -0.27213749289512634, -0.21173560619354248, -0.15133371949195862, -0.09093183279037476, -0.030529946088790894, 0.02987205982208252, 0.09027394652366638, 0.15067583322525024, 0.2110777199268341, 0.27147960662841797, 0.33188149333000183, 0.3922833800315857, 0.45268526673316956, 0.5130871534347534, 0.5734890699386597, 0.6338909268379211, 0.6942927837371826, 0.7546947002410889, 0.8150966167449951, 0.8754984736442566, 0.9359003305435181, 0.9963022470474243, 1.0567041635513306, 1.1171059608459473, 1.1775078773498535, 1.2379097938537598, 1.298311710357666, 1.3587136268615723, 1.419115424156189, 1.4795173406600952, 1.5399192571640015, 1.6003210544586182, 1.6607229709625244, 1.7211248874664307, 1.781526803970337, 1.8419287204742432, 1.9023305177688599, 1.9627324342727661]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 7.0, 13.0, 15.0, 25.0, 40.0, 52.0, 81.0, 141.0, 243.0, 477.0, 831.0, 1671.0, 3406.0, 7453.0, 16919.0, 37827.0, 82196.0, 177101.0, 338716.0, 207508.0, 94275.0, 43397.0, 19403.0, 8768.0, 3992.0, 1905.0, 961.0, 439.0, 241.0, 155.0, 106.0, 60.0, 49.0, 22.0, 18.0, 7.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.470703125, -1.43157958984375, -1.3924560546875, -1.35333251953125, -1.314208984375, -1.27508544921875, -1.2359619140625, -1.19683837890625, -1.15771484375, -1.11859130859375, -1.0794677734375, -1.04034423828125, -1.001220703125, -0.96209716796875, -0.9229736328125, -0.88385009765625, -0.8447265625, -0.80560302734375, -0.7664794921875, -0.72735595703125, -0.688232421875, -0.64910888671875, -0.6099853515625, -0.57086181640625, -0.53173828125, -0.49261474609375, -0.4534912109375, -0.41436767578125, -0.375244140625, -0.33612060546875, -0.2969970703125, -0.25787353515625, -0.21875, -0.17962646484375, -0.1405029296875, -0.10137939453125, -0.062255859375, -0.02313232421875, 0.0159912109375, 0.05511474609375, 0.09423828125, 0.13336181640625, 0.1724853515625, 0.21160888671875, 0.250732421875, 0.28985595703125, 0.3289794921875, 0.36810302734375, 0.4072265625, 0.44635009765625, 0.4854736328125, 0.52459716796875, 0.563720703125, 0.60284423828125, 0.6419677734375, 0.68109130859375, 0.72021484375, 0.75933837890625, 0.7984619140625, 0.83758544921875, 0.876708984375, 0.91583251953125, 0.9549560546875, 0.99407958984375, 1.033203125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 14.0, 9.0, 21.0, 9.0, 24.0, 19.0, 30.0, 28.0, 39.0, 56.0, 48.0, 61.0, 67.0, 53.0, 64.0, 62.0, 49.0, 58.0, 54.0, 36.0, 27.0, 41.0, 31.0, 22.0, 17.0, 18.0, 13.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.470703125, -0.4572868347167969, -0.44387054443359375, -0.4304542541503906, -0.4170379638671875, -0.4036216735839844, -0.39020538330078125, -0.3767890930175781, -0.363372802734375, -0.3499565124511719, -0.33654022216796875, -0.3231239318847656, -0.3097076416015625, -0.2962913513183594, -0.28287506103515625, -0.2694587707519531, -0.25604248046875, -0.24262619018554688, -0.22920989990234375, -0.21579360961914062, -0.2023773193359375, -0.18896102905273438, -0.17554473876953125, -0.16212844848632812, -0.148712158203125, -0.13529586791992188, -0.12187957763671875, -0.10846328735351562, -0.0950469970703125, -0.08163070678710938, -0.06821441650390625, -0.054798126220703125, -0.0413818359375, -0.027965545654296875, -0.01454925537109375, -0.001132965087890625, 0.0122833251953125, 0.025699615478515625, 0.03911590576171875, 0.052532196044921875, 0.065948486328125, 0.07936477661132812, 0.09278106689453125, 0.10619735717773438, 0.1196136474609375, 0.13302993774414062, 0.14644622802734375, 0.15986251831054688, 0.17327880859375, 0.18669509887695312, 0.20011138916015625, 0.21352767944335938, 0.2269439697265625, 0.24036026000976562, 0.25377655029296875, 0.2671928405761719, 0.280609130859375, 0.2940254211425781, 0.30744171142578125, 0.3208580017089844, 0.3342742919921875, 0.3476905822753906, 0.36110687255859375, 0.3745231628417969, 0.387939453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 0.0, 8.0, 8.0, 2.0, 7.0, 21.0, 15.0, 20.0, 28.0, 36.0, 52.0, 65.0, 82.0, 126.0, 166.0, 226.0, 303.0, 495.0, 759.0, 1306.0, 2893.0, 8769.0, 33708.0, 133582.0, 533514.0, 245356.0, 62706.0, 15249.0, 4487.0, 1736.0, 969.0, 534.0, 348.0, 288.0, 170.0, 130.0, 105.0, 77.0, 58.0, 27.0, 27.0, 22.0, 25.0, 15.0, 9.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.06640625, -2.0032501220703125, -1.940093994140625, -1.8769378662109375, -1.81378173828125, -1.7506256103515625, -1.687469482421875, -1.6243133544921875, -1.5611572265625, -1.4980010986328125, -1.434844970703125, -1.3716888427734375, -1.30853271484375, -1.2453765869140625, -1.182220458984375, -1.1190643310546875, -1.055908203125, -0.9927520751953125, -0.929595947265625, -0.8664398193359375, -0.80328369140625, -0.7401275634765625, -0.676971435546875, -0.6138153076171875, -0.5506591796875, -0.4875030517578125, -0.424346923828125, -0.3611907958984375, -0.29803466796875, -0.2348785400390625, -0.171722412109375, -0.1085662841796875, -0.04541015625, 0.0177459716796875, 0.080902099609375, 0.1440582275390625, 0.20721435546875, 0.2703704833984375, 0.333526611328125, 0.3966827392578125, 0.4598388671875, 0.5229949951171875, 0.586151123046875, 0.6493072509765625, 0.71246337890625, 0.7756195068359375, 0.838775634765625, 0.9019317626953125, 0.965087890625, 1.0282440185546875, 1.091400146484375, 1.1545562744140625, 1.21771240234375, 1.2808685302734375, 1.344024658203125, 1.4071807861328125, 1.4703369140625, 1.5334930419921875, 1.596649169921875, 1.6598052978515625, 1.72296142578125, 1.7861175537109375, 1.849273681640625, 1.9124298095703125, 1.9755859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 6.0, 3.0, 9.0, 7.0, 9.0, 10.0, 8.0, 12.0, 20.0, 21.0, 26.0, 33.0, 27.0, 42.0, 43.0, 54.0, 45.0, 56.0, 43.0, 48.0, 49.0, 52.0, 51.0, 47.0, 46.0, 38.0, 32.0, 36.0, 21.0, 14.0, 13.0, 11.0, 11.0, 9.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.912109375, -1.854644775390625, -1.79718017578125, -1.739715576171875, -1.6822509765625, -1.624786376953125, -1.56732177734375, -1.509857177734375, -1.452392578125, -1.394927978515625, -1.33746337890625, -1.279998779296875, -1.2225341796875, -1.165069580078125, -1.10760498046875, -1.050140380859375, -0.99267578125, -0.935211181640625, -0.87774658203125, -0.820281982421875, -0.7628173828125, -0.705352783203125, -0.64788818359375, -0.590423583984375, -0.532958984375, -0.475494384765625, -0.41802978515625, -0.360565185546875, -0.3031005859375, -0.245635986328125, -0.18817138671875, -0.130706787109375, -0.0732421875, -0.015777587890625, 0.04168701171875, 0.099151611328125, 0.1566162109375, 0.214080810546875, 0.27154541015625, 0.329010009765625, 0.386474609375, 0.443939208984375, 0.50140380859375, 0.558868408203125, 0.6163330078125, 0.673797607421875, 0.73126220703125, 0.788726806640625, 0.84619140625, 0.903656005859375, 0.96112060546875, 1.018585205078125, 1.0760498046875, 1.133514404296875, 1.19097900390625, 1.248443603515625, 1.305908203125, 1.363372802734375, 1.42083740234375, 1.478302001953125, 1.5357666015625, 1.593231201171875, 1.65069580078125, 1.708160400390625, 1.765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 12.0, 27.0, 45.0, 64.0, 110.0, 182.0, 336.0, 752.0, 2088.0, 6958.0, 34519.0, 203908.0, 650716.0, 120274.0, 21124.0, 4571.0, 1536.0, 653.0, 266.0, 120.0, 94.0, 60.0, 30.0, 25.0, 16.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.615234375, -1.571990966796875, -1.52874755859375, -1.485504150390625, -1.4422607421875, -1.399017333984375, -1.35577392578125, -1.312530517578125, -1.269287109375, -1.226043701171875, -1.18280029296875, -1.139556884765625, -1.0963134765625, -1.053070068359375, -1.00982666015625, -0.966583251953125, -0.92333984375, -0.880096435546875, -0.83685302734375, -0.793609619140625, -0.7503662109375, -0.707122802734375, -0.66387939453125, -0.620635986328125, -0.577392578125, -0.534149169921875, -0.49090576171875, -0.447662353515625, -0.4044189453125, -0.361175537109375, -0.31793212890625, -0.274688720703125, -0.2314453125, -0.188201904296875, -0.14495849609375, -0.101715087890625, -0.0584716796875, -0.015228271484375, 0.02801513671875, 0.071258544921875, 0.114501953125, 0.157745361328125, 0.20098876953125, 0.244232177734375, 0.2874755859375, 0.330718994140625, 0.37396240234375, 0.417205810546875, 0.46044921875, 0.503692626953125, 0.54693603515625, 0.590179443359375, 0.6334228515625, 0.676666259765625, 0.71990966796875, 0.763153076171875, 0.806396484375, 0.849639892578125, 0.89288330078125, 0.936126708984375, 0.9793701171875, 1.022613525390625, 1.06585693359375, 1.109100341796875, 1.15234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 11.0, 11.0, 20.0, 24.0, 26.0, 28.0, 32.0, 40.0, 50.0, 66.0, 132.0, 138.0, 97.0, 64.0, 45.0, 41.0, 32.0, 26.0, 15.0, 22.0, 8.0, 17.0, 14.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002073049545288086, -0.00019999034702777863, -0.00019267573952674866, -0.0001853611320257187, -0.00017804652452468872, -0.00017073191702365875, -0.00016341730952262878, -0.00015610270202159882, -0.00014878809452056885, -0.00014147348701953888, -0.0001341588795185089, -0.00012684427201747894, -0.00011952966451644897, -0.000112215057015419, -0.00010490044951438904, -9.758584201335907e-05, -9.02712345123291e-05, -8.295662701129913e-05, -7.564201951026917e-05, -6.83274120092392e-05, -6.101280450820923e-05, -5.369819700717926e-05, -4.638358950614929e-05, -3.9068982005119324e-05, -3.1754374504089355e-05, -2.4439767003059387e-05, -1.712515950202942e-05, -9.81055200099945e-06, -2.4959444999694824e-06, 4.818663001060486e-06, 1.2133270502090454e-05, 1.9447878003120422e-05, 2.676248550415039e-05, 3.407709300518036e-05, 4.139170050621033e-05, 4.8706308007240295e-05, 5.6020915508270264e-05, 6.333552300930023e-05, 7.06501305103302e-05, 7.796473801136017e-05, 8.527934551239014e-05, 9.25939530134201e-05, 9.990856051445007e-05, 0.00010722316801548004, 0.00011453777551651001, 0.00012185238301753998, 0.00012916699051856995, 0.00013648159801959991, 0.00014379620552062988, 0.00015111081302165985, 0.00015842542052268982, 0.0001657400280237198, 0.00017305463552474976, 0.00018036924302577972, 0.0001876838505268097, 0.00019499845802783966, 0.00020231306552886963, 0.0002096276730298996, 0.00021694228053092957, 0.00022425688803195953, 0.0002315714955329895, 0.00023888610303401947, 0.00024620071053504944, 0.0002535153180360794, 0.0002608299255371094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 5.0, 18.0, 34.0, 58.0, 140.0, 298.0, 973.0, 6640.0, 295915.0, 730399.0, 12061.0, 1344.0, 365.0, 144.0, 80.0, 36.0, 22.0, 11.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.1158447265625, -2.005126953125, -1.8944091796875, -1.78369140625, -1.6729736328125, -1.562255859375, -1.4515380859375, -1.3408203125, -1.2301025390625, -1.119384765625, -1.0086669921875, -0.89794921875, -0.7872314453125, -0.676513671875, -0.5657958984375, -0.455078125, -0.3443603515625, -0.233642578125, -0.1229248046875, -0.01220703125, 0.0985107421875, 0.209228515625, 0.3199462890625, 0.4306640625, 0.5413818359375, 0.652099609375, 0.7628173828125, 0.87353515625, 0.9842529296875, 1.094970703125, 1.2056884765625, 1.31640625, 1.4271240234375, 1.537841796875, 1.6485595703125, 1.75927734375, 1.8699951171875, 1.980712890625, 2.0914306640625, 2.2021484375, 2.3128662109375, 2.423583984375, 2.5343017578125, 2.64501953125, 2.7557373046875, 2.866455078125, 2.9771728515625, 3.087890625, 3.1986083984375, 3.309326171875, 3.4200439453125, 3.53076171875, 3.6414794921875, 3.752197265625, 3.8629150390625, 3.9736328125, 4.0843505859375, 4.195068359375, 4.3057861328125, 4.41650390625, 4.5272216796875, 4.637939453125, 4.7486572265625, 4.859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 14.0, 17.0, 22.0, 22.0, 32.0, 43.0, 42.0, 79.0, 102.0, 133.0, 112.0, 85.0, 71.0, 52.0, 44.0, 29.0, 22.0, 17.0, 7.0, 12.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.134765625, -1.0979461669921875, -1.061126708984375, -1.0243072509765625, -0.98748779296875, -0.9506683349609375, -0.913848876953125, -0.8770294189453125, -0.8402099609375, -0.8033905029296875, -0.766571044921875, -0.7297515869140625, -0.69293212890625, -0.6561126708984375, -0.619293212890625, -0.5824737548828125, -0.545654296875, -0.5088348388671875, -0.472015380859375, -0.4351959228515625, -0.39837646484375, -0.3615570068359375, -0.324737548828125, -0.2879180908203125, -0.2510986328125, -0.2142791748046875, -0.177459716796875, -0.1406402587890625, -0.10382080078125, -0.0670013427734375, -0.030181884765625, 0.0066375732421875, 0.04345703125, 0.0802764892578125, 0.117095947265625, 0.1539154052734375, 0.19073486328125, 0.2275543212890625, 0.264373779296875, 0.3011932373046875, 0.3380126953125, 0.3748321533203125, 0.411651611328125, 0.4484710693359375, 0.48529052734375, 0.5221099853515625, 0.558929443359375, 0.5957489013671875, 0.632568359375, 0.6693878173828125, 0.706207275390625, 0.7430267333984375, 0.77984619140625, 0.8166656494140625, 0.853485107421875, 0.8903045654296875, 0.9271240234375, 0.9639434814453125, 1.000762939453125, 1.0375823974609375, 1.07440185546875, 1.1112213134765625, 1.148040771484375, 1.1848602294921875, 1.2216796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 17.0, 41.0, 73.0, 122.0, 176.0, 195.0, 168.0, 111.0, 53.0, 27.0, 7.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.097789764404297, -18.418212890625, -17.738636016845703, -17.059059143066406, -16.37948226928711, -15.699904441833496, -15.020326614379883, -14.340749740600586, -13.661172866821289, -12.981595993041992, -12.302019119262695, -11.622441291809082, -10.942864418029785, -10.263287544250488, -9.583709716796875, -8.904132843017578, -8.224555969238281, -7.544979095458984, -6.865401744842529, -6.185824394226074, -5.506247520446777, -4.8266706466674805, -4.147093296051025, -3.4675159454345703, -2.7879390716552734, -2.1083619594573975, -1.4287848472595215, -0.7492077350616455, -0.06963062286376953, 0.6099464893341064, 1.2895236015319824, 1.9691009521484375, 2.648679733276367, 3.328256845474243, 4.007833957672119, 4.687411308288574, 5.366988182067871, 6.046565055847168, 6.726142406463623, 7.405719757080078, 8.085296630859375, 8.764873504638672, 9.444450378417969, 10.124028205871582, 10.803605079650879, 11.483181953430176, 12.162759780883789, 12.842336654663086, 13.521913528442383, 14.20149040222168, 14.881067276000977, 15.56064510345459, 16.240222930908203, 16.9197998046875, 17.599376678466797, 18.278953552246094, 18.95853042602539, 19.638107299804688, 20.317684173583984, 20.99726104736328, 21.676837921142578, 22.356416702270508, 23.035993576049805, 23.7155704498291, 24.3951473236084]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 8.0, 9.0, 11.0, 17.0, 19.0, 18.0, 27.0, 24.0, 27.0, 28.0, 31.0, 36.0, 27.0, 36.0, 33.0, 35.0, 46.0, 32.0, 58.0, 41.0, 54.0, 42.0, 37.0, 38.0, 33.0, 31.0, 37.0, 17.0, 20.0, 24.0, 12.0, 18.0, 13.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.588407516479492, -8.307476043701172, -8.026544570922852, -7.745614051818848, -7.464682579040527, -7.183751106262207, -6.902820110321045, -6.621889114379883, -6.3409576416015625, -6.060026168823242, -5.77909517288208, -5.498164176940918, -5.217232704162598, -4.936301231384277, -4.655370235443115, -4.374439239501953, -4.093507766723633, -3.8125765323638916, -3.5316452980041504, -3.250714063644409, -2.969782829284668, -2.6888515949249268, -2.4079203605651855, -2.1269891262054443, -1.8460578918457031, -1.565126657485962, -1.2841954231262207, -1.0032641887664795, -0.7223329544067383, -0.44140172004699707, -0.16047048568725586, 0.12046074867248535, 0.40139102935791016, 0.6823222637176514, 0.9632534980773926, 1.2441847324371338, 1.525115966796875, 1.8060472011566162, 2.0869784355163574, 2.3679096698760986, 2.64884090423584, 2.929772138595581, 3.2107033729553223, 3.4916346073150635, 3.7725658416748047, 4.053497314453125, 4.334428310394287, 4.615359306335449, 4.8962907791137695, 5.17722225189209, 5.458153247833252, 5.739084243774414, 6.020015716552734, 6.300947189331055, 6.581878185272217, 6.862809181213379, 7.143740653991699, 7.4246721267700195, 7.705603122711182, 7.986534118652344, 8.267465591430664, 8.548397064208984, 8.829328536987305, 9.110259056091309, 9.391190528869629]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 12.0, 29.0, 37.0, 85.0, 142.0, 208.0, 393.0, 740.0, 1567.0, 3530.0, 8469.0, 23897.0, 81698.0, 496976.0, 3291564.0, 210927.0, 48169.0, 15365.0, 5733.0, 2432.0, 1101.0, 549.0, 241.0, 172.0, 92.0, 48.0, 33.0, 27.0, 14.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1494293212890625, -1.092803955078125, -1.0361785888671875, -0.97955322265625, -0.9229278564453125, -0.866302490234375, -0.8096771240234375, -0.7530517578125, -0.6964263916015625, -0.639801025390625, -0.5831756591796875, -0.52655029296875, -0.4699249267578125, -0.413299560546875, -0.3566741943359375, -0.300048828125, -0.2434234619140625, -0.186798095703125, -0.1301727294921875, -0.07354736328125, -0.0169219970703125, 0.039703369140625, 0.0963287353515625, 0.1529541015625, 0.2095794677734375, 0.266204833984375, 0.3228302001953125, 0.37945556640625, 0.4360809326171875, 0.492706298828125, 0.5493316650390625, 0.60595703125, 0.6625823974609375, 0.719207763671875, 0.7758331298828125, 0.83245849609375, 0.8890838623046875, 0.945709228515625, 1.0023345947265625, 1.0589599609375, 1.1155853271484375, 1.172210693359375, 1.2288360595703125, 1.28546142578125, 1.3420867919921875, 1.398712158203125, 1.4553375244140625, 1.511962890625, 1.5685882568359375, 1.625213623046875, 1.6818389892578125, 1.73846435546875, 1.7950897216796875, 1.851715087890625, 1.9083404541015625, 1.9649658203125, 2.0215911865234375, 2.078216552734375, 2.1348419189453125, 2.19146728515625, 2.2480926513671875, 2.304718017578125, 2.3613433837890625, 2.41796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 9.0, 7.0, 13.0, 19.0, 17.0, 18.0, 18.0, 22.0, 27.0, 38.0, 52.0, 48.0, 57.0, 63.0, 45.0, 52.0, 58.0, 58.0, 56.0, 43.0, 52.0, 40.0, 32.0, 13.0, 30.0, 25.0, 22.0, 15.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.48095703125, -0.4669036865234375, -0.452850341796875, -0.4387969970703125, -0.42474365234375, -0.4106903076171875, -0.396636962890625, -0.3825836181640625, -0.3685302734375, -0.3544769287109375, -0.340423583984375, -0.3263702392578125, -0.31231689453125, -0.2982635498046875, -0.284210205078125, -0.2701568603515625, -0.256103515625, -0.2420501708984375, -0.227996826171875, -0.2139434814453125, -0.19989013671875, -0.1858367919921875, -0.171783447265625, -0.1577301025390625, -0.1436767578125, -0.1296234130859375, -0.115570068359375, -0.1015167236328125, -0.08746337890625, -0.0734100341796875, -0.059356689453125, -0.0453033447265625, -0.03125, -0.0171966552734375, -0.003143310546875, 0.0109100341796875, 0.02496337890625, 0.0390167236328125, 0.053070068359375, 0.0671234130859375, 0.0811767578125, 0.0952301025390625, 0.109283447265625, 0.1233367919921875, 0.13739013671875, 0.1514434814453125, 0.165496826171875, 0.1795501708984375, 0.193603515625, 0.2076568603515625, 0.221710205078125, 0.2357635498046875, 0.24981689453125, 0.2638702392578125, 0.277923583984375, 0.2919769287109375, 0.3060302734375, 0.3200836181640625, 0.334136962890625, 0.3481903076171875, 0.36224365234375, 0.3762969970703125, 0.390350341796875, 0.4044036865234375, 0.41845703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 9.0, 20.0, 14.0, 25.0, 42.0, 61.0, 92.0, 168.0, 266.0, 481.0, 882.0, 1597.0, 3058.0, 6295.0, 13736.0, 32240.0, 87184.0, 302477.0, 2700713.0, 789608.0, 161127.0, 53781.0, 21490.0, 9415.0, 4506.0, 2207.0, 1188.0, 639.0, 353.0, 201.0, 119.0, 90.0, 54.0, 51.0, 26.0, 10.0, 17.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3515625, -1.3076324462890625, -1.263702392578125, -1.2197723388671875, -1.17584228515625, -1.1319122314453125, -1.087982177734375, -1.0440521240234375, -1.0001220703125, -0.9561920166015625, -0.912261962890625, -0.8683319091796875, -0.82440185546875, -0.7804718017578125, -0.736541748046875, -0.6926116943359375, -0.648681640625, -0.6047515869140625, -0.560821533203125, -0.5168914794921875, -0.47296142578125, -0.4290313720703125, -0.385101318359375, -0.3411712646484375, -0.2972412109375, -0.2533111572265625, -0.209381103515625, -0.1654510498046875, -0.12152099609375, -0.0775909423828125, -0.033660888671875, 0.0102691650390625, 0.05419921875, 0.0981292724609375, 0.142059326171875, 0.1859893798828125, 0.22991943359375, 0.2738494873046875, 0.317779541015625, 0.3617095947265625, 0.4056396484375, 0.4495697021484375, 0.493499755859375, 0.5374298095703125, 0.58135986328125, 0.6252899169921875, 0.669219970703125, 0.7131500244140625, 0.757080078125, 0.8010101318359375, 0.844940185546875, 0.8888702392578125, 0.93280029296875, 0.9767303466796875, 1.020660400390625, 1.0645904541015625, 1.1085205078125, 1.1524505615234375, 1.196380615234375, 1.2403106689453125, 1.28424072265625, 1.3281707763671875, 1.372100830078125, 1.4160308837890625, 1.4599609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 13.0, 16.0, 20.0, 40.0, 48.0, 63.0, 116.0, 156.0, 238.0, 527.0, 1504.0, 581.0, 275.0, 138.0, 109.0, 53.0, 53.0, 32.0, 25.0, 9.0, 10.0, 7.0, 4.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.037109375, -1.0061798095703125, -0.975250244140625, -0.9443206787109375, -0.91339111328125, -0.8824615478515625, -0.851531982421875, -0.8206024169921875, -0.7896728515625, -0.7587432861328125, -0.727813720703125, -0.6968841552734375, -0.66595458984375, -0.6350250244140625, -0.604095458984375, -0.5731658935546875, -0.542236328125, -0.5113067626953125, -0.480377197265625, -0.4494476318359375, -0.41851806640625, -0.3875885009765625, -0.356658935546875, -0.3257293701171875, -0.2947998046875, -0.2638702392578125, -0.232940673828125, -0.2020111083984375, -0.17108154296875, -0.1401519775390625, -0.109222412109375, -0.0782928466796875, -0.04736328125, -0.0164337158203125, 0.014495849609375, 0.0454254150390625, 0.07635498046875, 0.1072845458984375, 0.138214111328125, 0.1691436767578125, 0.2000732421875, 0.2310028076171875, 0.261932373046875, 0.2928619384765625, 0.32379150390625, 0.3547210693359375, 0.385650634765625, 0.4165802001953125, 0.447509765625, 0.4784393310546875, 0.509368896484375, 0.5402984619140625, 0.57122802734375, 0.6021575927734375, 0.633087158203125, 0.6640167236328125, 0.6949462890625, 0.7258758544921875, 0.756805419921875, 0.7877349853515625, 0.81866455078125, 0.8495941162109375, 0.880523681640625, 0.9114532470703125, 0.9423828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 23.0, 43.0, 65.0, 122.0, 161.0, 168.0, 161.0, 120.0, 76.0, 26.0, 16.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.415340423583984, -13.128097534179688, -12.84085464477539, -12.553610801696777, -12.26636791229248, -11.979125022888184, -11.691882133483887, -11.40463924407959, -11.117395401000977, -10.83015251159668, -10.542909622192383, -10.25566577911377, -9.968422889709473, -9.681180000305176, -9.393937110900879, -9.106694221496582, -8.819451332092285, -8.532208442687988, -8.244965553283691, -7.957722187042236, -7.670478820800781, -7.383235931396484, -7.0959930419921875, -6.808750152587891, -6.5215067863464355, -6.234263896942139, -5.947020530700684, -5.659777641296387, -5.37253475189209, -5.085291385650635, -4.798048496246338, -4.510805130004883, -4.223561763763428, -3.9363186359405518, -3.649075508117676, -3.361832618713379, -3.074589490890503, -2.787346363067627, -2.50010347366333, -2.212860345840454, -1.9256172180175781, -1.6383740901947021, -1.3511310815811157, -1.0638880729675293, -0.7766449451446533, -0.48940181732177734, -0.20215880870819092, 0.08508419990539551, 0.3723273277282715, 0.6595703959465027, 0.9468134641647339, 1.2340564727783203, 1.5212996006011963, 1.8085427284240723, 2.095785617828369, 2.383028745651245, 2.670271873474121, 2.957515001296997, 3.244758129119873, 3.53200101852417, 3.819244146347046, 4.106487274169922, 4.393730163574219, 4.680973052978516, 4.968216419219971]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 11.0, 7.0, 8.0, 14.0, 18.0, 27.0, 23.0, 30.0, 31.0, 33.0, 40.0, 45.0, 39.0, 42.0, 55.0, 40.0, 51.0, 52.0, 49.0, 37.0, 40.0, 42.0, 40.0, 32.0, 36.0, 26.0, 14.0, 15.0, 20.0, 18.0, 13.0, 13.0, 8.0, 5.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5559964179992676, -3.444936990737915, -3.3338775634765625, -3.222817897796631, -3.1117584705352783, -3.000699043273926, -2.889639377593994, -2.7785799503326416, -2.667520523071289, -2.5564610958099365, -2.445401668548584, -2.3343420028686523, -2.2232825756073, -2.1122231483459473, -2.0011634826660156, -1.890104055404663, -1.7790446281433105, -1.667985200881958, -1.556925654411316, -1.4458661079406738, -1.3348066806793213, -1.2237472534179688, -1.1126877069473267, -1.0016281604766846, -0.890568733215332, -0.7795092463493347, -0.6684497594833374, -0.5573902726173401, -0.4463307857513428, -0.33527129888534546, -0.22421181201934814, -0.11315232515335083, -0.002092599868774414, 0.1089668869972229, 0.22002637386322021, 0.33108586072921753, 0.44214534759521484, 0.5532048344612122, 0.6642643213272095, 0.7753238081932068, 0.8863832950592041, 0.9974427819252014, 1.1085022687911987, 1.2195618152618408, 1.3306212425231934, 1.441680669784546, 1.552740216255188, 1.66379976272583, 1.7748591899871826, 1.8859186172485352, 1.9969781637191772, 2.1080377101898193, 2.219097137451172, 2.3301565647125244, 2.441215991973877, 2.5522756576538086, 2.663335084915161, 2.7743945121765137, 2.8854541778564453, 2.996513605117798, 3.1075730323791504, 3.218632459640503, 3.3296918869018555, 3.440751552581787, 3.5518109798431396]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 13.0, 14.0, 29.0, 33.0, 67.0, 76.0, 137.0, 245.0, 427.0, 840.0, 1776.0, 3769.0, 8665.0, 20849.0, 50929.0, 121193.0, 245005.0, 289868.0, 173067.0, 76268.0, 31447.0, 12981.0, 5683.0, 2543.0, 1198.0, 598.0, 333.0, 185.0, 112.0, 79.0, 44.0, 29.0, 11.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4384765625, -1.3951873779296875, -1.351898193359375, -1.3086090087890625, -1.26531982421875, -1.2220306396484375, -1.178741455078125, -1.1354522705078125, -1.0921630859375, -1.0488739013671875, -1.005584716796875, -0.9622955322265625, -0.91900634765625, -0.8757171630859375, -0.832427978515625, -0.7891387939453125, -0.745849609375, -0.7025604248046875, -0.659271240234375, -0.6159820556640625, -0.57269287109375, -0.5294036865234375, -0.486114501953125, -0.4428253173828125, -0.3995361328125, -0.3562469482421875, -0.312957763671875, -0.2696685791015625, -0.22637939453125, -0.1830902099609375, -0.139801025390625, -0.0965118408203125, -0.05322265625, -0.0099334716796875, 0.033355712890625, 0.0766448974609375, 0.11993408203125, 0.1632232666015625, 0.206512451171875, 0.2498016357421875, 0.2930908203125, 0.3363800048828125, 0.379669189453125, 0.4229583740234375, 0.46624755859375, 0.5095367431640625, 0.552825927734375, 0.5961151123046875, 0.639404296875, 0.6826934814453125, 0.725982666015625, 0.7692718505859375, 0.81256103515625, 0.8558502197265625, 0.899139404296875, 0.9424285888671875, 0.9857177734375, 1.0290069580078125, 1.072296142578125, 1.1155853271484375, 1.15887451171875, 1.2021636962890625, 1.245452880859375, 1.2887420654296875, 1.33203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 3.0, 6.0, 13.0, 13.0, 9.0, 18.0, 22.0, 26.0, 24.0, 37.0, 37.0, 31.0, 47.0, 46.0, 40.0, 51.0, 51.0, 62.0, 59.0, 58.0, 48.0, 47.0, 46.0, 42.0, 32.0, 32.0, 22.0, 22.0, 11.0, 11.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4773597717285156, -0.46277618408203125, -0.4481925964355469, -0.4336090087890625, -0.4190254211425781, -0.40444183349609375, -0.3898582458496094, -0.375274658203125, -0.3606910705566406, -0.34610748291015625, -0.3315238952636719, -0.3169403076171875, -0.3023567199707031, -0.28777313232421875, -0.2731895446777344, -0.25860595703125, -0.24402236938476562, -0.22943878173828125, -0.21485519409179688, -0.2002716064453125, -0.18568801879882812, -0.17110443115234375, -0.15652084350585938, -0.141937255859375, -0.12735366821289062, -0.11277008056640625, -0.09818649291992188, -0.0836029052734375, -0.06901931762695312, -0.05443572998046875, -0.039852142333984375, -0.0252685546875, -0.010684967041015625, 0.00389862060546875, 0.018482208251953125, 0.0330657958984375, 0.047649383544921875, 0.06223297119140625, 0.07681655883789062, 0.091400146484375, 0.10598373413085938, 0.12056732177734375, 0.13515090942382812, 0.1497344970703125, 0.16431808471679688, 0.17890167236328125, 0.19348526000976562, 0.20806884765625, 0.22265243530273438, 0.23723602294921875, 0.2518196105957031, 0.2664031982421875, 0.2809867858886719, 0.29557037353515625, 0.3101539611816406, 0.324737548828125, 0.3393211364746094, 0.35390472412109375, 0.3684883117675781, 0.3830718994140625, 0.3976554870605469, 0.41223907470703125, 0.4268226623535156, 0.44140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 9.0, 5.0, 25.0, 25.0, 29.0, 39.0, 72.0, 87.0, 107.0, 202.0, 273.0, 433.0, 726.0, 1355.0, 3601.0, 15184.0, 92782.0, 481092.0, 372010.0, 63588.0, 11118.0, 2744.0, 1159.0, 607.0, 380.0, 274.0, 194.0, 137.0, 93.0, 49.0, 52.0, 33.0, 12.0, 17.0, 7.0, 11.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.376495361328125, -2.28814697265625, -2.199798583984375, -2.1114501953125, -2.023101806640625, -1.93475341796875, -1.846405029296875, -1.758056640625, -1.669708251953125, -1.58135986328125, -1.493011474609375, -1.4046630859375, -1.316314697265625, -1.22796630859375, -1.139617919921875, -1.05126953125, -0.962921142578125, -0.87457275390625, -0.786224365234375, -0.6978759765625, -0.609527587890625, -0.52117919921875, -0.432830810546875, -0.344482421875, -0.256134033203125, -0.16778564453125, -0.079437255859375, 0.0089111328125, 0.097259521484375, 0.18560791015625, 0.273956298828125, 0.3623046875, 0.450653076171875, 0.53900146484375, 0.627349853515625, 0.7156982421875, 0.804046630859375, 0.89239501953125, 0.980743408203125, 1.069091796875, 1.157440185546875, 1.24578857421875, 1.334136962890625, 1.4224853515625, 1.510833740234375, 1.59918212890625, 1.687530517578125, 1.77587890625, 1.864227294921875, 1.95257568359375, 2.040924072265625, 2.1292724609375, 2.217620849609375, 2.30596923828125, 2.394317626953125, 2.482666015625, 2.571014404296875, 2.65936279296875, 2.747711181640625, 2.8360595703125, 2.924407958984375, 3.01275634765625, 3.101104736328125, 3.189453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 13.0, 5.0, 9.0, 12.0, 12.0, 18.0, 17.0, 18.0, 21.0, 36.0, 26.0, 37.0, 32.0, 29.0, 35.0, 44.0, 47.0, 36.0, 46.0, 47.0, 38.0, 49.0, 41.0, 38.0, 24.0, 28.0, 31.0, 23.0, 20.0, 26.0, 16.0, 17.0, 17.0, 13.0, 16.0, 10.0, 14.0, 5.0, 3.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.017578125, -1.952178955078125, -1.88677978515625, -1.821380615234375, -1.7559814453125, -1.690582275390625, -1.62518310546875, -1.559783935546875, -1.494384765625, -1.428985595703125, -1.36358642578125, -1.298187255859375, -1.2327880859375, -1.167388916015625, -1.10198974609375, -1.036590576171875, -0.97119140625, -0.905792236328125, -0.84039306640625, -0.774993896484375, -0.7095947265625, -0.644195556640625, -0.57879638671875, -0.513397216796875, -0.447998046875, -0.382598876953125, -0.31719970703125, -0.251800537109375, -0.1864013671875, -0.121002197265625, -0.05560302734375, 0.009796142578125, 0.0751953125, 0.140594482421875, 0.20599365234375, 0.271392822265625, 0.3367919921875, 0.402191162109375, 0.46759033203125, 0.532989501953125, 0.598388671875, 0.663787841796875, 0.72918701171875, 0.794586181640625, 0.8599853515625, 0.925384521484375, 0.99078369140625, 1.056182861328125, 1.12158203125, 1.186981201171875, 1.25238037109375, 1.317779541015625, 1.3831787109375, 1.448577880859375, 1.51397705078125, 1.579376220703125, 1.644775390625, 1.710174560546875, 1.77557373046875, 1.840972900390625, 1.9063720703125, 1.971771240234375, 2.03717041015625, 2.102569580078125, 2.16796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 7.0, 6.0, 8.0, 6.0, 11.0, 15.0, 19.0, 36.0, 55.0, 82.0, 130.0, 272.0, 540.0, 1065.0, 2343.0, 6647.0, 23043.0, 97857.0, 416354.0, 381691.0, 87634.0, 20363.0, 6097.0, 2217.0, 955.0, 473.0, 251.0, 132.0, 95.0, 42.0, 31.0, 31.0, 18.0, 11.0, 9.0, 1.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9666900634765625, -0.924591064453125, -0.8824920654296875, -0.84039306640625, -0.7982940673828125, -0.756195068359375, -0.7140960693359375, -0.6719970703125, -0.6298980712890625, -0.587799072265625, -0.5457000732421875, -0.50360107421875, -0.4615020751953125, -0.419403076171875, -0.3773040771484375, -0.335205078125, -0.2931060791015625, -0.251007080078125, -0.2089080810546875, -0.16680908203125, -0.1247100830078125, -0.082611083984375, -0.0405120849609375, 0.0015869140625, 0.0436859130859375, 0.085784912109375, 0.1278839111328125, 0.16998291015625, 0.2120819091796875, 0.254180908203125, 0.2962799072265625, 0.33837890625, 0.3804779052734375, 0.422576904296875, 0.4646759033203125, 0.50677490234375, 0.5488739013671875, 0.590972900390625, 0.6330718994140625, 0.6751708984375, 0.7172698974609375, 0.759368896484375, 0.8014678955078125, 0.84356689453125, 0.8856658935546875, 0.927764892578125, 0.9698638916015625, 1.011962890625, 1.0540618896484375, 1.096160888671875, 1.1382598876953125, 1.18035888671875, 1.2224578857421875, 1.264556884765625, 1.3066558837890625, 1.3487548828125, 1.3908538818359375, 1.432952880859375, 1.4750518798828125, 1.51715087890625, 1.5592498779296875, 1.601348876953125, 1.6434478759765625, 1.685546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 2.0, 7.0, 13.0, 24.0, 25.0, 27.0, 37.0, 55.0, 60.0, 83.0, 105.0, 96.0, 104.0, 74.0, 56.0, 54.0, 37.0, 30.0, 23.0, 19.0, 16.0, 5.0, 18.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031280517578125, -0.0003044009208679199, -0.00029599666595458984, -0.00028759241104125977, -0.0002791881561279297, -0.0002707839012145996, -0.00026237964630126953, -0.00025397539138793945, -0.0002455711364746094, -0.0002371668815612793, -0.00022876262664794922, -0.00022035837173461914, -0.00021195411682128906, -0.00020354986190795898, -0.0001951456069946289, -0.00018674135208129883, -0.00017833709716796875, -0.00016993284225463867, -0.0001615285873413086, -0.00015312433242797852, -0.00014472007751464844, -0.00013631582260131836, -0.00012791156768798828, -0.0001195073127746582, -0.00011110305786132812, -0.00010269880294799805, -9.429454803466797e-05, -8.589029312133789e-05, -7.748603820800781e-05, -6.908178329467773e-05, -6.0677528381347656e-05, -5.227327346801758e-05, -4.38690185546875e-05, -3.546476364135742e-05, -2.7060508728027344e-05, -1.8656253814697266e-05, -1.0251998901367188e-05, -1.8477439880371094e-06, 6.556510925292969e-06, 1.4960765838623047e-05, 2.3365020751953125e-05, 3.17692756652832e-05, 4.017353057861328e-05, 4.857778549194336e-05, 5.698204040527344e-05, 6.538629531860352e-05, 7.37905502319336e-05, 8.219480514526367e-05, 9.059906005859375e-05, 9.900331497192383e-05, 0.0001074075698852539, 0.00011581182479858398, 0.00012421607971191406, 0.00013262033462524414, 0.00014102458953857422, 0.0001494288444519043, 0.00015783309936523438, 0.00016623735427856445, 0.00017464160919189453, 0.0001830458641052246, 0.0001914501190185547, 0.00019985437393188477, 0.00020825862884521484, 0.00021666288375854492, 0.000225067138671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 15.0, 9.0, 13.0, 20.0, 22.0, 47.0, 59.0, 85.0, 135.0, 169.0, 279.0, 510.0, 894.0, 1681.0, 3518.0, 8885.0, 27734.0, 105180.0, 403992.0, 363862.0, 91701.0, 24592.0, 8141.0, 3237.0, 1542.0, 829.0, 473.0, 294.0, 181.0, 142.0, 81.0, 53.0, 38.0, 33.0, 31.0, 16.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2265625, -1.1869354248046875, -1.147308349609375, -1.1076812744140625, -1.06805419921875, -1.0284271240234375, -0.988800048828125, -0.9491729736328125, -0.9095458984375, -0.8699188232421875, -0.830291748046875, -0.7906646728515625, -0.75103759765625, -0.7114105224609375, -0.671783447265625, -0.6321563720703125, -0.592529296875, -0.5529022216796875, -0.513275146484375, -0.4736480712890625, -0.43402099609375, -0.3943939208984375, -0.354766845703125, -0.3151397705078125, -0.2755126953125, -0.2358856201171875, -0.196258544921875, -0.1566314697265625, -0.11700439453125, -0.0773773193359375, -0.037750244140625, 0.0018768310546875, 0.04150390625, 0.0811309814453125, 0.120758056640625, 0.1603851318359375, 0.20001220703125, 0.2396392822265625, 0.279266357421875, 0.3188934326171875, 0.3585205078125, 0.3981475830078125, 0.437774658203125, 0.4774017333984375, 0.51702880859375, 0.5566558837890625, 0.596282958984375, 0.6359100341796875, 0.675537109375, 0.7151641845703125, 0.754791259765625, 0.7944183349609375, 0.83404541015625, 0.8736724853515625, 0.913299560546875, 0.9529266357421875, 0.9925537109375, 1.0321807861328125, 1.071807861328125, 1.1114349365234375, 1.15106201171875, 1.1906890869140625, 1.230316162109375, 1.2699432373046875, 1.3095703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 5.0, 6.0, 11.0, 15.0, 21.0, 20.0, 29.0, 28.0, 39.0, 48.0, 58.0, 55.0, 63.0, 63.0, 83.0, 77.0, 54.0, 59.0, 44.0, 37.0, 39.0, 27.0, 30.0, 13.0, 14.0, 16.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1119232177734375, -1.078338623046875, -1.0447540283203125, -1.01116943359375, -0.9775848388671875, -0.944000244140625, -0.9104156494140625, -0.8768310546875, -0.8432464599609375, -0.809661865234375, -0.7760772705078125, -0.74249267578125, -0.7089080810546875, -0.675323486328125, -0.6417388916015625, -0.608154296875, -0.5745697021484375, -0.540985107421875, -0.5074005126953125, -0.47381591796875, -0.4402313232421875, -0.406646728515625, -0.3730621337890625, -0.3394775390625, -0.3058929443359375, -0.272308349609375, -0.2387237548828125, -0.20513916015625, -0.1715545654296875, -0.137969970703125, -0.1043853759765625, -0.07080078125, -0.0372161865234375, -0.003631591796875, 0.0299530029296875, 0.06353759765625, 0.0971221923828125, 0.130706787109375, 0.1642913818359375, 0.1978759765625, 0.2314605712890625, 0.265045166015625, 0.2986297607421875, 0.33221435546875, 0.3657989501953125, 0.399383544921875, 0.4329681396484375, 0.466552734375, 0.5001373291015625, 0.533721923828125, 0.5673065185546875, 0.60089111328125, 0.6344757080078125, 0.668060302734375, 0.7016448974609375, 0.7352294921875, 0.7688140869140625, 0.802398681640625, 0.8359832763671875, 0.86956787109375, 0.9031524658203125, 0.936737060546875, 0.9703216552734375, 1.00390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 13.0, 28.0, 67.0, 104.0, 146.0, 165.0, 159.0, 143.0, 77.0, 43.0, 20.0, 21.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.57615852355957, -22.898099899291992, -22.22003936767578, -21.541980743408203, -20.863920211791992, -20.185861587524414, -19.507801055908203, -18.829742431640625, -18.151683807373047, -17.47362518310547, -16.795564651489258, -16.11750602722168, -15.439445495605469, -14.76138687133789, -14.083327293395996, -13.405267715454102, -12.72720718383789, -12.049147605895996, -11.371088027954102, -10.693029403686523, -10.014968872070312, -9.336910247802734, -8.65885066986084, -7.980791091918945, -7.302731513977051, -6.624671936035156, -5.946612358093262, -5.268553256988525, -4.590493679046631, -3.9124341011047363, -3.234375, -2.5563154220581055, -1.8782539367675781, -1.2001944780349731, -0.5221350193023682, 0.15592432022094727, 0.8339838981628418, 1.5120434761047363, 2.1901025772094727, 2.868162155151367, 3.5462217330932617, 4.224281311035156, 4.902340888977051, 5.580399990081787, 6.258459568023682, 6.936519145965576, 7.6145782470703125, 8.292637825012207, 8.970697402954102, 9.648756980895996, 10.32681655883789, 11.004875183105469, 11.68293571472168, 12.360994338989258, 13.039053916931152, 13.717113494873047, 14.395173072814941, 15.073232650756836, 15.75129222869873, 16.429351806640625, 17.107410430908203, 17.785470962524414, 18.463529586791992, 19.141590118408203, 19.81964874267578]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 7.0, 3.0, 4.0, 13.0, 11.0, 14.0, 8.0, 11.0, 16.0, 11.0, 26.0, 21.0, 28.0, 31.0, 36.0, 43.0, 42.0, 34.0, 37.0, 46.0, 43.0, 45.0, 48.0, 56.0, 41.0, 43.0, 44.0, 37.0, 33.0, 25.0, 20.0, 19.0, 21.0, 12.0, 11.0, 11.0, 13.0, 6.0, 10.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.2324857711792, -10.869551658630371, -10.506617546081543, -10.143683433532715, -9.78074836730957, -9.417814254760742, -9.054880142211914, -8.691946029663086, -8.329011917114258, -7.96607780456543, -7.603143692016602, -7.240209102630615, -6.877274990081787, -6.514340877532959, -6.151406288146973, -5.7884721755981445, -5.425538063049316, -5.062603950500488, -4.69966983795166, -4.336735248565674, -3.9738011360168457, -3.6108670234680176, -3.2479326725006104, -2.884998321533203, -2.522064208984375, -2.159130096435547, -1.7961957454681396, -1.433261513710022, -1.0703272819519043, -0.7073930501937866, -0.34445881843566895, 0.01847553253173828, 0.3814096450805664, 0.7443438768386841, 1.1072781085968018, 1.4702123403549194, 1.833146572113037, 2.1960806846618652, 2.5590150356292725, 2.9219493865966797, 3.284883499145508, 3.647817611694336, 4.010751724243164, 4.37368631362915, 4.7366204261779785, 5.099554538726807, 5.462489128112793, 5.825423240661621, 6.188357353210449, 6.551291465759277, 6.9142255783081055, 7.277160167694092, 7.64009428024292, 8.003028869628906, 8.365962982177734, 8.728897094726562, 9.09183120727539, 9.454765319824219, 9.817699432373047, 10.180633544921875, 10.543567657470703, 10.906502723693848, 11.269436836242676, 11.632370948791504, 11.995305061340332]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 6.0, 0.0, 2.0, 5.0, 13.0, 10.0, 13.0, 30.0, 31.0, 44.0, 83.0, 88.0, 154.0, 204.0, 349.0, 538.0, 851.0, 1534.0, 2703.0, 5881.0, 16038.0, 67660.0, 3908214.0, 148674.0, 24630.0, 8255.0, 3631.0, 1858.0, 1010.0, 592.0, 375.0, 237.0, 187.0, 110.0, 79.0, 46.0, 44.0, 32.0, 21.0, 11.0, 11.0, 9.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.949462890625, -1.87353515625, -1.797607421875, -1.7216796875, -1.645751953125, -1.56982421875, -1.493896484375, -1.41796875, -1.342041015625, -1.26611328125, -1.190185546875, -1.1142578125, -1.038330078125, -0.96240234375, -0.886474609375, -0.810546875, -0.734619140625, -0.65869140625, -0.582763671875, -0.5068359375, -0.430908203125, -0.35498046875, -0.279052734375, -0.203125, -0.127197265625, -0.05126953125, 0.024658203125, 0.1005859375, 0.176513671875, 0.25244140625, 0.328369140625, 0.404296875, 0.480224609375, 0.55615234375, 0.632080078125, 0.7080078125, 0.783935546875, 0.85986328125, 0.935791015625, 1.01171875, 1.087646484375, 1.16357421875, 1.239501953125, 1.3154296875, 1.391357421875, 1.46728515625, 1.543212890625, 1.619140625, 1.695068359375, 1.77099609375, 1.846923828125, 1.9228515625, 1.998779296875, 2.07470703125, 2.150634765625, 2.2265625, 2.302490234375, 2.37841796875, 2.454345703125, 2.5302734375, 2.606201171875, 2.68212890625, 2.758056640625, 2.833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 7.0, 12.0, 11.0, 21.0, 17.0, 24.0, 17.0, 31.0, 36.0, 37.0, 49.0, 40.0, 46.0, 52.0, 57.0, 57.0, 57.0, 70.0, 47.0, 38.0, 46.0, 41.0, 33.0, 25.0, 22.0, 15.0, 10.0, 14.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.62060546875, -0.6035995483398438, -0.5865936279296875, -0.5695877075195312, -0.552581787109375, -0.5355758666992188, -0.5185699462890625, -0.5015640258789062, -0.48455810546875, -0.46755218505859375, -0.4505462646484375, -0.43354034423828125, -0.416534423828125, -0.39952850341796875, -0.3825225830078125, -0.36551666259765625, -0.3485107421875, -0.33150482177734375, -0.3144989013671875, -0.29749298095703125, -0.280487060546875, -0.26348114013671875, -0.2464752197265625, -0.22946929931640625, -0.21246337890625, -0.19545745849609375, -0.1784515380859375, -0.16144561767578125, -0.144439697265625, -0.12743377685546875, -0.1104278564453125, -0.09342193603515625, -0.076416015625, -0.05941009521484375, -0.0424041748046875, -0.02539825439453125, -0.008392333984375, 0.00861358642578125, 0.0256195068359375, 0.04262542724609375, 0.05963134765625, 0.07663726806640625, 0.0936431884765625, 0.11064910888671875, 0.127655029296875, 0.14466094970703125, 0.1616668701171875, 0.17867279052734375, 0.1956787109375, 0.21268463134765625, 0.2296905517578125, 0.24669647216796875, 0.263702392578125, 0.28070831298828125, 0.2977142333984375, 0.31472015380859375, 0.33172607421875, 0.34873199462890625, 0.3657379150390625, 0.38274383544921875, 0.399749755859375, 0.41675567626953125, 0.4337615966796875, 0.45076751708984375, 0.4677734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 10.0, 8.0, 17.0, 23.0, 29.0, 62.0, 85.0, 132.0, 197.0, 364.0, 725.0, 1497.0, 3434.0, 9237.0, 35689.0, 3485323.0, 611064.0, 31635.0, 8481.0, 3145.0, 1408.0, 727.0, 385.0, 206.0, 123.0, 87.0, 55.0, 42.0, 23.0, 17.0, 9.0, 14.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.91339111328125, -2.8092041015625, -2.70501708984375, -2.600830078125, -2.49664306640625, -2.3924560546875, -2.28826904296875, -2.18408203125, -2.07989501953125, -1.9757080078125, -1.87152099609375, -1.767333984375, -1.66314697265625, -1.5589599609375, -1.45477294921875, -1.3505859375, -1.24639892578125, -1.1422119140625, -1.03802490234375, -0.933837890625, -0.82965087890625, -0.7254638671875, -0.62127685546875, -0.51708984375, -0.41290283203125, -0.3087158203125, -0.20452880859375, -0.100341796875, 0.00384521484375, 0.1080322265625, 0.21221923828125, 0.31640625, 0.42059326171875, 0.5247802734375, 0.62896728515625, 0.733154296875, 0.83734130859375, 0.9415283203125, 1.04571533203125, 1.14990234375, 1.25408935546875, 1.3582763671875, 1.46246337890625, 1.566650390625, 1.67083740234375, 1.7750244140625, 1.87921142578125, 1.9833984375, 2.08758544921875, 2.1917724609375, 2.29595947265625, 2.400146484375, 2.50433349609375, 2.6085205078125, 2.71270751953125, 2.81689453125, 2.92108154296875, 3.0252685546875, 3.12945556640625, 3.233642578125, 3.33782958984375, 3.4420166015625, 3.54620361328125, 3.650390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 10.0, 10.0, 23.0, 13.0, 26.0, 39.0, 73.0, 182.0, 3104.0, 338.0, 101.0, 65.0, 28.0, 15.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44287109375, -0.4249267578125, -0.406982421875, -0.3890380859375, -0.37109375, -0.3531494140625, -0.335205078125, -0.3172607421875, -0.29931640625, -0.2813720703125, -0.263427734375, -0.2454833984375, -0.2275390625, -0.2095947265625, -0.191650390625, -0.1737060546875, -0.15576171875, -0.1378173828125, -0.119873046875, -0.1019287109375, -0.083984375, -0.0660400390625, -0.048095703125, -0.0301513671875, -0.01220703125, 0.0057373046875, 0.023681640625, 0.0416259765625, 0.0595703125, 0.0775146484375, 0.095458984375, 0.1134033203125, 0.13134765625, 0.1492919921875, 0.167236328125, 0.1851806640625, 0.203125, 0.2210693359375, 0.239013671875, 0.2569580078125, 0.27490234375, 0.2928466796875, 0.310791015625, 0.3287353515625, 0.3466796875, 0.3646240234375, 0.382568359375, 0.4005126953125, 0.41845703125, 0.4364013671875, 0.454345703125, 0.4722900390625, 0.490234375, 0.5081787109375, 0.526123046875, 0.5440673828125, 0.56201171875, 0.5799560546875, 0.597900390625, 0.6158447265625, 0.6337890625, 0.6517333984375, 0.669677734375, 0.6876220703125, 0.70556640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 15.0, 23.0, 38.0, 51.0, 67.0, 85.0, 92.0, 87.0, 86.0, 93.0, 75.0, 61.0, 65.0, 36.0, 40.0, 22.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3268327713012695, -1.2658958435058594, -1.2049589157104492, -1.144021987915039, -1.0830851793289185, -1.0221482515335083, -0.9612113237380981, -0.900274395942688, -0.8393375277519226, -0.7784005999565125, -0.7174637317657471, -0.6565268039703369, -0.5955898761749268, -0.5346530079841614, -0.4737160801887512, -0.41277918219566345, -0.3518422842025757, -0.2909053862094879, -0.22996847331523895, -0.16903156042099, -0.10809466242790222, -0.04715776443481445, 0.013779163360595703, 0.07471606135368347, 0.13565295934677124, 0.196589857339859, 0.2575267553329468, 0.31846368312835693, 0.3794005811214447, 0.44033747911453247, 0.5012744069099426, 0.562211275100708, 0.6231482028961182, 0.6840851306915283, 0.7450219988822937, 0.8059589266777039, 0.8668957948684692, 0.9278327226638794, 0.9887696504592896, 1.0497065782546997, 1.1106433868408203, 1.1715803146362305, 1.2325172424316406, 1.2934541702270508, 1.3543909788131714, 1.4153279066085815, 1.4762648344039917, 1.5372017621994019, 1.598138689994812, 1.6590756177902222, 1.7200125455856323, 1.780949354171753, 1.841886281967163, 1.9028232097625732, 1.9637601375579834, 2.0246970653533936, 2.0856339931488037, 2.146570920944214, 2.207507848739624, 2.268444776535034, 2.3293817043304443, 2.3903183937072754, 2.4512553215026855, 2.5121922492980957, 2.573129177093506]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 7.0, 12.0, 9.0, 20.0, 18.0, 22.0, 31.0, 31.0, 37.0, 46.0, 39.0, 49.0, 45.0, 37.0, 38.0, 58.0, 55.0, 47.0, 34.0, 44.0, 28.0, 26.0, 37.0, 32.0, 23.0, 23.0, 24.0, 24.0, 12.0, 12.0, 14.0, 8.0, 13.0, 5.0, 3.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1505343914031982, -1.1135934591293335, -1.0766524076461792, -1.0397114753723145, -1.0027705430984497, -0.9658295512199402, -0.9288885593414307, -0.8919476270675659, -0.8550066351890564, -0.8180656433105469, -0.7811247110366821, -0.7441837191581726, -0.7072427272796631, -0.6703017950057983, -0.6333608031272888, -0.5964198112487793, -0.5594788789749146, -0.522537887096405, -0.4855969548225403, -0.44865596294403076, -0.41171500086784363, -0.3747740387916565, -0.337833046913147, -0.30089208483695984, -0.2639511227607727, -0.22701016068458557, -0.19006918370723724, -0.15312820672988892, -0.11618724465370178, -0.07924628257751465, -0.04230530560016632, -0.005364328622817993, 0.03157663345336914, 0.06851760298013687, 0.1054585725069046, 0.14239954948425293, 0.17934051156044006, 0.2162814736366272, 0.2532224655151367, 0.29016342759132385, 0.327104389667511, 0.3640453517436981, 0.40098631381988525, 0.4379273056983948, 0.4748682677745819, 0.511809229850769, 0.5487502217292786, 0.5856912136077881, 0.6226321458816528, 0.6595731377601624, 0.6965140700340271, 0.7334550619125366, 0.7703959941864014, 0.8073369860649109, 0.8442779779434204, 0.8812189102172852, 0.9181599020957947, 0.9551008939743042, 0.992041826248169, 1.0289827585220337, 1.065923810005188, 1.1028647422790527, 1.1398056745529175, 1.1767467260360718, 1.2136876583099365]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 11.0, 5.0, 20.0, 13.0, 26.0, 34.0, 78.0, 91.0, 192.0, 341.0, 654.0, 1536.0, 3506.0, 8647.0, 22349.0, 57896.0, 145612.0, 287022.0, 283748.0, 143748.0, 56804.0, 21428.0, 8372.0, 3412.0, 1515.0, 658.0, 356.0, 187.0, 109.0, 66.0, 38.0, 22.0, 13.0, 11.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.8525390625, -1.805023193359375, -1.75750732421875, -1.709991455078125, -1.6624755859375, -1.614959716796875, -1.56744384765625, -1.519927978515625, -1.472412109375, -1.424896240234375, -1.37738037109375, -1.329864501953125, -1.2823486328125, -1.234832763671875, -1.18731689453125, -1.139801025390625, -1.09228515625, -1.044769287109375, -0.99725341796875, -0.949737548828125, -0.9022216796875, -0.854705810546875, -0.80718994140625, -0.759674072265625, -0.712158203125, -0.664642333984375, -0.61712646484375, -0.569610595703125, -0.5220947265625, -0.474578857421875, -0.42706298828125, -0.379547119140625, -0.33203125, -0.284515380859375, -0.23699951171875, -0.189483642578125, -0.1419677734375, -0.094451904296875, -0.04693603515625, 0.000579833984375, 0.048095703125, 0.095611572265625, 0.14312744140625, 0.190643310546875, 0.2381591796875, 0.285675048828125, 0.33319091796875, 0.380706787109375, 0.42822265625, 0.475738525390625, 0.52325439453125, 0.570770263671875, 0.6182861328125, 0.665802001953125, 0.71331787109375, 0.760833740234375, 0.808349609375, 0.855865478515625, 0.90338134765625, 0.950897216796875, 0.9984130859375, 1.045928955078125, 1.09344482421875, 1.140960693359375, 1.1884765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 6.0, 9.0, 14.0, 14.0, 15.0, 25.0, 26.0, 27.0, 37.0, 30.0, 44.0, 57.0, 58.0, 55.0, 75.0, 63.0, 61.0, 59.0, 45.0, 35.0, 35.0, 37.0, 32.0, 31.0, 21.0, 12.0, 11.0, 10.0, 8.0, 5.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6729507446289062, -0.6540069580078125, -0.6350631713867188, -0.616119384765625, -0.5971755981445312, -0.5782318115234375, -0.5592880249023438, -0.54034423828125, -0.5214004516601562, -0.5024566650390625, -0.48351287841796875, -0.464569091796875, -0.44562530517578125, -0.4266815185546875, -0.40773773193359375, -0.3887939453125, -0.36985015869140625, -0.3509063720703125, -0.33196258544921875, -0.313018798828125, -0.29407501220703125, -0.2751312255859375, -0.25618743896484375, -0.23724365234375, -0.21829986572265625, -0.1993560791015625, -0.18041229248046875, -0.161468505859375, -0.14252471923828125, -0.1235809326171875, -0.10463714599609375, -0.085693359375, -0.06674957275390625, -0.0478057861328125, -0.02886199951171875, -0.009918212890625, 0.00902557373046875, 0.0279693603515625, 0.04691314697265625, 0.06585693359375, 0.08480072021484375, 0.1037445068359375, 0.12268829345703125, 0.141632080078125, 0.16057586669921875, 0.1795196533203125, 0.19846343994140625, 0.2174072265625, 0.23635101318359375, 0.2552947998046875, 0.27423858642578125, 0.293182373046875, 0.31212615966796875, 0.3310699462890625, 0.35001373291015625, 0.36895751953125, 0.38790130615234375, 0.4068450927734375, 0.42578887939453125, 0.444732666015625, 0.46367645263671875, 0.4826202392578125, 0.5015640258789062, 0.5205078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 14.0, 14.0, 16.0, 32.0, 38.0, 61.0, 86.0, 106.0, 160.0, 219.0, 316.0, 467.0, 781.0, 1309.0, 2999.0, 10517.0, 60934.0, 416820.0, 465301.0, 69614.0, 11840.0, 3162.0, 1396.0, 746.0, 483.0, 314.0, 225.0, 158.0, 120.0, 72.0, 53.0, 41.0, 28.0, 27.0, 20.0, 15.0, 14.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.28515625, -3.188629150390625, -3.09210205078125, -2.995574951171875, -2.8990478515625, -2.802520751953125, -2.70599365234375, -2.609466552734375, -2.512939453125, -2.416412353515625, -2.31988525390625, -2.223358154296875, -2.1268310546875, -2.030303955078125, -1.93377685546875, -1.837249755859375, -1.74072265625, -1.644195556640625, -1.54766845703125, -1.451141357421875, -1.3546142578125, -1.258087158203125, -1.16156005859375, -1.065032958984375, -0.968505859375, -0.871978759765625, -0.77545166015625, -0.678924560546875, -0.5823974609375, -0.485870361328125, -0.38934326171875, -0.292816162109375, -0.1962890625, -0.099761962890625, -0.00323486328125, 0.093292236328125, 0.1898193359375, 0.286346435546875, 0.38287353515625, 0.479400634765625, 0.575927734375, 0.672454833984375, 0.76898193359375, 0.865509033203125, 0.9620361328125, 1.058563232421875, 1.15509033203125, 1.251617431640625, 1.34814453125, 1.444671630859375, 1.54119873046875, 1.637725830078125, 1.7342529296875, 1.830780029296875, 1.92730712890625, 2.023834228515625, 2.120361328125, 2.216888427734375, 2.31341552734375, 2.409942626953125, 2.5064697265625, 2.602996826171875, 2.69952392578125, 2.796051025390625, 2.892578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 15.0, 9.0, 15.0, 11.0, 15.0, 23.0, 24.0, 26.0, 35.0, 39.0, 38.0, 51.0, 56.0, 54.0, 44.0, 51.0, 53.0, 48.0, 43.0, 40.0, 42.0, 40.0, 32.0, 32.0, 22.0, 24.0, 14.0, 16.0, 15.0, 13.0, 10.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.0595703125, -2.955078125, -2.8505859375, -2.74609375, -2.6416015625, -2.537109375, -2.4326171875, -2.328125, -2.2236328125, -2.119140625, -2.0146484375, -1.91015625, -1.8056640625, -1.701171875, -1.5966796875, -1.4921875, -1.3876953125, -1.283203125, -1.1787109375, -1.07421875, -0.9697265625, -0.865234375, -0.7607421875, -0.65625, -0.5517578125, -0.447265625, -0.3427734375, -0.23828125, -0.1337890625, -0.029296875, 0.0751953125, 0.1796875, 0.2841796875, 0.388671875, 0.4931640625, 0.59765625, 0.7021484375, 0.806640625, 0.9111328125, 1.015625, 1.1201171875, 1.224609375, 1.3291015625, 1.43359375, 1.5380859375, 1.642578125, 1.7470703125, 1.8515625, 1.9560546875, 2.060546875, 2.1650390625, 2.26953125, 2.3740234375, 2.478515625, 2.5830078125, 2.6875, 2.7919921875, 2.896484375, 3.0009765625, 3.10546875, 3.2099609375, 3.314453125, 3.4189453125, 3.5234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 7.0, 8.0, 19.0, 7.0, 36.0, 30.0, 49.0, 70.0, 129.0, 181.0, 292.0, 623.0, 1453.0, 4012.0, 14539.0, 69398.0, 404337.0, 452434.0, 77470.0, 16072.0, 4267.0, 1552.0, 659.0, 320.0, 208.0, 101.0, 76.0, 51.0, 46.0, 23.0, 23.0, 13.0, 14.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4039764404296875, -1.358734130859375, -1.3134918212890625, -1.26824951171875, -1.2230072021484375, -1.177764892578125, -1.1325225830078125, -1.0872802734375, -1.0420379638671875, -0.996795654296875, -0.9515533447265625, -0.90631103515625, -0.8610687255859375, -0.815826416015625, -0.7705841064453125, -0.725341796875, -0.6800994873046875, -0.634857177734375, -0.5896148681640625, -0.54437255859375, -0.4991302490234375, -0.453887939453125, -0.4086456298828125, -0.3634033203125, -0.3181610107421875, -0.272918701171875, -0.2276763916015625, -0.18243408203125, -0.1371917724609375, -0.091949462890625, -0.0467071533203125, -0.00146484375, 0.0437774658203125, 0.089019775390625, 0.1342620849609375, 0.17950439453125, 0.2247467041015625, 0.269989013671875, 0.3152313232421875, 0.3604736328125, 0.4057159423828125, 0.450958251953125, 0.4962005615234375, 0.54144287109375, 0.5866851806640625, 0.631927490234375, 0.6771697998046875, 0.722412109375, 0.7676544189453125, 0.812896728515625, 0.8581390380859375, 0.90338134765625, 0.9486236572265625, 0.993865966796875, 1.0391082763671875, 1.0843505859375, 1.1295928955078125, 1.174835205078125, 1.2200775146484375, 1.26531982421875, 1.3105621337890625, 1.355804443359375, 1.4010467529296875, 1.4462890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 12.0, 19.0, 13.0, 16.0, 29.0, 37.0, 56.0, 61.0, 72.0, 86.0, 77.0, 91.0, 70.0, 79.0, 49.0, 36.0, 38.0, 24.0, 32.0, 18.0, 15.0, 14.0, 8.0, 7.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000194549560546875, -0.00018706917762756348, -0.00017958879470825195, -0.00017210841178894043, -0.0001646280288696289, -0.00015714764595031738, -0.00014966726303100586, -0.00014218688011169434, -0.0001347064971923828, -0.0001272261142730713, -0.00011974573135375977, -0.00011226534843444824, -0.00010478496551513672, -9.73045825958252e-05, -8.982419967651367e-05, -8.234381675720215e-05, -7.486343383789062e-05, -6.73830509185791e-05, -5.990266799926758e-05, -5.2422285079956055e-05, -4.494190216064453e-05, -3.746151924133301e-05, -2.9981136322021484e-05, -2.250075340270996e-05, -1.5020370483398438e-05, -7.539987564086914e-06, -5.960464477539063e-08, 7.420778274536133e-06, 1.4901161193847656e-05, 2.238154411315918e-05, 2.9861927032470703e-05, 3.7342309951782227e-05, 4.482269287109375e-05, 5.2303075790405273e-05, 5.97834587097168e-05, 6.726384162902832e-05, 7.474422454833984e-05, 8.222460746765137e-05, 8.970499038696289e-05, 9.718537330627441e-05, 0.00010466575622558594, 0.00011214613914489746, 0.00011962652206420898, 0.0001271069049835205, 0.00013458728790283203, 0.00014206767082214355, 0.00014954805374145508, 0.0001570284366607666, 0.00016450881958007812, 0.00017198920249938965, 0.00017946958541870117, 0.0001869499683380127, 0.00019443035125732422, 0.00020191073417663574, 0.00020939111709594727, 0.0002168715000152588, 0.0002243518829345703, 0.00023183226585388184, 0.00023931264877319336, 0.0002467930316925049, 0.0002542734146118164, 0.00026175379753112793, 0.00026923418045043945, 0.000276714563369751, 0.0002841949462890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 17.0, 15.0, 27.0, 25.0, 62.0, 70.0, 114.0, 211.0, 388.0, 753.0, 1816.0, 5816.0, 33446.0, 379908.0, 562846.0, 51291.0, 7676.0, 2144.0, 857.0, 430.0, 248.0, 123.0, 98.0, 42.0, 30.0, 22.0, 17.0, 12.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.115234375, -2.054962158203125, -1.99468994140625, -1.934417724609375, -1.8741455078125, -1.813873291015625, -1.75360107421875, -1.693328857421875, -1.633056640625, -1.572784423828125, -1.51251220703125, -1.452239990234375, -1.3919677734375, -1.331695556640625, -1.27142333984375, -1.211151123046875, -1.15087890625, -1.090606689453125, -1.03033447265625, -0.970062255859375, -0.9097900390625, -0.849517822265625, -0.78924560546875, -0.728973388671875, -0.668701171875, -0.608428955078125, -0.54815673828125, -0.487884521484375, -0.4276123046875, -0.367340087890625, -0.30706787109375, -0.246795654296875, -0.1865234375, -0.126251220703125, -0.06597900390625, -0.005706787109375, 0.0545654296875, 0.114837646484375, 0.17510986328125, 0.235382080078125, 0.295654296875, 0.355926513671875, 0.41619873046875, 0.476470947265625, 0.5367431640625, 0.597015380859375, 0.65728759765625, 0.717559814453125, 0.77783203125, 0.838104248046875, 0.89837646484375, 0.958648681640625, 1.0189208984375, 1.079193115234375, 1.13946533203125, 1.199737548828125, 1.260009765625, 1.320281982421875, 1.38055419921875, 1.440826416015625, 1.5010986328125, 1.561370849609375, 1.62164306640625, 1.681915283203125, 1.7421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 14.0, 17.0, 26.0, 36.0, 49.0, 43.0, 72.0, 71.0, 80.0, 89.0, 93.0, 72.0, 61.0, 53.0, 36.0, 39.0, 25.0, 21.0, 15.0, 12.0, 10.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.662109375, -1.6167755126953125, -1.571441650390625, -1.5261077880859375, -1.48077392578125, -1.4354400634765625, -1.390106201171875, -1.3447723388671875, -1.2994384765625, -1.2541046142578125, -1.208770751953125, -1.1634368896484375, -1.11810302734375, -1.0727691650390625, -1.027435302734375, -0.9821014404296875, -0.936767578125, -0.8914337158203125, -0.846099853515625, -0.8007659912109375, -0.75543212890625, -0.7100982666015625, -0.664764404296875, -0.6194305419921875, -0.5740966796875, -0.5287628173828125, -0.483428955078125, -0.4380950927734375, -0.39276123046875, -0.3474273681640625, -0.302093505859375, -0.2567596435546875, -0.21142578125, -0.1660919189453125, -0.120758056640625, -0.0754241943359375, -0.03009033203125, 0.0152435302734375, 0.060577392578125, 0.1059112548828125, 0.1512451171875, 0.1965789794921875, 0.241912841796875, 0.2872467041015625, 0.33258056640625, 0.3779144287109375, 0.423248291015625, 0.4685821533203125, 0.513916015625, 0.5592498779296875, 0.604583740234375, 0.6499176025390625, 0.69525146484375, 0.7405853271484375, 0.785919189453125, 0.8312530517578125, 0.8765869140625, 0.9219207763671875, 0.967254638671875, 1.0125885009765625, 1.05792236328125, 1.1032562255859375, 1.148590087890625, 1.1939239501953125, 1.2392578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 40.0, 127.0, 253.0, 315.0, 164.0, 67.0, 17.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.206470489501953, -14.763477325439453, -13.32048511505127, -11.877492904663086, -10.434499740600586, -8.991506576538086, -7.548514366149902, -6.105522155761719, -4.662528991699219, -3.219536304473877, -1.7765436172485352, -0.33355093002319336, 1.1094417572021484, 2.5524344444274902, 3.995427131652832, 5.438419342041016, 6.881412506103516, 8.324405670166016, 9.7673978805542, 11.210390090942383, 12.653383255004883, 14.096376419067383, 15.539368629455566, 16.98236083984375, 18.42535400390625, 19.86834716796875, 21.31134033203125, 22.754331588745117, 24.197324752807617, 25.640317916870117, 27.083309173583984, 28.526302337646484, 29.96929168701172, 31.41228485107422, 32.85527801513672, 34.29827117919922, 35.74126434326172, 37.18425369262695, 38.62724685668945, 40.07024002075195, 41.51323318481445, 42.95622634887695, 44.39921951293945, 45.84221267700195, 47.28520202636719, 48.72819519042969, 50.17118835449219, 51.61418151855469, 53.05717468261719, 54.50016784667969, 55.94316101074219, 57.38615417480469, 58.82914733886719, 60.27213668823242, 61.71512985229492, 63.15812301635742, 64.60111999511719, 66.04411315917969, 67.48710632324219, 68.93009948730469, 70.37309265136719, 71.81608581542969, 73.25907897949219, 74.70207214355469, 76.14505767822266]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 7.0, 11.0, 9.0, 19.0, 11.0, 20.0, 20.0, 23.0, 22.0, 36.0, 39.0, 41.0, 43.0, 57.0, 44.0, 61.0, 47.0, 50.0, 43.0, 53.0, 44.0, 40.0, 36.0, 27.0, 26.0, 25.0, 25.0, 20.0, 26.0, 14.0, 8.0, 6.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.999813079833984, -16.508935928344727, -16.018056869506836, -15.527179718017578, -15.036301612854004, -14.54542350769043, -14.054546356201172, -13.563668251037598, -13.072790145874023, -12.58191204071045, -12.091034889221191, -11.600156784057617, -11.109278678894043, -10.618400573730469, -10.127523422241211, -9.636645317077637, -9.145768165588379, -8.654890060424805, -8.164012908935547, -7.673134803771973, -7.182256698608398, -6.691379070281982, -6.200501441955566, -5.709623336791992, -5.218745708465576, -4.72786808013916, -4.236989974975586, -3.74611234664917, -3.255234479904175, -2.7643566131591797, -2.2734789848327637, -1.7826011180877686, -1.2917232513427734, -0.8008454442024231, -0.30996763706207275, 0.1809101104736328, 0.6717879772186279, 1.162665843963623, 1.653543472290039, 2.144421339035034, 2.6352992057800293, 3.1261770725250244, 3.6170549392700195, 4.1079325675964355, 4.598810195922852, 5.089688301086426, 5.580565929412842, 6.071443557739258, 6.562321662902832, 7.053199291229248, 7.544077396392822, 8.034955024719238, 8.525833129882812, 9.01671028137207, 9.507588386535645, 9.998466491699219, 10.489343643188477, 10.98022174835205, 11.471098899841309, 11.961977005004883, 12.452855110168457, 12.943733215332031, 13.434610366821289, 13.925488471984863, 14.416366577148438]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 2.0, 8.0, 10.0, 15.0, 31.0, 30.0, 63.0, 102.0, 111.0, 221.0, 351.0, 603.0, 1168.0, 2464.0, 5984.0, 19345.0, 147975.0, 3948504.0, 48670.0, 10969.0, 3912.0, 1757.0, 818.0, 444.0, 280.0, 147.0, 123.0, 66.0, 26.0, 31.0, 9.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.74609375, -2.6553955078125, -2.564697265625, -2.4739990234375, -2.38330078125, -2.2926025390625, -2.201904296875, -2.1112060546875, -2.0205078125, -1.9298095703125, -1.839111328125, -1.7484130859375, -1.65771484375, -1.5670166015625, -1.476318359375, -1.3856201171875, -1.294921875, -1.2042236328125, -1.113525390625, -1.0228271484375, -0.93212890625, -0.8414306640625, -0.750732421875, -0.6600341796875, -0.5693359375, -0.4786376953125, -0.387939453125, -0.2972412109375, -0.20654296875, -0.1158447265625, -0.025146484375, 0.0655517578125, 0.15625, 0.2469482421875, 0.337646484375, 0.4283447265625, 0.51904296875, 0.6097412109375, 0.700439453125, 0.7911376953125, 0.8818359375, 0.9725341796875, 1.063232421875, 1.1539306640625, 1.24462890625, 1.3353271484375, 1.426025390625, 1.5167236328125, 1.607421875, 1.6981201171875, 1.788818359375, 1.8795166015625, 1.97021484375, 2.0609130859375, 2.151611328125, 2.2423095703125, 2.3330078125, 2.4237060546875, 2.514404296875, 2.6051025390625, 2.69580078125, 2.7864990234375, 2.877197265625, 2.9678955078125, 3.05859375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 5.0, 5.0, 14.0, 9.0, 12.0, 11.0, 13.0, 16.0, 22.0, 34.0, 34.0, 45.0, 49.0, 79.0, 73.0, 57.0, 65.0, 70.0, 73.0, 56.0, 53.0, 52.0, 35.0, 23.0, 19.0, 16.0, 14.0, 9.0, 10.0, 4.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92236328125, -0.8979415893554688, -0.8735198974609375, -0.8490982055664062, -0.824676513671875, -0.8002548217773438, -0.7758331298828125, -0.7514114379882812, -0.72698974609375, -0.7025680541992188, -0.6781463623046875, -0.6537246704101562, -0.629302978515625, -0.6048812866210938, -0.5804595947265625, -0.5560379028320312, -0.5316162109375, -0.5071945190429688, -0.4827728271484375, -0.45835113525390625, -0.433929443359375, -0.40950775146484375, -0.3850860595703125, -0.36066436767578125, -0.33624267578125, -0.31182098388671875, -0.2873992919921875, -0.26297760009765625, -0.238555908203125, -0.21413421630859375, -0.1897125244140625, -0.16529083251953125, -0.140869140625, -0.11644744873046875, -0.0920257568359375, -0.06760406494140625, -0.043182373046875, -0.01876068115234375, 0.0056610107421875, 0.03008270263671875, 0.05450439453125, 0.07892608642578125, 0.1033477783203125, 0.12776947021484375, 0.152191162109375, 0.17661285400390625, 0.2010345458984375, 0.22545623779296875, 0.2498779296875, 0.27429962158203125, 0.2987213134765625, 0.32314300537109375, 0.347564697265625, 0.37198638916015625, 0.3964080810546875, 0.42082977294921875, 0.44525146484375, 0.46967315673828125, 0.4940948486328125, 0.5185165405273438, 0.542938232421875, 0.5673599243164062, 0.5917816162109375, 0.6162033081054688, 0.640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 8.0, 5.0, 9.0, 7.0, 9.0, 14.0, 10.0, 23.0, 21.0, 48.0, 70.0, 82.0, 101.0, 154.0, 239.0, 375.0, 633.0, 1124.0, 2258.0, 4673.0, 10614.0, 32282.0, 185008.0, 3813200.0, 103163.0, 23651.0, 8250.0, 3745.0, 1854.0, 988.0, 576.0, 343.0, 209.0, 118.0, 100.0, 86.0, 61.0, 39.0, 31.0, 26.0, 24.0, 12.0, 12.0, 8.0, 10.0, 6.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.31488037109375, -2.2410888671875, -2.16729736328125, -2.093505859375, -2.01971435546875, -1.9459228515625, -1.87213134765625, -1.79833984375, -1.72454833984375, -1.6507568359375, -1.57696533203125, -1.503173828125, -1.42938232421875, -1.3555908203125, -1.28179931640625, -1.2080078125, -1.13421630859375, -1.0604248046875, -0.98663330078125, -0.912841796875, -0.83905029296875, -0.7652587890625, -0.69146728515625, -0.61767578125, -0.54388427734375, -0.4700927734375, -0.39630126953125, -0.322509765625, -0.24871826171875, -0.1749267578125, -0.10113525390625, -0.02734375, 0.04644775390625, 0.1202392578125, 0.19403076171875, 0.267822265625, 0.34161376953125, 0.4154052734375, 0.48919677734375, 0.56298828125, 0.63677978515625, 0.7105712890625, 0.78436279296875, 0.858154296875, 0.93194580078125, 1.0057373046875, 1.07952880859375, 1.1533203125, 1.22711181640625, 1.3009033203125, 1.37469482421875, 1.448486328125, 1.52227783203125, 1.5960693359375, 1.66986083984375, 1.74365234375, 1.81744384765625, 1.8912353515625, 1.96502685546875, 2.038818359375, 2.11260986328125, 2.1864013671875, 2.26019287109375, 2.333984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 8.0, 2.0, 5.0, 6.0, 12.0, 29.0, 26.0, 49.0, 90.0, 174.0, 924.0, 2409.0, 143.0, 70.0, 38.0, 30.0, 14.0, 9.0, 5.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7744140625, -0.75506591796875, -0.7357177734375, -0.71636962890625, -0.697021484375, -0.67767333984375, -0.6583251953125, -0.63897705078125, -0.61962890625, -0.60028076171875, -0.5809326171875, -0.56158447265625, -0.542236328125, -0.52288818359375, -0.5035400390625, -0.48419189453125, -0.46484375, -0.44549560546875, -0.4261474609375, -0.40679931640625, -0.387451171875, -0.36810302734375, -0.3487548828125, -0.32940673828125, -0.31005859375, -0.29071044921875, -0.2713623046875, -0.25201416015625, -0.232666015625, -0.21331787109375, -0.1939697265625, -0.17462158203125, -0.1552734375, -0.13592529296875, -0.1165771484375, -0.09722900390625, -0.077880859375, -0.05853271484375, -0.0391845703125, -0.01983642578125, -0.00048828125, 0.01885986328125, 0.0382080078125, 0.05755615234375, 0.076904296875, 0.09625244140625, 0.1156005859375, 0.13494873046875, 0.154296875, 0.17364501953125, 0.1929931640625, 0.21234130859375, 0.231689453125, 0.25103759765625, 0.2703857421875, 0.28973388671875, 0.30908203125, 0.32843017578125, 0.3477783203125, 0.36712646484375, 0.386474609375, 0.40582275390625, 0.4251708984375, 0.44451904296875, 0.4638671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 6.0, 12.0, 24.0, 39.0, 52.0, 88.0, 89.0, 123.0, 143.0, 114.0, 101.0, 82.0, 52.0, 30.0, 20.0, 9.0, 7.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.143301010131836, -5.041082859039307, -4.938864231109619, -4.83664608001709, -4.734427452087402, -4.632209300994873, -4.529991149902344, -4.427772521972656, -4.325554370880127, -4.223336219787598, -4.12111759185791, -4.018899440765381, -3.9166810512542725, -3.814462661743164, -3.7122442722320557, -3.6100258827209473, -3.507807731628418, -3.4055893421173096, -3.303370952606201, -3.201152801513672, -3.0989344120025635, -2.996716022491455, -2.8944976329803467, -2.7922792434692383, -2.69006085395813, -2.5878424644470215, -2.485624074935913, -2.383405923843384, -2.2811875343322754, -2.178969144821167, -2.0767507553100586, -1.9745324850082397, -1.872314214706421, -1.7700958251953125, -1.6678775548934937, -1.5656591653823853, -1.4634408950805664, -1.361222505569458, -1.2590041160583496, -1.1567858457565308, -1.054567575454712, -0.9523492455482483, -0.8501309156417847, -0.7479125261306763, -0.6456942558288574, -0.543475866317749, -0.4412575364112854, -0.3390392065048218, -0.23682081699371338, -0.13460248708724976, -0.03238414227962494, 0.06983420252799988, 0.1720525324344635, 0.2742708921432495, 0.37648922204971313, 0.47870755195617676, 0.5809258818626404, 0.683144211769104, 0.7853625416755676, 0.8875808715820312, 0.9897992610931396, 1.092017650604248, 1.194235920906067, 1.2964541912078857, 1.3986725807189941]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 5.0, 11.0, 13.0, 10.0, 10.0, 11.0, 18.0, 26.0, 20.0, 32.0, 44.0, 38.0, 45.0, 42.0, 34.0, 44.0, 41.0, 41.0, 42.0, 37.0, 45.0, 39.0, 33.0, 38.0, 33.0, 36.0, 25.0, 27.0, 27.0, 20.0, 24.0, 19.0, 16.0, 10.0, 7.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.382106065750122, -1.3313755989074707, -1.2806451320648193, -1.229914665222168, -1.1791841983795166, -1.1284537315368652, -1.0777232646942139, -1.0269927978515625, -0.9762623906135559, -0.9255319237709045, -0.8748014569282532, -0.8240710496902466, -0.7733405828475952, -0.7226101160049438, -0.6718796491622925, -0.6211491823196411, -0.5704187154769897, -0.5196882486343384, -0.468957781791687, -0.41822734475135803, -0.36749687790870667, -0.3167664110660553, -0.2660359740257263, -0.21530550718307495, -0.16457504034042358, -0.11384458094835281, -0.06311412155628204, -0.01238366961479187, 0.0383467972278595, 0.08907726407051086, 0.13980770111083984, 0.1905381679534912, 0.24126863479614258, 0.29199910163879395, 0.3427295684814453, 0.3934600055217743, 0.44419047236442566, 0.494920939207077, 0.545651376247406, 0.5963818430900574, 0.6471123099327087, 0.6978427767753601, 0.7485732436180115, 0.7993036508560181, 0.8500341176986694, 0.9007645845413208, 0.9514950513839722, 1.0022255182266235, 1.052955985069275, 1.1036864519119263, 1.1544169187545776, 1.205147385597229, 1.2558778524398804, 1.3066083192825317, 1.3573386669158936, 1.408069133758545, 1.4587996006011963, 1.5095300674438477, 1.560260534286499, 1.6109910011291504, 1.6617214679718018, 1.7124519348144531, 1.7631824016571045, 1.8139128684997559, 1.8646433353424072]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 21.0, 20.0, 28.0, 50.0, 77.0, 113.0, 165.0, 296.0, 455.0, 723.0, 1244.0, 2395.0, 4315.0, 8394.0, 17226.0, 35427.0, 73117.0, 141707.0, 225872.0, 232150.0, 150757.0, 78511.0, 37778.0, 18334.0, 8951.0, 4587.0, 2462.0, 1362.0, 721.0, 479.0, 281.0, 183.0, 115.0, 70.0, 56.0, 30.0, 14.0, 15.0, 15.0, 9.0, 9.0, 6.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78564453125, -0.7565994262695312, -0.7275543212890625, -0.6985092163085938, -0.669464111328125, -0.6404190063476562, -0.6113739013671875, -0.5823287963867188, -0.55328369140625, -0.5242385864257812, -0.4951934814453125, -0.46614837646484375, -0.437103271484375, -0.40805816650390625, -0.3790130615234375, -0.34996795654296875, -0.3209228515625, -0.29187774658203125, -0.2628326416015625, -0.23378753662109375, -0.204742431640625, -0.17569732666015625, -0.1466522216796875, -0.11760711669921875, -0.08856201171875, -0.05951690673828125, -0.0304718017578125, -0.00142669677734375, 0.027618408203125, 0.05666351318359375, 0.0857086181640625, 0.11475372314453125, 0.143798828125, 0.17284393310546875, 0.2018890380859375, 0.23093414306640625, 0.259979248046875, 0.28902435302734375, 0.3180694580078125, 0.34711456298828125, 0.37615966796875, 0.40520477294921875, 0.4342498779296875, 0.46329498291015625, 0.492340087890625, 0.5213851928710938, 0.5504302978515625, 0.5794754028320312, 0.6085205078125, 0.6375656127929688, 0.6666107177734375, 0.6956558227539062, 0.724700927734375, 0.7537460327148438, 0.7827911376953125, 0.8118362426757812, 0.84088134765625, 0.8699264526367188, 0.8989715576171875, 0.9280166625976562, 0.957061767578125, 0.9861068725585938, 1.0151519775390625, 1.0441970825195312, 1.0732421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 8.0, 11.0, 12.0, 14.0, 17.0, 23.0, 27.0, 22.0, 30.0, 43.0, 42.0, 60.0, 60.0, 63.0, 72.0, 75.0, 65.0, 63.0, 48.0, 53.0, 40.0, 36.0, 20.0, 12.0, 14.0, 15.0, 12.0, 8.0, 3.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.00390625, -0.9789276123046875, -0.953948974609375, -0.9289703369140625, -0.90399169921875, -0.8790130615234375, -0.854034423828125, -0.8290557861328125, -0.8040771484375, -0.7790985107421875, -0.754119873046875, -0.7291412353515625, -0.70416259765625, -0.6791839599609375, -0.654205322265625, -0.6292266845703125, -0.604248046875, -0.5792694091796875, -0.554290771484375, -0.5293121337890625, -0.50433349609375, -0.4793548583984375, -0.454376220703125, -0.4293975830078125, -0.4044189453125, -0.3794403076171875, -0.354461669921875, -0.3294830322265625, -0.30450439453125, -0.2795257568359375, -0.254547119140625, -0.2295684814453125, -0.20458984375, -0.1796112060546875, -0.154632568359375, -0.1296539306640625, -0.10467529296875, -0.0796966552734375, -0.054718017578125, -0.0297393798828125, -0.0047607421875, 0.0202178955078125, 0.045196533203125, 0.0701751708984375, 0.09515380859375, 0.1201324462890625, 0.145111083984375, 0.1700897216796875, 0.195068359375, 0.2200469970703125, 0.245025634765625, 0.2700042724609375, 0.29498291015625, 0.3199615478515625, 0.344940185546875, 0.3699188232421875, 0.3948974609375, 0.4198760986328125, 0.444854736328125, 0.4698333740234375, 0.49481201171875, 0.5197906494140625, 0.544769287109375, 0.5697479248046875, 0.5947265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 27.0, 25.0, 54.0, 79.0, 107.0, 191.0, 302.0, 453.0, 874.0, 1647.0, 4692.0, 34239.0, 565038.0, 409218.0, 24319.0, 3930.0, 1420.0, 743.0, 393.0, 262.0, 172.0, 106.0, 67.0, 48.0, 30.0, 18.0, 20.0, 16.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.548828125, -3.43768310546875, -3.3265380859375, -3.21539306640625, -3.104248046875, -2.99310302734375, -2.8819580078125, -2.77081298828125, -2.65966796875, -2.54852294921875, -2.4373779296875, -2.32623291015625, -2.215087890625, -2.10394287109375, -1.9927978515625, -1.88165283203125, -1.7705078125, -1.65936279296875, -1.5482177734375, -1.43707275390625, -1.325927734375, -1.21478271484375, -1.1036376953125, -0.99249267578125, -0.88134765625, -0.77020263671875, -0.6590576171875, -0.54791259765625, -0.436767578125, -0.32562255859375, -0.2144775390625, -0.10333251953125, 0.0078125, 0.11895751953125, 0.2301025390625, 0.34124755859375, 0.452392578125, 0.56353759765625, 0.6746826171875, 0.78582763671875, 0.89697265625, 1.00811767578125, 1.1192626953125, 1.23040771484375, 1.341552734375, 1.45269775390625, 1.5638427734375, 1.67498779296875, 1.7861328125, 1.89727783203125, 2.0084228515625, 2.11956787109375, 2.230712890625, 2.34185791015625, 2.4530029296875, 2.56414794921875, 2.67529296875, 2.78643798828125, 2.8975830078125, 3.00872802734375, 3.119873046875, 3.23101806640625, 3.3421630859375, 3.45330810546875, 3.564453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 12.0, 19.0, 16.0, 16.0, 24.0, 23.0, 31.0, 37.0, 55.0, 46.0, 47.0, 59.0, 42.0, 48.0, 49.0, 52.0, 53.0, 39.0, 48.0, 54.0, 40.0, 25.0, 21.0, 27.0, 10.0, 12.0, 8.0, 12.0, 8.0, 11.0, 8.0, 2.0, 3.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46484375, -3.353057861328125, -3.24127197265625, -3.129486083984375, -3.0177001953125, -2.905914306640625, -2.79412841796875, -2.682342529296875, -2.570556640625, -2.458770751953125, -2.34698486328125, -2.235198974609375, -2.1234130859375, -2.011627197265625, -1.89984130859375, -1.788055419921875, -1.67626953125, -1.564483642578125, -1.45269775390625, -1.340911865234375, -1.2291259765625, -1.117340087890625, -1.00555419921875, -0.893768310546875, -0.781982421875, -0.670196533203125, -0.55841064453125, -0.446624755859375, -0.3348388671875, -0.223052978515625, -0.11126708984375, 0.000518798828125, 0.1123046875, 0.224090576171875, 0.33587646484375, 0.447662353515625, 0.5594482421875, 0.671234130859375, 0.78302001953125, 0.894805908203125, 1.006591796875, 1.118377685546875, 1.23016357421875, 1.341949462890625, 1.4537353515625, 1.565521240234375, 1.67730712890625, 1.789093017578125, 1.90087890625, 2.012664794921875, 2.12445068359375, 2.236236572265625, 2.3480224609375, 2.459808349609375, 2.57159423828125, 2.683380126953125, 2.795166015625, 2.906951904296875, 3.01873779296875, 3.130523681640625, 3.2423095703125, 3.354095458984375, 3.46588134765625, 3.577667236328125, 3.689453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 3.0, 5.0, 13.0, 11.0, 14.0, 19.0, 33.0, 62.0, 72.0, 142.0, 254.0, 413.0, 955.0, 3179.0, 20751.0, 467024.0, 527129.0, 23033.0, 3310.0, 1021.0, 436.0, 230.0, 140.0, 85.0, 45.0, 32.0, 31.0, 15.0, 22.0, 12.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.849609375, -1.783599853515625, -1.71759033203125, -1.651580810546875, -1.5855712890625, -1.519561767578125, -1.45355224609375, -1.387542724609375, -1.321533203125, -1.255523681640625, -1.18951416015625, -1.123504638671875, -1.0574951171875, -0.991485595703125, -0.92547607421875, -0.859466552734375, -0.79345703125, -0.727447509765625, -0.66143798828125, -0.595428466796875, -0.5294189453125, -0.463409423828125, -0.39739990234375, -0.331390380859375, -0.265380859375, -0.199371337890625, -0.13336181640625, -0.067352294921875, -0.0013427734375, 0.064666748046875, 0.13067626953125, 0.196685791015625, 0.2626953125, 0.328704833984375, 0.39471435546875, 0.460723876953125, 0.5267333984375, 0.592742919921875, 0.65875244140625, 0.724761962890625, 0.790771484375, 0.856781005859375, 0.92279052734375, 0.988800048828125, 1.0548095703125, 1.120819091796875, 1.18682861328125, 1.252838134765625, 1.31884765625, 1.384857177734375, 1.45086669921875, 1.516876220703125, 1.5828857421875, 1.648895263671875, 1.71490478515625, 1.780914306640625, 1.846923828125, 1.912933349609375, 1.97894287109375, 2.044952392578125, 2.1109619140625, 2.176971435546875, 2.24298095703125, 2.308990478515625, 2.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 12.0, 12.0, 14.0, 12.0, 19.0, 30.0, 36.0, 32.0, 48.0, 46.0, 50.0, 87.0, 89.0, 73.0, 88.0, 78.0, 59.0, 36.0, 45.0, 29.0, 28.0, 18.0, 15.0, 12.0, 6.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018835067749023438, -0.00018247216939926147, -0.00017659366130828857, -0.00017071515321731567, -0.00016483664512634277, -0.00015895813703536987, -0.00015307962894439697, -0.00014720112085342407, -0.00014132261276245117, -0.00013544410467147827, -0.00012956559658050537, -0.00012368708848953247, -0.00011780858039855957, -0.00011193007230758667, -0.00010605156421661377, -0.00010017305612564087, -9.429454803466797e-05, -8.841603994369507e-05, -8.253753185272217e-05, -7.665902376174927e-05, -7.078051567077637e-05, -6.490200757980347e-05, -5.9023499488830566e-05, -5.3144991397857666e-05, -4.7266483306884766e-05, -4.1387975215911865e-05, -3.5509467124938965e-05, -2.9630959033966064e-05, -2.3752450942993164e-05, -1.7873942852020264e-05, -1.1995434761047363e-05, -6.116926670074463e-06, -2.384185791015625e-07, 5.640089511871338e-06, 1.1518597602844238e-05, 1.739710569381714e-05, 2.327561378479004e-05, 2.915412187576294e-05, 3.503262996673584e-05, 4.091113805770874e-05, 4.678964614868164e-05, 5.266815423965454e-05, 5.854666233062744e-05, 6.442517042160034e-05, 7.030367851257324e-05, 7.618218660354614e-05, 8.206069469451904e-05, 8.793920278549194e-05, 9.381771087646484e-05, 9.969621896743774e-05, 0.00010557472705841064, 0.00011145323514938354, 0.00011733174324035645, 0.00012321025133132935, 0.00012908875942230225, 0.00013496726751327515, 0.00014084577560424805, 0.00014672428369522095, 0.00015260279178619385, 0.00015848129987716675, 0.00016435980796813965, 0.00017023831605911255, 0.00017611682415008545, 0.00018199533224105835, 0.00018787384033203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 12.0, 18.0, 22.0, 36.0, 66.0, 96.0, 181.0, 409.0, 1023.0, 3811.0, 45000.0, 911474.0, 79392.0, 4867.0, 1191.0, 437.0, 204.0, 94.0, 77.0, 46.0, 24.0, 23.0, 14.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.69921875, -3.605743408203125, -3.51226806640625, -3.418792724609375, -3.3253173828125, -3.231842041015625, -3.13836669921875, -3.044891357421875, -2.951416015625, -2.857940673828125, -2.76446533203125, -2.670989990234375, -2.5775146484375, -2.484039306640625, -2.39056396484375, -2.297088623046875, -2.20361328125, -2.110137939453125, -2.01666259765625, -1.923187255859375, -1.8297119140625, -1.736236572265625, -1.64276123046875, -1.549285888671875, -1.455810546875, -1.362335205078125, -1.26885986328125, -1.175384521484375, -1.0819091796875, -0.988433837890625, -0.89495849609375, -0.801483154296875, -0.7080078125, -0.614532470703125, -0.52105712890625, -0.427581787109375, -0.3341064453125, -0.240631103515625, -0.14715576171875, -0.053680419921875, 0.039794921875, 0.133270263671875, 0.22674560546875, 0.320220947265625, 0.4136962890625, 0.507171630859375, 0.60064697265625, 0.694122314453125, 0.78759765625, 0.881072998046875, 0.97454833984375, 1.068023681640625, 1.1614990234375, 1.254974365234375, 1.34844970703125, 1.441925048828125, 1.535400390625, 1.628875732421875, 1.72235107421875, 1.815826416015625, 1.9093017578125, 2.002777099609375, 2.09625244140625, 2.189727783203125, 2.283203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 12.0, 17.0, 35.0, 31.0, 40.0, 43.0, 58.0, 73.0, 90.0, 85.0, 81.0, 81.0, 78.0, 65.0, 46.0, 30.0, 28.0, 16.0, 10.0, 11.0, 12.0, 12.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.234375, -1.1913909912109375, -1.148406982421875, -1.1054229736328125, -1.06243896484375, -1.0194549560546875, -0.976470947265625, -0.9334869384765625, -0.8905029296875, -0.8475189208984375, -0.804534912109375, -0.7615509033203125, -0.71856689453125, -0.6755828857421875, -0.632598876953125, -0.5896148681640625, -0.546630859375, -0.5036468505859375, -0.460662841796875, -0.4176788330078125, -0.37469482421875, -0.3317108154296875, -0.288726806640625, -0.2457427978515625, -0.2027587890625, -0.1597747802734375, -0.116790771484375, -0.0738067626953125, -0.03082275390625, 0.0121612548828125, 0.055145263671875, 0.0981292724609375, 0.14111328125, 0.1840972900390625, 0.227081298828125, 0.2700653076171875, 0.31304931640625, 0.3560333251953125, 0.399017333984375, 0.4420013427734375, 0.4849853515625, 0.5279693603515625, 0.570953369140625, 0.6139373779296875, 0.65692138671875, 0.6999053955078125, 0.742889404296875, 0.7858734130859375, 0.828857421875, 0.8718414306640625, 0.914825439453125, 0.9578094482421875, 1.00079345703125, 1.0437774658203125, 1.086761474609375, 1.1297454833984375, 1.1727294921875, 1.2157135009765625, 1.258697509765625, 1.3016815185546875, 1.34466552734375, 1.3876495361328125, 1.430633544921875, 1.4736175537109375, 1.5166015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 42.0, 149.0, 354.0, 301.0, 108.0, 26.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015113830566406, -20.432607650756836, -18.850101470947266, -17.267597198486328, -15.685091018676758, -14.102584838867188, -12.520078659057617, -10.937573432922363, -9.355067253112793, -7.772561550140381, -6.190055847167969, -4.607549667358398, -3.0250439643859863, -1.4425382614135742, 0.1399679183959961, 1.72247314453125, 3.3049793243408203, 4.887485027313232, 6.4699907302856445, 8.052496910095215, 9.635002136230469, 11.217508316040039, 12.80001449584961, 14.382519721984863, 15.965025901794434, 17.547531127929688, 19.130037307739258, 20.712543487548828, 22.2950496673584, 23.87755584716797, 25.460060119628906, 27.042566299438477, 28.625072479248047, 30.207578659057617, 31.790084838867188, 33.372589111328125, 34.95509719848633, 36.537601470947266, 38.12010955810547, 39.702613830566406, 41.285118103027344, 42.86762237548828, 44.450130462646484, 46.03263473510742, 47.615142822265625, 49.19764709472656, 50.7801513671875, 52.3626594543457, 53.945167541503906, 55.527671813964844, 57.11017990112305, 58.692684173583984, 60.27519226074219, 61.857696533203125, 63.44020080566406, 65.022705078125, 66.60520935058594, 68.18771362304688, 69.77021789550781, 71.35272979736328, 72.93523406982422, 74.51773834228516, 76.1002426147461, 77.68274688720703, 79.2652587890625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 7.0, 10.0, 11.0, 6.0, 21.0, 7.0, 31.0, 20.0, 34.0, 29.0, 30.0, 47.0, 44.0, 45.0, 36.0, 32.0, 50.0, 46.0, 56.0, 39.0, 28.0, 36.0, 37.0, 35.0, 39.0, 37.0, 25.0, 20.0, 15.0, 26.0, 18.0, 13.0, 19.0, 7.0, 9.0, 8.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.968815803527832, -12.532960891723633, -12.097105979919434, -11.661251068115234, -11.225396156311035, -10.789541244506836, -10.35368537902832, -9.917831420898438, -9.481975555419922, -9.046120643615723, -8.610265731811523, -8.174410820007324, -7.738555908203125, -7.302700996398926, -6.866845607757568, -6.430990695953369, -5.995136260986328, -5.559281349182129, -5.12342643737793, -4.6875715255737305, -4.251716613769531, -3.815861463546753, -3.3800063133239746, -2.9441514015197754, -2.508296489715576, -2.072441577911377, -1.6365865468978882, -1.2007315158843994, -0.7648766040802002, -0.329021692276001, 0.10683345794677734, 0.5426883697509766, 0.9785423278808594, 1.4143972396850586, 1.8502522706985474, 2.286107301712036, 2.7219622135162354, 3.1578171253204346, 3.593672275543213, 4.029527187347412, 4.465382099151611, 4.9012370109558105, 5.33709192276001, 5.772947311401367, 6.208802223205566, 6.644657135009766, 7.080512046813965, 7.516366958618164, 7.952221870422363, 8.388076782226562, 8.823931694030762, 9.259786605834961, 9.69564151763916, 10.13149642944336, 10.567352294921875, 11.003206253051758, 11.439062118530273, 11.874917030334473, 12.310771942138672, 12.746626853942871, 13.18248176574707, 13.61833667755127, 14.054191589355469, 14.490047454833984, 14.925901412963867]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 12.0, 14.0, 28.0, 20.0, 42.0, 54.0, 94.0, 98.0, 175.0, 250.0, 444.0, 770.0, 1452.0, 2877.0, 8056.0, 35642.0, 4042361.0, 81358.0, 12247.0, 4059.0, 1826.0, 954.0, 510.0, 328.0, 186.0, 124.0, 77.0, 54.0, 48.0, 31.0, 17.0, 13.0, 12.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.827728271484375, -2.73553466796875, -2.643341064453125, -2.5511474609375, -2.458953857421875, -2.36676025390625, -2.274566650390625, -2.182373046875, -2.090179443359375, -1.99798583984375, -1.905792236328125, -1.8135986328125, -1.721405029296875, -1.62921142578125, -1.537017822265625, -1.44482421875, -1.352630615234375, -1.26043701171875, -1.168243408203125, -1.0760498046875, -0.983856201171875, -0.89166259765625, -0.799468994140625, -0.707275390625, -0.615081787109375, -0.52288818359375, -0.430694580078125, -0.3385009765625, -0.246307373046875, -0.15411376953125, -0.061920166015625, 0.0302734375, 0.122467041015625, 0.21466064453125, 0.306854248046875, 0.3990478515625, 0.491241455078125, 0.58343505859375, 0.675628662109375, 0.767822265625, 0.860015869140625, 0.95220947265625, 1.044403076171875, 1.1365966796875, 1.228790283203125, 1.32098388671875, 1.413177490234375, 1.50537109375, 1.597564697265625, 1.68975830078125, 1.781951904296875, 1.8741455078125, 1.966339111328125, 2.05853271484375, 2.150726318359375, 2.242919921875, 2.335113525390625, 2.42730712890625, 2.519500732421875, 2.6116943359375, 2.703887939453125, 2.79608154296875, 2.888275146484375, 2.98046875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 8.0, 10.0, 13.0, 15.0, 15.0, 13.0, 24.0, 14.0, 32.0, 43.0, 62.0, 45.0, 67.0, 86.0, 83.0, 60.0, 79.0, 68.0, 58.0, 46.0, 36.0, 25.0, 28.0, 19.0, 13.0, 6.0, 7.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8623046875, -0.83306884765625, -0.8038330078125, -0.77459716796875, -0.745361328125, -0.71612548828125, -0.6868896484375, -0.65765380859375, -0.62841796875, -0.59918212890625, -0.5699462890625, -0.54071044921875, -0.511474609375, -0.48223876953125, -0.4530029296875, -0.42376708984375, -0.39453125, -0.36529541015625, -0.3360595703125, -0.30682373046875, -0.277587890625, -0.24835205078125, -0.2191162109375, -0.18988037109375, -0.16064453125, -0.13140869140625, -0.1021728515625, -0.07293701171875, -0.043701171875, -0.01446533203125, 0.0147705078125, 0.04400634765625, 0.0732421875, 0.10247802734375, 0.1317138671875, 0.16094970703125, 0.190185546875, 0.21942138671875, 0.2486572265625, 0.27789306640625, 0.30712890625, 0.33636474609375, 0.3656005859375, 0.39483642578125, 0.424072265625, 0.45330810546875, 0.4825439453125, 0.51177978515625, 0.541015625, 0.57025146484375, 0.5994873046875, 0.62872314453125, 0.657958984375, 0.68719482421875, 0.7164306640625, 0.74566650390625, 0.77490234375, 0.80413818359375, 0.8333740234375, 0.86260986328125, 0.891845703125, 0.92108154296875, 0.9503173828125, 0.97955322265625, 1.0087890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 18.0, 35.0, 44.0, 58.0, 95.0, 145.0, 263.0, 433.0, 804.0, 1670.0, 4066.0, 15333.0, 293901.0, 3847668.0, 20714.0, 4924.0, 1901.0, 972.0, 501.0, 281.0, 163.0, 96.0, 62.0, 50.0, 23.0, 11.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2265625, -3.107421875, -2.98828125, -2.869140625, -2.75, -2.630859375, -2.51171875, -2.392578125, -2.2734375, -2.154296875, -2.03515625, -1.916015625, -1.796875, -1.677734375, -1.55859375, -1.439453125, -1.3203125, -1.201171875, -1.08203125, -0.962890625, -0.84375, -0.724609375, -0.60546875, -0.486328125, -0.3671875, -0.248046875, -0.12890625, -0.009765625, 0.109375, 0.228515625, 0.34765625, 0.466796875, 0.5859375, 0.705078125, 0.82421875, 0.943359375, 1.0625, 1.181640625, 1.30078125, 1.419921875, 1.5390625, 1.658203125, 1.77734375, 1.896484375, 2.015625, 2.134765625, 2.25390625, 2.373046875, 2.4921875, 2.611328125, 2.73046875, 2.849609375, 2.96875, 3.087890625, 3.20703125, 3.326171875, 3.4453125, 3.564453125, 3.68359375, 3.802734375, 3.921875, 4.041015625, 4.16015625, 4.279296875, 4.3984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 19.0, 31.0, 46.0, 106.0, 732.0, 2872.0, 94.0, 62.0, 34.0, 13.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64892578125, -0.6292800903320312, -0.6096343994140625, -0.5899887084960938, -0.570343017578125, -0.5506973266601562, -0.5310516357421875, -0.5114059448242188, -0.49176025390625, -0.47211456298828125, -0.4524688720703125, -0.43282318115234375, -0.413177490234375, -0.39353179931640625, -0.3738861083984375, -0.35424041748046875, -0.3345947265625, -0.31494903564453125, -0.2953033447265625, -0.27565765380859375, -0.256011962890625, -0.23636627197265625, -0.2167205810546875, -0.19707489013671875, -0.17742919921875, -0.15778350830078125, -0.1381378173828125, -0.11849212646484375, -0.098846435546875, -0.07920074462890625, -0.0595550537109375, -0.03990936279296875, -0.020263671875, -0.00061798095703125, 0.0190277099609375, 0.03867340087890625, 0.058319091796875, 0.07796478271484375, 0.0976104736328125, 0.11725616455078125, 0.13690185546875, 0.15654754638671875, 0.1761932373046875, 0.19583892822265625, 0.215484619140625, 0.23513031005859375, 0.2547760009765625, 0.27442169189453125, 0.2940673828125, 0.31371307373046875, 0.3333587646484375, 0.35300445556640625, 0.372650146484375, 0.39229583740234375, 0.4119415283203125, 0.43158721923828125, 0.45123291015625, 0.47087860107421875, 0.4905242919921875, 0.5101699829101562, 0.529815673828125, 0.5494613647460938, 0.5691070556640625, 0.5887527465820312, 0.6083984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 10.0, 16.0, 17.0, 15.0, 33.0, 56.0, 52.0, 79.0, 88.0, 90.0, 85.0, 95.0, 88.0, 64.0, 58.0, 34.0, 32.0, 25.0, 14.0, 6.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9634976387023926, -1.9067236185073853, -1.8499497175216675, -1.7931756973266602, -1.7364016771316528, -1.679627776145935, -1.6228537559509277, -1.56607985496521, -1.5093058347702026, -1.4525318145751953, -1.3957579135894775, -1.3389838933944702, -1.282209873199463, -1.2254359722137451, -1.1686619520187378, -1.1118879318237305, -1.0551140308380127, -0.9983400702476501, -0.9415660500526428, -0.8847920894622803, -0.8280181288719177, -0.7712441682815552, -0.7144701480865479, -0.6576961874961853, -0.6009221076965332, -0.5441481471061707, -0.4873741567134857, -0.4306001663208008, -0.37382620573043823, -0.3170522153377533, -0.26027822494506836, -0.2035042643547058, -0.14673030376434326, -0.08995632827281952, -0.03318234533071518, 0.02359163761138916, 0.0803656131029129, 0.13713958859443665, 0.19391357898712158, 0.25068753957748413, 0.30746152997016907, 0.364235520362854, 0.42100948095321655, 0.4777834713459015, 0.5345574617385864, 0.591331422328949, 0.6481053829193115, 0.7048794031143188, 0.7616533637046814, 0.818427324295044, 0.8752013444900513, 0.9319753050804138, 0.9887492656707764, 1.0455232858657837, 1.102297306060791, 1.1590712070465088, 1.2158452272415161, 1.2726192474365234, 1.3293931484222412, 1.3861671686172485, 1.4429411888122559, 1.4997150897979736, 1.556489109992981, 1.6132631301879883, 1.670037031173706]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 8.0, 13.0, 9.0, 18.0, 32.0, 21.0, 22.0, 28.0, 26.0, 40.0, 32.0, 43.0, 52.0, 49.0, 59.0, 52.0, 50.0, 44.0, 47.0, 43.0, 38.0, 37.0, 36.0, 22.0, 29.0, 19.0, 20.0, 15.0, 10.0, 12.0, 13.0, 19.0, 5.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2582471370697021, -1.2196928262710571, -1.1811383962631226, -1.1425840854644775, -1.104029655456543, -1.065475344657898, -1.0269209146499634, -0.9883666038513184, -0.9498122334480286, -0.9112578630447388, -0.872703492641449, -0.8341491222381592, -0.7955948114395142, -0.7570403814315796, -0.7184860706329346, -0.6799317002296448, -0.641377329826355, -0.6028229594230652, -0.5642685890197754, -0.5257142186164856, -0.4871598780155182, -0.4486055076122284, -0.410051167011261, -0.3714967966079712, -0.3329424262046814, -0.2943880558013916, -0.2558336853981018, -0.2172793447971344, -0.1787249743938446, -0.1401706039905548, -0.10161624848842621, -0.06306189298629761, -0.024507522583007812, 0.014046840369701385, 0.052601203322410583, 0.09115556627511978, 0.12970992922782898, 0.16826429963111877, 0.20681865513324738, 0.24537301063537598, 0.28392738103866577, 0.32248175144195557, 0.36103612184524536, 0.39959046244621277, 0.43814483284950256, 0.47669920325279236, 0.5152535438537598, 0.5538079142570496, 0.5923622846603394, 0.6309166550636292, 0.669471025466919, 0.7080253958702087, 0.7465797662734985, 0.7851340770721436, 0.8236884474754333, 0.8622428178787231, 0.9007971882820129, 0.9393515586853027, 0.9779059290885925, 1.0164602994918823, 1.0550146102905273, 1.093569040298462, 1.132123351097107, 1.170677661895752, 1.2092320919036865]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 11.0, 9.0, 20.0, 23.0, 26.0, 40.0, 80.0, 93.0, 205.0, 354.0, 646.0, 1442.0, 3127.0, 7621.0, 21459.0, 63312.0, 187565.0, 391144.0, 242390.0, 83445.0, 27945.0, 10013.0, 3910.0, 1803.0, 815.0, 457.0, 203.0, 139.0, 98.0, 48.0, 34.0, 27.0, 14.0, 10.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.447265625, -1.4029083251953125, -1.358551025390625, -1.3141937255859375, -1.26983642578125, -1.2254791259765625, -1.181121826171875, -1.1367645263671875, -1.0924072265625, -1.0480499267578125, -1.003692626953125, -0.9593353271484375, -0.91497802734375, -0.8706207275390625, -0.826263427734375, -0.7819061279296875, -0.737548828125, -0.6931915283203125, -0.648834228515625, -0.6044769287109375, -0.56011962890625, -0.5157623291015625, -0.471405029296875, -0.4270477294921875, -0.3826904296875, -0.3383331298828125, -0.293975830078125, -0.2496185302734375, -0.20526123046875, -0.1609039306640625, -0.116546630859375, -0.0721893310546875, -0.02783203125, 0.0165252685546875, 0.060882568359375, 0.1052398681640625, 0.14959716796875, 0.1939544677734375, 0.238311767578125, 0.2826690673828125, 0.3270263671875, 0.3713836669921875, 0.415740966796875, 0.4600982666015625, 0.50445556640625, 0.5488128662109375, 0.593170166015625, 0.6375274658203125, 0.681884765625, 0.7262420654296875, 0.770599365234375, 0.8149566650390625, 0.85931396484375, 0.9036712646484375, 0.948028564453125, 0.9923858642578125, 1.0367431640625, 1.0811004638671875, 1.125457763671875, 1.1698150634765625, 1.21417236328125, 1.2585296630859375, 1.302886962890625, 1.3472442626953125, 1.3916015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 10.0, 14.0, 15.0, 17.0, 17.0, 36.0, 33.0, 38.0, 44.0, 64.0, 72.0, 66.0, 74.0, 69.0, 69.0, 59.0, 54.0, 51.0, 48.0, 28.0, 21.0, 16.0, 19.0, 5.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.870452880859375, -0.84100341796875, -0.811553955078125, -0.7821044921875, -0.752655029296875, -0.72320556640625, -0.693756103515625, -0.664306640625, -0.634857177734375, -0.60540771484375, -0.575958251953125, -0.5465087890625, -0.517059326171875, -0.48760986328125, -0.458160400390625, -0.4287109375, -0.399261474609375, -0.36981201171875, -0.340362548828125, -0.3109130859375, -0.281463623046875, -0.25201416015625, -0.222564697265625, -0.193115234375, -0.163665771484375, -0.13421630859375, -0.104766845703125, -0.0753173828125, -0.045867919921875, -0.01641845703125, 0.013031005859375, 0.04248046875, 0.071929931640625, 0.10137939453125, 0.130828857421875, 0.1602783203125, 0.189727783203125, 0.21917724609375, 0.248626708984375, 0.278076171875, 0.307525634765625, 0.33697509765625, 0.366424560546875, 0.3958740234375, 0.425323486328125, 0.45477294921875, 0.484222412109375, 0.513671875, 0.543121337890625, 0.57257080078125, 0.602020263671875, 0.6314697265625, 0.660919189453125, 0.69036865234375, 0.719818115234375, 0.749267578125, 0.778717041015625, 0.80816650390625, 0.837615966796875, 0.8670654296875, 0.896514892578125, 0.92596435546875, 0.955413818359375, 0.98486328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 15.0, 20.0, 53.0, 104.0, 246.0, 672.0, 2359.0, 66825.0, 966939.0, 9192.0, 1319.0, 419.0, 182.0, 72.0, 53.0, 21.0, 15.0, 7.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1640625, -8.91156005859375, -8.6590576171875, -8.40655517578125, -8.154052734375, -7.90155029296875, -7.6490478515625, -7.39654541015625, -7.14404296875, -6.89154052734375, -6.6390380859375, -6.38653564453125, -6.134033203125, -5.88153076171875, -5.6290283203125, -5.37652587890625, -5.1240234375, -4.87152099609375, -4.6190185546875, -4.36651611328125, -4.114013671875, -3.86151123046875, -3.6090087890625, -3.35650634765625, -3.10400390625, -2.85150146484375, -2.5989990234375, -2.34649658203125, -2.093994140625, -1.84149169921875, -1.5889892578125, -1.33648681640625, -1.083984375, -0.83148193359375, -0.5789794921875, -0.32647705078125, -0.073974609375, 0.17852783203125, 0.4310302734375, 0.68353271484375, 0.93603515625, 1.18853759765625, 1.4410400390625, 1.69354248046875, 1.946044921875, 2.19854736328125, 2.4510498046875, 2.70355224609375, 2.9560546875, 3.20855712890625, 3.4610595703125, 3.71356201171875, 3.966064453125, 4.21856689453125, 4.4710693359375, 4.72357177734375, 4.97607421875, 5.22857666015625, 5.4810791015625, 5.73358154296875, 5.986083984375, 6.23858642578125, 6.4910888671875, 6.74359130859375, 6.99609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 10.0, 19.0, 26.0, 35.0, 38.0, 62.0, 59.0, 57.0, 72.0, 72.0, 88.0, 83.0, 63.0, 65.0, 58.0, 45.0, 26.0, 25.0, 19.0, 11.0, 9.0, 9.0, 12.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.84716796875, -3.6748046875, -3.50244140625, -3.330078125, -3.15771484375, -2.9853515625, -2.81298828125, -2.640625, -2.46826171875, -2.2958984375, -2.12353515625, -1.951171875, -1.77880859375, -1.6064453125, -1.43408203125, -1.26171875, -1.08935546875, -0.9169921875, -0.74462890625, -0.572265625, -0.39990234375, -0.2275390625, -0.05517578125, 0.1171875, 0.28955078125, 0.4619140625, 0.63427734375, 0.806640625, 0.97900390625, 1.1513671875, 1.32373046875, 1.49609375, 1.66845703125, 1.8408203125, 2.01318359375, 2.185546875, 2.35791015625, 2.5302734375, 2.70263671875, 2.875, 3.04736328125, 3.2197265625, 3.39208984375, 3.564453125, 3.73681640625, 3.9091796875, 4.08154296875, 4.25390625, 4.42626953125, 4.5986328125, 4.77099609375, 4.943359375, 5.11572265625, 5.2880859375, 5.46044921875, 5.6328125, 5.80517578125, 5.9775390625, 6.14990234375, 6.322265625, 6.49462890625, 6.6669921875, 6.83935546875, 7.01171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 14.0, 5.0, 10.0, 21.0, 31.0, 48.0, 63.0, 106.0, 222.0, 432.0, 1261.0, 5983.0, 172377.0, 845480.0, 18983.0, 2140.0, 650.0, 291.0, 154.0, 94.0, 58.0, 34.0, 30.0, 18.0, 7.0, 6.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.406280517578125, -2.31451416015625, -2.222747802734375, -2.1309814453125, -2.039215087890625, -1.94744873046875, -1.855682373046875, -1.763916015625, -1.672149658203125, -1.58038330078125, -1.488616943359375, -1.3968505859375, -1.305084228515625, -1.21331787109375, -1.121551513671875, -1.02978515625, -0.938018798828125, -0.84625244140625, -0.754486083984375, -0.6627197265625, -0.570953369140625, -0.47918701171875, -0.387420654296875, -0.295654296875, -0.203887939453125, -0.11212158203125, -0.020355224609375, 0.0714111328125, 0.163177490234375, 0.25494384765625, 0.346710205078125, 0.4384765625, 0.530242919921875, 0.62200927734375, 0.713775634765625, 0.8055419921875, 0.897308349609375, 0.98907470703125, 1.080841064453125, 1.172607421875, 1.264373779296875, 1.35614013671875, 1.447906494140625, 1.5396728515625, 1.631439208984375, 1.72320556640625, 1.814971923828125, 1.90673828125, 1.998504638671875, 2.09027099609375, 2.182037353515625, 2.2738037109375, 2.365570068359375, 2.45733642578125, 2.549102783203125, 2.640869140625, 2.732635498046875, 2.82440185546875, 2.916168212890625, 3.0079345703125, 3.099700927734375, 3.19146728515625, 3.283233642578125, 3.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 12.0, 11.0, 14.0, 27.0, 29.0, 37.0, 44.0, 55.0, 65.0, 102.0, 109.0, 89.0, 79.0, 65.0, 45.0, 44.0, 26.0, 18.0, 23.0, 20.0, 10.0, 10.0, 5.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00023055076599121094, -0.00022425130009651184, -0.00021795183420181274, -0.00021165236830711365, -0.00020535290241241455, -0.00019905343651771545, -0.00019275397062301636, -0.00018645450472831726, -0.00018015503883361816, -0.00017385557293891907, -0.00016755610704421997, -0.00016125664114952087, -0.00015495717525482178, -0.00014865770936012268, -0.00014235824346542358, -0.0001360587775707245, -0.0001297593116760254, -0.0001234598457813263, -0.0001171603798866272, -0.0001108609139919281, -0.000104561448097229, -9.826198220252991e-05, -9.196251630783081e-05, -8.566305041313171e-05, -7.936358451843262e-05, -7.306411862373352e-05, -6.676465272903442e-05, -6.046518683433533e-05, -5.416572093963623e-05, -4.7866255044937134e-05, -4.156678915023804e-05, -3.526732325553894e-05, -2.8967857360839844e-05, -2.2668391466140747e-05, -1.636892557144165e-05, -1.0069459676742554e-05, -3.769993782043457e-06, 2.5294721126556396e-06, 8.828938007354736e-06, 1.5128403902053833e-05, 2.142786979675293e-05, 2.7727335691452026e-05, 3.402680158615112e-05, 4.032626748085022e-05, 4.6625733375549316e-05, 5.292519927024841e-05, 5.922466516494751e-05, 6.55241310596466e-05, 7.18235969543457e-05, 7.81230628490448e-05, 8.44225287437439e-05, 9.072199463844299e-05, 9.702146053314209e-05, 0.00010332092642784119, 0.00010962039232254028, 0.00011591985821723938, 0.00012221932411193848, 0.00012851879000663757, 0.00013481825590133667, 0.00014111772179603577, 0.00014741718769073486, 0.00015371665358543396, 0.00016001611948013306, 0.00016631558537483215, 0.00017261505126953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 8.0, 10.0, 10.0, 29.0, 39.0, 45.0, 67.0, 135.0, 285.0, 578.0, 1366.0, 4407.0, 35598.0, 776840.0, 213318.0, 11530.0, 2423.0, 924.0, 409.0, 212.0, 108.0, 61.0, 39.0, 25.0, 22.0, 23.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.405120849609375, -2.33172607421875, -2.258331298828125, -2.1849365234375, -2.111541748046875, -2.03814697265625, -1.964752197265625, -1.891357421875, -1.817962646484375, -1.74456787109375, -1.671173095703125, -1.5977783203125, -1.524383544921875, -1.45098876953125, -1.377593994140625, -1.30419921875, -1.230804443359375, -1.15740966796875, -1.084014892578125, -1.0106201171875, -0.937225341796875, -0.86383056640625, -0.790435791015625, -0.717041015625, -0.643646240234375, -0.57025146484375, -0.496856689453125, -0.4234619140625, -0.350067138671875, -0.27667236328125, -0.203277587890625, -0.1298828125, -0.056488037109375, 0.01690673828125, 0.090301513671875, 0.1636962890625, 0.237091064453125, 0.31048583984375, 0.383880615234375, 0.457275390625, 0.530670166015625, 0.60406494140625, 0.677459716796875, 0.7508544921875, 0.824249267578125, 0.89764404296875, 0.971038818359375, 1.04443359375, 1.117828369140625, 1.19122314453125, 1.264617919921875, 1.3380126953125, 1.411407470703125, 1.48480224609375, 1.558197021484375, 1.631591796875, 1.704986572265625, 1.77838134765625, 1.851776123046875, 1.9251708984375, 1.998565673828125, 2.07196044921875, 2.145355224609375, 2.21875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 15.0, 12.0, 26.0, 26.0, 55.0, 60.0, 101.0, 109.0, 120.0, 121.0, 88.0, 68.0, 47.0, 31.0, 30.0, 19.0, 14.0, 9.0, 6.0, 5.0, 10.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8759918212890625, -1.807647705078125, -1.7393035888671875, -1.67095947265625, -1.6026153564453125, -1.534271240234375, -1.4659271240234375, -1.3975830078125, -1.3292388916015625, -1.260894775390625, -1.1925506591796875, -1.12420654296875, -1.0558624267578125, -0.987518310546875, -0.9191741943359375, -0.850830078125, -0.7824859619140625, -0.714141845703125, -0.6457977294921875, -0.57745361328125, -0.5091094970703125, -0.440765380859375, -0.3724212646484375, -0.3040771484375, -0.2357330322265625, -0.167388916015625, -0.0990447998046875, -0.03070068359375, 0.0376434326171875, 0.105987548828125, 0.1743316650390625, 0.24267578125, 0.3110198974609375, 0.379364013671875, 0.4477081298828125, 0.51605224609375, 0.5843963623046875, 0.652740478515625, 0.7210845947265625, 0.7894287109375, 0.8577728271484375, 0.926116943359375, 0.9944610595703125, 1.06280517578125, 1.1311492919921875, 1.199493408203125, 1.2678375244140625, 1.336181640625, 1.4045257568359375, 1.472869873046875, 1.5412139892578125, 1.60955810546875, 1.6779022216796875, 1.746246337890625, 1.8145904541015625, 1.8829345703125, 1.9512786865234375, 2.019622802734375, 2.0879669189453125, 2.15631103515625, 2.2246551513671875, 2.292999267578125, 2.3613433837890625, 2.4296875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 12.0, 53.0, 235.0, 423.0, 213.0, 43.0, 12.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.392494201660156, -32.712867736816406, -31.033245086669922, -29.353618621826172, -27.673995971679688, -25.994369506835938, -24.31474494934082, -22.635120391845703, -20.955495834350586, -19.27587127685547, -17.59624671936035, -15.916621208190918, -14.2369966506958, -12.557372093200684, -10.87774658203125, -9.198122024536133, -7.518497467041016, -5.838872909545898, -4.159247875213623, -2.4796228408813477, -0.7999982833862305, 0.8796262741088867, 2.5592517852783203, 4.2388763427734375, 5.918500900268555, 7.598125457763672, 9.277750015258789, 10.957375526428223, 12.63700008392334, 14.316624641418457, 15.99625015258789, 17.675874710083008, 19.355499267578125, 21.035123825073242, 22.71474838256836, 24.39437484741211, 26.073997497558594, 27.753623962402344, 29.43324851989746, 31.112873077392578, 32.79249572753906, 34.47212219238281, 36.1517448425293, 37.83137130737305, 39.51099395751953, 41.19062042236328, 42.87024688720703, 44.549869537353516, 46.229496002197266, 47.909122467041016, 49.5887451171875, 51.26837158203125, 52.947994232177734, 54.627620697021484, 56.30724334716797, 57.98686981201172, 59.66649627685547, 61.34612274169922, 63.0257453918457, 64.70536804199219, 66.38499450683594, 68.06462097167969, 69.74424743652344, 71.42387390136719, 73.1034927368164]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 8.0, 10.0, 6.0, 13.0, 14.0, 15.0, 19.0, 29.0, 22.0, 22.0, 21.0, 27.0, 41.0, 40.0, 44.0, 46.0, 37.0, 51.0, 47.0, 48.0, 42.0, 40.0, 40.0, 35.0, 35.0, 31.0, 32.0, 24.0, 15.0, 16.0, 15.0, 16.0, 9.0, 8.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.982881546020508, -12.583287239074707, -12.183693885803223, -11.784099578857422, -11.384506225585938, -10.984911918640137, -10.585317611694336, -10.185724258422852, -9.78612995147705, -9.38653564453125, -8.986942291259766, -8.587347984313965, -8.187753677368164, -7.78816032409668, -7.388566017150879, -6.988972187042236, -6.589378356933594, -6.189784526824951, -5.790190696716309, -5.390596389770508, -4.991002559661865, -4.591408729553223, -4.191814422607422, -3.7922205924987793, -3.3926267623901367, -2.993032932281494, -2.5934388637542725, -2.193844795227051, -1.7942509651184082, -1.394657015800476, -0.995063066482544, -0.5954689979553223, -0.1958761215209961, 0.20371782779693604, 0.6033117771148682, 1.0029057264328003, 1.4024996757507324, 1.8020936250686646, 2.2016875743865967, 2.6012816429138184, 3.000875473022461, 3.4004693031311035, 3.800063371658325, 4.199657440185547, 4.5992512702941895, 4.998845100402832, 5.398439407348633, 5.798033237457275, 6.197627067565918, 6.5972208976745605, 6.996814727783203, 7.396409034729004, 7.7960028648376465, 8.195596694946289, 8.59519100189209, 8.99478530883789, 9.394378662109375, 9.793972969055176, 10.19356632232666, 10.593160629272461, 10.992753982543945, 11.392348289489746, 11.791942596435547, 12.191535949707031, 12.591130256652832]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 9.0, 14.0, 14.0, 15.0, 25.0, 32.0, 42.0, 72.0, 85.0, 138.0, 186.0, 300.0, 378.0, 656.0, 1095.0, 1896.0, 4033.0, 9992.0, 33704.0, 295228.0, 3757550.0, 61888.0, 15139.0, 5579.0, 2492.0, 1389.0, 762.0, 498.0, 329.0, 238.0, 144.0, 103.0, 69.0, 47.0, 39.0, 30.0, 15.0, 15.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.14453125, -2.077911376953125, -2.01129150390625, -1.944671630859375, -1.8780517578125, -1.811431884765625, -1.74481201171875, -1.678192138671875, -1.611572265625, -1.544952392578125, -1.47833251953125, -1.411712646484375, -1.3450927734375, -1.278472900390625, -1.21185302734375, -1.145233154296875, -1.07861328125, -1.011993408203125, -0.94537353515625, -0.878753662109375, -0.8121337890625, -0.745513916015625, -0.67889404296875, -0.612274169921875, -0.545654296875, -0.479034423828125, -0.41241455078125, -0.345794677734375, -0.2791748046875, -0.212554931640625, -0.14593505859375, -0.079315185546875, -0.0126953125, 0.053924560546875, 0.12054443359375, 0.187164306640625, 0.2537841796875, 0.320404052734375, 0.38702392578125, 0.453643798828125, 0.520263671875, 0.586883544921875, 0.65350341796875, 0.720123291015625, 0.7867431640625, 0.853363037109375, 0.91998291015625, 0.986602783203125, 1.05322265625, 1.119842529296875, 1.18646240234375, 1.253082275390625, 1.3197021484375, 1.386322021484375, 1.45294189453125, 1.519561767578125, 1.586181640625, 1.652801513671875, 1.71942138671875, 1.786041259765625, 1.8526611328125, 1.919281005859375, 1.98590087890625, 2.052520751953125, 2.119140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 7.0, 12.0, 17.0, 11.0, 19.0, 27.0, 29.0, 45.0, 54.0, 50.0, 51.0, 61.0, 54.0, 65.0, 65.0, 62.0, 63.0, 53.0, 43.0, 50.0, 36.0, 21.0, 14.0, 19.0, 11.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8300933837890625, -0.805206298828125, -0.7803192138671875, -0.75543212890625, -0.7305450439453125, -0.705657958984375, -0.6807708740234375, -0.6558837890625, -0.6309967041015625, -0.606109619140625, -0.5812225341796875, -0.55633544921875, -0.5314483642578125, -0.506561279296875, -0.4816741943359375, -0.456787109375, -0.4319000244140625, -0.407012939453125, -0.3821258544921875, -0.35723876953125, -0.3323516845703125, -0.307464599609375, -0.2825775146484375, -0.2576904296875, -0.2328033447265625, -0.207916259765625, -0.1830291748046875, -0.15814208984375, -0.1332550048828125, -0.108367919921875, -0.0834808349609375, -0.05859375, -0.0337066650390625, -0.008819580078125, 0.0160675048828125, 0.04095458984375, 0.0658416748046875, 0.090728759765625, 0.1156158447265625, 0.1405029296875, 0.1653900146484375, 0.190277099609375, 0.2151641845703125, 0.24005126953125, 0.2649383544921875, 0.289825439453125, 0.3147125244140625, 0.339599609375, 0.3644866943359375, 0.389373779296875, 0.4142608642578125, 0.43914794921875, 0.4640350341796875, 0.488922119140625, 0.5138092041015625, 0.5386962890625, 0.5635833740234375, 0.588470458984375, 0.6133575439453125, 0.63824462890625, 0.6631317138671875, 0.688018798828125, 0.7129058837890625, 0.73779296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 11.0, 8.0, 7.0, 7.0, 19.0, 22.0, 17.0, 41.0, 77.0, 126.0, 202.0, 321.0, 604.0, 1146.0, 2357.0, 6205.0, 24501.0, 412099.0, 3689529.0, 42300.0, 8559.0, 2962.0, 1432.0, 751.0, 373.0, 201.0, 126.0, 94.0, 69.0, 38.0, 29.0, 17.0, 4.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.445068359375, -2.35498046875, -2.264892578125, -2.1748046875, -2.084716796875, -1.99462890625, -1.904541015625, -1.814453125, -1.724365234375, -1.63427734375, -1.544189453125, -1.4541015625, -1.364013671875, -1.27392578125, -1.183837890625, -1.09375, -1.003662109375, -0.91357421875, -0.823486328125, -0.7333984375, -0.643310546875, -0.55322265625, -0.463134765625, -0.373046875, -0.282958984375, -0.19287109375, -0.102783203125, -0.0126953125, 0.077392578125, 0.16748046875, 0.257568359375, 0.34765625, 0.437744140625, 0.52783203125, 0.617919921875, 0.7080078125, 0.798095703125, 0.88818359375, 0.978271484375, 1.068359375, 1.158447265625, 1.24853515625, 1.338623046875, 1.4287109375, 1.518798828125, 1.60888671875, 1.698974609375, 1.7890625, 1.879150390625, 1.96923828125, 2.059326171875, 2.1494140625, 2.239501953125, 2.32958984375, 2.419677734375, 2.509765625, 2.599853515625, 2.68994140625, 2.780029296875, 2.8701171875, 2.960205078125, 3.05029296875, 3.140380859375, 3.23046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 11.0, 19.0, 39.0, 45.0, 112.0, 337.0, 2780.0, 404.0, 148.0, 63.0, 31.0, 25.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.244140625, -1.2091598510742188, -1.1741790771484375, -1.1391983032226562, -1.104217529296875, -1.0692367553710938, -1.0342559814453125, -0.9992752075195312, -0.96429443359375, -0.9293136596679688, -0.8943328857421875, -0.8593521118164062, -0.824371337890625, -0.7893905639648438, -0.7544097900390625, -0.7194290161132812, -0.6844482421875, -0.6494674682617188, -0.6144866943359375, -0.5795059204101562, -0.544525146484375, -0.5095443725585938, -0.4745635986328125, -0.43958282470703125, -0.40460205078125, -0.36962127685546875, -0.3346405029296875, -0.29965972900390625, -0.264678955078125, -0.22969818115234375, -0.1947174072265625, -0.15973663330078125, -0.124755859375, -0.08977508544921875, -0.0547943115234375, -0.01981353759765625, 0.015167236328125, 0.05014801025390625, 0.0851287841796875, 0.12010955810546875, 0.15509033203125, 0.19007110595703125, 0.2250518798828125, 0.26003265380859375, 0.295013427734375, 0.32999420166015625, 0.3649749755859375, 0.39995574951171875, 0.4349365234375, 0.46991729736328125, 0.5048980712890625, 0.5398788452148438, 0.574859619140625, 0.6098403930664062, 0.6448211669921875, 0.6798019409179688, 0.71478271484375, 0.7497634887695312, 0.7847442626953125, 0.8197250366210938, 0.854705810546875, 0.8896865844726562, 0.9246673583984375, 0.9596481323242188, 0.99462890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 14.0, 19.0, 34.0, 59.0, 98.0, 121.0, 142.0, 141.0, 114.0, 91.0, 51.0, 27.0, 25.0, 17.0, 12.0, 6.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.239797592163086, -3.081843852996826, -2.9238898754119873, -2.7659361362457275, -2.6079823970794678, -2.450028419494629, -2.292074680328369, -2.1341209411621094, -1.97616708278656, -1.8182132244110107, -1.660259485244751, -1.5023056268692017, -1.3443517684936523, -1.1863980293273926, -1.0284441709518433, -0.8704904317855835, -0.7125365734100342, -0.5545827746391296, -0.3966289460659027, -0.23867511749267578, -0.08072131872177124, 0.0772324800491333, 0.23518633842468262, 0.3931400775909424, 0.5510939359664917, 0.7090477347373962, 0.8670015335083008, 1.02495539188385, 1.1829092502593994, 1.3408629894256592, 1.4988168478012085, 1.6567705869674683, 1.8147244453430176, 1.972678303718567, 2.130632162094116, 2.288585901260376, 2.4465396404266357, 2.6044936180114746, 2.7624473571777344, 2.920401096343994, 3.078354835510254, 3.2363085746765137, 3.3942625522613525, 3.5522162914276123, 3.710170030593872, 3.868124008178711, 4.026077747344971, 4.1840314865112305, 4.341985702514648, 4.499939441680908, 4.657893180847168, 4.815847396850586, 4.973801136016846, 5.1317548751831055, 5.289708614349365, 5.447662353515625, 5.605616092681885, 5.7635698318481445, 5.921523571014404, 6.079477310180664, 6.237431526184082, 6.395385265350342, 6.553339004516602, 6.711292743682861, 6.869246482849121]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 2.0, 8.0, 13.0, 10.0, 11.0, 18.0, 27.0, 21.0, 28.0, 26.0, 33.0, 31.0, 30.0, 47.0, 45.0, 40.0, 34.0, 35.0, 44.0, 46.0, 45.0, 38.0, 38.0, 39.0, 35.0, 17.0, 29.0, 29.0, 20.0, 20.0, 23.0, 16.0, 18.0, 9.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3008830547332764, -2.2314326763153076, -2.161982297897339, -2.09253191947937, -2.0230817794799805, -1.9536312818527222, -1.884181022644043, -1.8147306442260742, -1.7452802658081055, -1.6758298873901367, -1.606379508972168, -1.5369292497634888, -1.46747887134552, -1.3980284929275513, -1.328578233718872, -1.2591278553009033, -1.1896774768829346, -1.1202270984649658, -1.050776720046997, -0.9813264608383179, -0.9118760824203491, -0.8424257040023804, -0.7729753851890564, -0.7035250663757324, -0.6340746879577637, -0.5646243095397949, -0.49517399072647095, -0.4257236421108246, -0.3562732934951782, -0.28682294487953186, -0.2173725962638855, -0.14792224764823914, -0.07847213745117188, -0.009021788835525513, 0.06042855978012085, 0.1298789083957672, 0.19932925701141357, 0.26877960562705994, 0.3382299542427063, 0.40768030285835266, 0.477130651473999, 0.5465810298919678, 0.6160313487052917, 0.6854816675186157, 0.7549320459365845, 0.8243824243545532, 0.8938327431678772, 0.9632830619812012, 1.03273344039917, 1.1021838188171387, 1.1716341972351074, 1.2410844564437866, 1.3105348348617554, 1.3799852132797241, 1.4494354724884033, 1.518885850906372, 1.5883362293243408, 1.6577866077423096, 1.7272369861602783, 1.7966872453689575, 1.8661376237869263, 1.935588002204895, 2.005038261413574, 2.074488639831543, 2.1439390182495117]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 15.0, 10.0, 12.0, 27.0, 64.0, 108.0, 257.0, 573.0, 1624.0, 5555.0, 23885.0, 124793.0, 564689.0, 264138.0, 48346.0, 10055.0, 2713.0, 908.0, 372.0, 169.0, 98.0, 52.0, 28.0, 17.0, 12.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.455078125, -2.372467041015625, -2.28985595703125, -2.207244873046875, -2.1246337890625, -2.042022705078125, -1.95941162109375, -1.876800537109375, -1.794189453125, -1.711578369140625, -1.62896728515625, -1.546356201171875, -1.4637451171875, -1.381134033203125, -1.29852294921875, -1.215911865234375, -1.13330078125, -1.050689697265625, -0.96807861328125, -0.885467529296875, -0.8028564453125, -0.720245361328125, -0.63763427734375, -0.555023193359375, -0.472412109375, -0.389801025390625, -0.30718994140625, -0.224578857421875, -0.1419677734375, -0.059356689453125, 0.02325439453125, 0.105865478515625, 0.1884765625, 0.271087646484375, 0.35369873046875, 0.436309814453125, 0.5189208984375, 0.601531982421875, 0.68414306640625, 0.766754150390625, 0.849365234375, 0.931976318359375, 1.01458740234375, 1.097198486328125, 1.1798095703125, 1.262420654296875, 1.34503173828125, 1.427642822265625, 1.51025390625, 1.592864990234375, 1.67547607421875, 1.758087158203125, 1.8406982421875, 1.923309326171875, 2.00592041015625, 2.088531494140625, 2.171142578125, 2.253753662109375, 2.33636474609375, 2.418975830078125, 2.5015869140625, 2.584197998046875, 2.66680908203125, 2.749420166015625, 2.83203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 14.0, 7.0, 18.0, 27.0, 35.0, 32.0, 27.0, 43.0, 58.0, 65.0, 53.0, 50.0, 51.0, 67.0, 58.0, 53.0, 58.0, 37.0, 38.0, 33.0, 22.0, 28.0, 14.0, 19.0, 18.0, 10.0, 4.0, 1.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8361892700195312, -0.8125152587890625, -0.7888412475585938, -0.765167236328125, -0.7414932250976562, -0.7178192138671875, -0.6941452026367188, -0.67047119140625, -0.6467971801757812, -0.6231231689453125, -0.5994491577148438, -0.575775146484375, -0.5521011352539062, -0.5284271240234375, -0.5047531127929688, -0.4810791015625, -0.45740509033203125, -0.4337310791015625, -0.41005706787109375, -0.386383056640625, -0.36270904541015625, -0.3390350341796875, -0.31536102294921875, -0.29168701171875, -0.26801300048828125, -0.2443389892578125, -0.22066497802734375, -0.196990966796875, -0.17331695556640625, -0.1496429443359375, -0.12596893310546875, -0.102294921875, -0.07862091064453125, -0.0549468994140625, -0.03127288818359375, -0.007598876953125, 0.01607513427734375, 0.0397491455078125, 0.06342315673828125, 0.08709716796875, 0.11077117919921875, 0.1344451904296875, 0.15811920166015625, 0.181793212890625, 0.20546722412109375, 0.2291412353515625, 0.25281524658203125, 0.2764892578125, 0.30016326904296875, 0.3238372802734375, 0.34751129150390625, 0.371185302734375, 0.39485931396484375, 0.4185333251953125, 0.44220733642578125, 0.46588134765625, 0.48955535888671875, 0.5132293701171875, 0.5369033813476562, 0.560577392578125, 0.5842514038085938, 0.6079254150390625, 0.6315994262695312, 0.6552734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 9.0, 15.0, 27.0, 55.0, 81.0, 181.0, 476.0, 1748.0, 22689.0, 1003416.0, 17350.0, 1595.0, 464.0, 181.0, 100.0, 45.0, 25.0, 17.0, 14.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4002685546875, -8.105224609375, -7.8101806640625, -7.51513671875, -7.2200927734375, -6.925048828125, -6.6300048828125, -6.3349609375, -6.0399169921875, -5.744873046875, -5.4498291015625, -5.15478515625, -4.8597412109375, -4.564697265625, -4.2696533203125, -3.974609375, -3.6795654296875, -3.384521484375, -3.0894775390625, -2.79443359375, -2.4993896484375, -2.204345703125, -1.9093017578125, -1.6142578125, -1.3192138671875, -1.024169921875, -0.7291259765625, -0.43408203125, -0.1390380859375, 0.156005859375, 0.4510498046875, 0.74609375, 1.0411376953125, 1.336181640625, 1.6312255859375, 1.92626953125, 2.2213134765625, 2.516357421875, 2.8114013671875, 3.1064453125, 3.4014892578125, 3.696533203125, 3.9915771484375, 4.28662109375, 4.5816650390625, 4.876708984375, 5.1717529296875, 5.466796875, 5.7618408203125, 6.056884765625, 6.3519287109375, 6.64697265625, 6.9420166015625, 7.237060546875, 7.5321044921875, 7.8271484375, 8.1221923828125, 8.417236328125, 8.7122802734375, 9.00732421875, 9.3023681640625, 9.597412109375, 9.8924560546875, 10.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 19.0, 14.0, 15.0, 29.0, 35.0, 39.0, 35.0, 66.0, 59.0, 78.0, 77.0, 65.0, 63.0, 57.0, 47.0, 44.0, 51.0, 38.0, 36.0, 29.0, 22.0, 16.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.753570556640625, -3.63018798828125, -3.506805419921875, -3.3834228515625, -3.260040283203125, -3.13665771484375, -3.013275146484375, -2.889892578125, -2.766510009765625, -2.64312744140625, -2.519744873046875, -2.3963623046875, -2.272979736328125, -2.14959716796875, -2.026214599609375, -1.90283203125, -1.779449462890625, -1.65606689453125, -1.532684326171875, -1.4093017578125, -1.285919189453125, -1.16253662109375, -1.039154052734375, -0.915771484375, -0.792388916015625, -0.66900634765625, -0.545623779296875, -0.4222412109375, -0.298858642578125, -0.17547607421875, -0.052093505859375, 0.0712890625, 0.194671630859375, 0.31805419921875, 0.441436767578125, 0.5648193359375, 0.688201904296875, 0.81158447265625, 0.934967041015625, 1.058349609375, 1.181732177734375, 1.30511474609375, 1.428497314453125, 1.5518798828125, 1.675262451171875, 1.79864501953125, 1.922027587890625, 2.04541015625, 2.168792724609375, 2.29217529296875, 2.415557861328125, 2.5389404296875, 2.662322998046875, 2.78570556640625, 2.909088134765625, 3.032470703125, 3.155853271484375, 3.27923583984375, 3.402618408203125, 3.5260009765625, 3.649383544921875, 3.77276611328125, 3.896148681640625, 4.01953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 11.0, 20.0, 19.0, 25.0, 43.0, 70.0, 98.0, 188.0, 281.0, 489.0, 1016.0, 2504.0, 8414.0, 42242.0, 342789.0, 569288.0, 63948.0, 11338.0, 3165.0, 1191.0, 556.0, 310.0, 166.0, 101.0, 79.0, 51.0, 38.0, 26.0, 23.0, 14.0, 9.0, 9.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.5283203125, -1.4911422729492188, -1.4539642333984375, -1.4167861938476562, -1.379608154296875, -1.3424301147460938, -1.3052520751953125, -1.2680740356445312, -1.23089599609375, -1.1937179565429688, -1.1565399169921875, -1.1193618774414062, -1.082183837890625, -1.0450057983398438, -1.0078277587890625, -0.9706497192382812, -0.9334716796875, -0.8962936401367188, -0.8591156005859375, -0.8219375610351562, -0.784759521484375, -0.7475814819335938, -0.7104034423828125, -0.6732254028320312, -0.63604736328125, -0.5988693237304688, -0.5616912841796875, -0.5245132446289062, -0.487335205078125, -0.45015716552734375, -0.4129791259765625, -0.37580108642578125, -0.338623046875, -0.30144500732421875, -0.2642669677734375, -0.22708892822265625, -0.189910888671875, -0.15273284912109375, -0.1155548095703125, -0.07837677001953125, -0.04119873046875, -0.00402069091796875, 0.0331573486328125, 0.07033538818359375, 0.107513427734375, 0.14469146728515625, 0.1818695068359375, 0.21904754638671875, 0.2562255859375, 0.29340362548828125, 0.3305816650390625, 0.36775970458984375, 0.404937744140625, 0.44211578369140625, 0.4792938232421875, 0.5164718627929688, 0.55364990234375, 0.5908279418945312, 0.6280059814453125, 0.6651840209960938, 0.702362060546875, 0.7395401000976562, 0.7767181396484375, 0.8138961791992188, 0.85107421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 11.0, 20.0, 16.0, 18.0, 24.0, 28.0, 35.0, 44.0, 48.0, 71.0, 123.0, 137.0, 105.0, 48.0, 50.0, 37.0, 34.0, 23.0, 23.0, 22.0, 19.0, 13.0, 8.0, 11.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.00021397322416305542, -0.00020645558834075928, -0.00019893795251846313, -0.000191420316696167, -0.00018390268087387085, -0.0001763850450515747, -0.00016886740922927856, -0.00016134977340698242, -0.00015383213758468628, -0.00014631450176239014, -0.000138796865940094, -0.00013127923011779785, -0.0001237615942955017, -0.00011624395847320557, -0.00010872632265090942, -0.00010120868682861328, -9.369105100631714e-05, -8.6173415184021e-05, -7.865577936172485e-05, -7.113814353942871e-05, -6.362050771713257e-05, -5.6102871894836426e-05, -4.858523607254028e-05, -4.106760025024414e-05, -3.3549964427948e-05, -2.6032328605651855e-05, -1.8514692783355713e-05, -1.099705696105957e-05, -3.4794211387634277e-06, 4.038214683532715e-06, 1.1555850505828857e-05, 1.9073486328125e-05, 2.6591122150421143e-05, 3.4108757972717285e-05, 4.162639379501343e-05, 4.914402961730957e-05, 5.666166543960571e-05, 6.417930126190186e-05, 7.1696937084198e-05, 7.921457290649414e-05, 8.673220872879028e-05, 9.424984455108643e-05, 0.00010176748037338257, 0.00010928511619567871, 0.00011680275201797485, 0.000124320387840271, 0.00013183802366256714, 0.00013935565948486328, 0.00014687329530715942, 0.00015439093112945557, 0.0001619085669517517, 0.00016942620277404785, 0.000176943838596344, 0.00018446147441864014, 0.00019197911024093628, 0.00019949674606323242, 0.00020701438188552856, 0.0002145320177078247, 0.00022204965353012085, 0.000229567289352417, 0.00023708492517471313, 0.0002446025609970093, 0.0002521201968193054, 0.00025963783264160156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 9.0, 10.0, 20.0, 32.0, 49.0, 72.0, 131.0, 208.0, 348.0, 700.0, 1546.0, 4698.0, 25189.0, 286649.0, 660356.0, 56071.0, 8143.0, 2218.0, 971.0, 443.0, 240.0, 142.0, 99.0, 59.0, 31.0, 28.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.2458343505859375, -1.201629638671875, -1.1574249267578125, -1.11322021484375, -1.0690155029296875, -1.024810791015625, -0.9806060791015625, -0.9364013671875, -0.8921966552734375, -0.847991943359375, -0.8037872314453125, -0.75958251953125, -0.7153778076171875, -0.671173095703125, -0.6269683837890625, -0.582763671875, -0.5385589599609375, -0.494354248046875, -0.4501495361328125, -0.40594482421875, -0.3617401123046875, -0.317535400390625, -0.2733306884765625, -0.2291259765625, -0.1849212646484375, -0.140716552734375, -0.0965118408203125, -0.05230712890625, -0.0081024169921875, 0.036102294921875, 0.0803070068359375, 0.12451171875, 0.1687164306640625, 0.212921142578125, 0.2571258544921875, 0.30133056640625, 0.3455352783203125, 0.389739990234375, 0.4339447021484375, 0.4781494140625, 0.5223541259765625, 0.566558837890625, 0.6107635498046875, 0.65496826171875, 0.6991729736328125, 0.743377685546875, 0.7875823974609375, 0.831787109375, 0.8759918212890625, 0.920196533203125, 0.9644012451171875, 1.00860595703125, 1.0528106689453125, 1.097015380859375, 1.1412200927734375, 1.1854248046875, 1.2296295166015625, 1.273834228515625, 1.3180389404296875, 1.36224365234375, 1.4064483642578125, 1.450653076171875, 1.4948577880859375, 1.5390625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 8.0, 7.0, 11.0, 16.0, 17.0, 19.0, 21.0, 36.0, 54.0, 51.0, 73.0, 111.0, 94.0, 78.0, 93.0, 72.0, 65.0, 47.0, 37.0, 21.0, 21.0, 16.0, 9.0, 8.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2294921875, -1.194244384765625, -1.15899658203125, -1.123748779296875, -1.0885009765625, -1.053253173828125, -1.01800537109375, -0.982757568359375, -0.947509765625, -0.912261962890625, -0.87701416015625, -0.841766357421875, -0.8065185546875, -0.771270751953125, -0.73602294921875, -0.700775146484375, -0.66552734375, -0.630279541015625, -0.59503173828125, -0.559783935546875, -0.5245361328125, -0.489288330078125, -0.45404052734375, -0.418792724609375, -0.383544921875, -0.348297119140625, -0.31304931640625, -0.277801513671875, -0.2425537109375, -0.207305908203125, -0.17205810546875, -0.136810302734375, -0.1015625, -0.066314697265625, -0.03106689453125, 0.004180908203125, 0.0394287109375, 0.074676513671875, 0.10992431640625, 0.145172119140625, 0.180419921875, 0.215667724609375, 0.25091552734375, 0.286163330078125, 0.3214111328125, 0.356658935546875, 0.39190673828125, 0.427154541015625, 0.46240234375, 0.497650146484375, 0.53289794921875, 0.568145751953125, 0.6033935546875, 0.638641357421875, 0.67388916015625, 0.709136962890625, 0.744384765625, 0.779632568359375, 0.81488037109375, 0.850128173828125, 0.8853759765625, 0.920623779296875, 0.95587158203125, 0.991119384765625, 1.0263671875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 13.0, 17.0, 35.0, 69.0, 104.0, 148.0, 161.0, 170.0, 97.0, 75.0, 36.0, 24.0, 9.0, 12.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.929759979248047, -22.264568328857422, -21.59937858581543, -20.934186935424805, -20.26899528503418, -19.603803634643555, -18.938613891601562, -18.273422241210938, -17.608230590820312, -16.943038940429688, -16.277849197387695, -15.61265754699707, -14.947465896606445, -14.282275199890137, -13.617084503173828, -12.951892852783203, -12.286702156066895, -11.621511459350586, -10.956319808959961, -10.291129112243652, -9.625937461853027, -8.960746765136719, -8.295555114746094, -7.630364418029785, -6.965173244476318, -6.299982070922852, -5.634790897369385, -4.969599723815918, -4.304409027099609, -3.6392176151275635, -2.974026679992676, -2.308835506439209, -1.6436443328857422, -0.9784532189369202, -0.31326210498809814, 0.3519289493560791, 1.017120122909546, 1.6823112964630127, 2.3475022315979004, 3.012693405151367, 3.677884578704834, 4.343075752258301, 5.008266925811768, 5.673458099365234, 6.338648796081543, 7.003840446472168, 7.669031143188477, 8.334222793579102, 8.99941349029541, 9.664604187011719, 10.329795837402344, 10.994986534118652, 11.660178184509277, 12.325368881225586, 12.990560531616211, 13.65575122833252, 14.320941925048828, 14.986132621765137, 15.651324272155762, 16.31651496887207, 16.981706619262695, 17.64689826965332, 18.312088012695312, 18.977279663085938, 19.642471313476562]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 11.0, 13.0, 15.0, 26.0, 21.0, 23.0, 18.0, 32.0, 32.0, 38.0, 48.0, 33.0, 46.0, 46.0, 51.0, 55.0, 71.0, 47.0, 37.0, 45.0, 45.0, 33.0, 27.0, 24.0, 32.0, 23.0, 19.0, 18.0, 14.0, 5.0, 9.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-13.828222274780273, -13.415547370910645, -13.0028715133667, -12.59019660949707, -12.177520751953125, -11.764845848083496, -11.352170944213867, -10.939495086669922, -10.526819229125977, -10.114144325256348, -9.701468467712402, -9.288793563842773, -8.876117706298828, -8.4634428024292, -8.05076789855957, -7.638092041015625, -7.225417137145996, -6.812741756439209, -6.400066375732422, -5.987391471862793, -5.574715614318848, -5.162040710449219, -4.749365329742432, -4.3366899490356445, -3.9240145683288574, -3.5113391876220703, -3.098663806915283, -2.685988664627075, -2.273313283920288, -1.860637903213501, -1.447962760925293, -1.0352873802185059, -0.6226119995117188, -0.20993667840957642, 0.20273864269256592, 0.6154139041900635, 1.0280892848968506, 1.4407646656036377, 1.8534398078918457, 2.266115188598633, 2.67879056930542, 3.091465950012207, 3.504141330718994, 3.916816473007202, 4.32949161529541, 4.7421674728393555, 5.154842376708984, 5.5675177574157715, 5.980193138122559, 6.392868518829346, 6.805543899536133, 7.218218803405762, 7.630894660949707, 8.043569564819336, 8.456245422363281, 8.86892032623291, 9.281595230102539, 9.694270133972168, 10.106945991516113, 10.519620895385742, 10.932296752929688, 11.344971656799316, 11.757646560668945, 12.17032241821289, 12.582998275756836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 7.0, 8.0, 14.0, 14.0, 25.0, 47.0, 43.0, 70.0, 112.0, 133.0, 195.0, 260.0, 421.0, 598.0, 909.0, 1350.0, 1976.0, 3130.0, 5141.0, 8970.0, 16343.0, 33122.0, 77504.0, 235910.0, 1132262.0, 2054868.0, 410295.0, 115654.0, 45366.0, 21129.0, 11221.0, 6371.0, 3685.0, 2358.0, 1538.0, 1037.0, 675.0, 456.0, 293.0, 238.0, 150.0, 124.0, 83.0, 44.0, 41.0, 31.0, 18.0, 7.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.75537109375, -0.7319107055664062, -0.7084503173828125, -0.6849899291992188, -0.661529541015625, -0.6380691528320312, -0.6146087646484375, -0.5911483764648438, -0.56768798828125, -0.5442276000976562, -0.5207672119140625, -0.49730682373046875, -0.473846435546875, -0.45038604736328125, -0.4269256591796875, -0.40346527099609375, -0.3800048828125, -0.35654449462890625, -0.3330841064453125, -0.30962371826171875, -0.286163330078125, -0.26270294189453125, -0.2392425537109375, -0.21578216552734375, -0.19232177734375, -0.16886138916015625, -0.1454010009765625, -0.12194061279296875, -0.098480224609375, -0.07501983642578125, -0.0515594482421875, -0.02809906005859375, -0.004638671875, 0.01882171630859375, 0.0422821044921875, 0.06574249267578125, 0.089202880859375, 0.11266326904296875, 0.1361236572265625, 0.15958404541015625, 0.18304443359375, 0.20650482177734375, 0.2299652099609375, 0.25342559814453125, 0.276885986328125, 0.30034637451171875, 0.3238067626953125, 0.34726715087890625, 0.3707275390625, 0.39418792724609375, 0.4176483154296875, 0.44110870361328125, 0.464569091796875, 0.48802947998046875, 0.5114898681640625, 0.5349502563476562, 0.55841064453125, 0.5818710327148438, 0.6053314208984375, 0.6287918090820312, 0.652252197265625, 0.6757125854492188, 0.6991729736328125, 0.7226333618164062, 0.74609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 12.0, 14.0, 19.0, 29.0, 25.0, 59.0, 39.0, 48.0, 68.0, 65.0, 70.0, 74.0, 85.0, 69.0, 46.0, 59.0, 44.0, 35.0, 26.0, 26.0, 16.0, 12.0, 10.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330078125, -0.8062744140625, -0.779541015625, -0.7528076171875, -0.72607421875, -0.6993408203125, -0.672607421875, -0.6458740234375, -0.619140625, -0.5924072265625, -0.565673828125, -0.5389404296875, -0.51220703125, -0.4854736328125, -0.458740234375, -0.4320068359375, -0.4052734375, -0.3785400390625, -0.351806640625, -0.3250732421875, -0.29833984375, -0.2716064453125, -0.244873046875, -0.2181396484375, -0.19140625, -0.1646728515625, -0.137939453125, -0.1112060546875, -0.08447265625, -0.0577392578125, -0.031005859375, -0.0042724609375, 0.0224609375, 0.0491943359375, 0.075927734375, 0.1026611328125, 0.12939453125, 0.1561279296875, 0.182861328125, 0.2095947265625, 0.236328125, 0.2630615234375, 0.289794921875, 0.3165283203125, 0.34326171875, 0.3699951171875, 0.396728515625, 0.4234619140625, 0.4501953125, 0.4769287109375, 0.503662109375, 0.5303955078125, 0.55712890625, 0.5838623046875, 0.610595703125, 0.6373291015625, 0.6640625, 0.6907958984375, 0.717529296875, 0.7442626953125, 0.77099609375, 0.7977294921875, 0.824462890625, 0.8511962890625, 0.8779296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 8.0, 20.0, 21.0, 34.0, 56.0, 73.0, 116.0, 239.0, 468.0, 977.0, 2542.0, 7242.0, 27044.0, 148895.0, 2803044.0, 1091945.0, 84611.0, 18094.0, 5238.0, 1835.0, 813.0, 390.0, 193.0, 134.0, 71.0, 45.0, 34.0, 17.0, 23.0, 8.0, 8.0, 6.0, 9.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.816986083984375, -1.75994873046875, -1.702911376953125, -1.6458740234375, -1.588836669921875, -1.53179931640625, -1.474761962890625, -1.417724609375, -1.360687255859375, -1.30364990234375, -1.246612548828125, -1.1895751953125, -1.132537841796875, -1.07550048828125, -1.018463134765625, -0.96142578125, -0.904388427734375, -0.84735107421875, -0.790313720703125, -0.7332763671875, -0.676239013671875, -0.61920166015625, -0.562164306640625, -0.505126953125, -0.448089599609375, -0.39105224609375, -0.334014892578125, -0.2769775390625, -0.219940185546875, -0.16290283203125, -0.105865478515625, -0.048828125, 0.008209228515625, 0.06524658203125, 0.122283935546875, 0.1793212890625, 0.236358642578125, 0.29339599609375, 0.350433349609375, 0.407470703125, 0.464508056640625, 0.52154541015625, 0.578582763671875, 0.6356201171875, 0.692657470703125, 0.74969482421875, 0.806732177734375, 0.86376953125, 0.920806884765625, 0.97784423828125, 1.034881591796875, 1.0919189453125, 1.148956298828125, 1.20599365234375, 1.263031005859375, 1.320068359375, 1.377105712890625, 1.43414306640625, 1.491180419921875, 1.5482177734375, 1.605255126953125, 1.66229248046875, 1.719329833984375, 1.7763671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 1.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 18.0, 16.0, 26.0, 47.0, 56.0, 85.0, 132.0, 197.0, 341.0, 632.0, 879.0, 634.0, 333.0, 218.0, 134.0, 84.0, 48.0, 38.0, 26.0, 20.0, 14.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4012908935546875, -1.348480224609375, -1.2956695556640625, -1.24285888671875, -1.1900482177734375, -1.137237548828125, -1.0844268798828125, -1.0316162109375, -0.9788055419921875, -0.925994873046875, -0.8731842041015625, -0.82037353515625, -0.7675628662109375, -0.714752197265625, -0.6619415283203125, -0.609130859375, -0.5563201904296875, -0.503509521484375, -0.4506988525390625, -0.39788818359375, -0.3450775146484375, -0.292266845703125, -0.2394561767578125, -0.1866455078125, -0.1338348388671875, -0.081024169921875, -0.0282135009765625, 0.02459716796875, 0.0774078369140625, 0.130218505859375, 0.1830291748046875, 0.23583984375, 0.2886505126953125, 0.341461181640625, 0.3942718505859375, 0.44708251953125, 0.4998931884765625, 0.552703857421875, 0.6055145263671875, 0.6583251953125, 0.7111358642578125, 0.763946533203125, 0.8167572021484375, 0.86956787109375, 0.9223785400390625, 0.975189208984375, 1.0279998779296875, 1.080810546875, 1.1336212158203125, 1.186431884765625, 1.2392425537109375, 1.29205322265625, 1.3448638916015625, 1.397674560546875, 1.4504852294921875, 1.5032958984375, 1.5561065673828125, 1.608917236328125, 1.6617279052734375, 1.71453857421875, 1.7673492431640625, 1.820159912109375, 1.8729705810546875, 1.92578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 5.0, 13.0, 36.0, 108.0, 235.0, 286.0, 178.0, 70.0, 26.0, 15.0, 9.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.974903106689453, -10.144695281982422, -9.314488410949707, -8.484281539916992, -7.654073715209961, -6.823866367340088, -5.993659019470215, -5.163451671600342, -4.333244323730469, -3.5030369758605957, -2.6728296279907227, -1.8426222801208496, -1.0124149322509766, -0.18220758438110352, 0.6479997634887695, 1.4782071113586426, 2.3084144592285156, 3.1386218070983887, 3.9688291549682617, 4.799036502838135, 5.629243850708008, 6.459451198577881, 7.289658546447754, 8.119865417480469, 8.9500732421875, 9.780281066894531, 10.610487937927246, 11.440694808959961, 12.270902633666992, 13.101110458374023, 13.931317329406738, 14.761524200439453, 15.591732025146484, 16.421939849853516, 17.252147674560547, 18.082353591918945, 18.912561416625977, 19.742769241333008, 20.572975158691406, 21.403182983398438, 22.23339080810547, 23.0635986328125, 23.89380645751953, 24.72401237487793, 25.55422019958496, 26.384428024291992, 27.21463394165039, 28.044841766357422, 28.875049591064453, 29.705257415771484, 30.535465240478516, 31.365671157836914, 32.19587707519531, 33.026084899902344, 33.856292724609375, 34.686500549316406, 35.51670837402344, 36.34691619873047, 37.1771240234375, 38.00733184814453, 38.83753967285156, 39.66774368286133, 40.49795150756836, 41.32815933227539, 42.15836715698242]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 10.0, 14.0, 12.0, 17.0, 19.0, 21.0, 19.0, 27.0, 19.0, 32.0, 45.0, 39.0, 47.0, 47.0, 50.0, 42.0, 36.0, 49.0, 56.0, 46.0, 35.0, 41.0, 42.0, 29.0, 32.0, 30.0, 27.0, 17.0, 17.0, 17.0, 13.0, 13.0, 13.0, 4.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.859951972961426, -6.618941783905029, -6.377931594848633, -6.136921405792236, -5.89591121673584, -5.654901504516602, -5.413890838623047, -5.172881126403809, -4.931870937347412, -4.690860748291016, -4.449850559234619, -4.208840370178223, -3.9678304195404053, -3.726820230484009, -3.4858100414276123, -3.244800090789795, -3.0037896633148193, -2.762779474258423, -2.5217692852020264, -2.280759334564209, -2.0397491455078125, -1.798738956451416, -1.5577287673950195, -1.3167186975479126, -1.0757085084915161, -0.8346983790397644, -0.5936882495880127, -0.3526780605316162, -0.1116679310798645, 0.1293421983718872, 0.3703523874282837, 0.6113624572753906, 0.8523726463317871, 1.0933828353881836, 1.3343929052352905, 1.575403094291687, 1.816413164138794, 2.0574233531951904, 2.298433542251587, 2.5394434928894043, 2.780453681945801, 3.0214638710021973, 3.2624740600585938, 3.5034842491149902, 3.7444941997528076, 3.985504388809204, 4.22651481628418, 4.467524528503418, 4.708535194396973, 4.949545383453369, 5.190555572509766, 5.431565761566162, 5.672575950622559, 5.913585662841797, 6.154596328735352, 6.39560604095459, 6.636616230010986, 6.877626419067383, 7.118636608123779, 7.359646797180176, 7.600656986236572, 7.841667175292969, 8.082676887512207, 8.323687553405762, 8.564697265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 1.0, 7.0, 13.0, 18.0, 53.0, 52.0, 112.0, 205.0, 344.0, 597.0, 1215.0, 2679.0, 6001.0, 14944.0, 41770.0, 144947.0, 549599.0, 201530.0, 52833.0, 18195.0, 7321.0, 2965.0, 1435.0, 765.0, 393.0, 215.0, 128.0, 72.0, 45.0, 34.0, 21.0, 17.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4708709716796875, -1.413421630859375, -1.3559722900390625, -1.29852294921875, -1.2410736083984375, -1.183624267578125, -1.1261749267578125, -1.0687255859375, -1.0112762451171875, -0.953826904296875, -0.8963775634765625, -0.83892822265625, -0.7814788818359375, -0.724029541015625, -0.6665802001953125, -0.609130859375, -0.5516815185546875, -0.494232177734375, -0.4367828369140625, -0.37933349609375, -0.3218841552734375, -0.264434814453125, -0.2069854736328125, -0.1495361328125, -0.0920867919921875, -0.034637451171875, 0.0228118896484375, 0.08026123046875, 0.1377105712890625, 0.195159912109375, 0.2526092529296875, 0.31005859375, 0.3675079345703125, 0.424957275390625, 0.4824066162109375, 0.53985595703125, 0.5973052978515625, 0.654754638671875, 0.7122039794921875, 0.7696533203125, 0.8271026611328125, 0.884552001953125, 0.9420013427734375, 0.99945068359375, 1.0569000244140625, 1.114349365234375, 1.1717987060546875, 1.229248046875, 1.2866973876953125, 1.344146728515625, 1.4015960693359375, 1.45904541015625, 1.5164947509765625, 1.573944091796875, 1.6313934326171875, 1.6888427734375, 1.7462921142578125, 1.803741455078125, 1.8611907958984375, 1.91864013671875, 1.9760894775390625, 2.033538818359375, 2.0909881591796875, 2.1484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 9.0, 10.0, 10.0, 22.0, 15.0, 21.0, 22.0, 33.0, 34.0, 30.0, 44.0, 37.0, 33.0, 62.0, 49.0, 52.0, 46.0, 42.0, 55.0, 52.0, 47.0, 40.0, 32.0, 28.0, 28.0, 25.0, 13.0, 17.0, 15.0, 18.0, 10.0, 13.0, 5.0, 5.0, 3.0, 2.0, 3.0, 7.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67724609375, -0.6573562622070312, -0.6374664306640625, -0.6175765991210938, -0.597686767578125, -0.5777969360351562, -0.5579071044921875, -0.5380172729492188, -0.51812744140625, -0.49823760986328125, -0.4783477783203125, -0.45845794677734375, -0.438568115234375, -0.41867828369140625, -0.3987884521484375, -0.37889862060546875, -0.3590087890625, -0.33911895751953125, -0.3192291259765625, -0.29933929443359375, -0.279449462890625, -0.25955963134765625, -0.2396697998046875, -0.21977996826171875, -0.19989013671875, -0.18000030517578125, -0.1601104736328125, -0.14022064208984375, -0.120330810546875, -0.10044097900390625, -0.0805511474609375, -0.06066131591796875, -0.040771484375, -0.02088165283203125, -0.0009918212890625, 0.01889801025390625, 0.038787841796875, 0.05867767333984375, 0.0785675048828125, 0.09845733642578125, 0.11834716796875, 0.13823699951171875, 0.1581268310546875, 0.17801666259765625, 0.197906494140625, 0.21779632568359375, 0.2376861572265625, 0.25757598876953125, 0.2774658203125, 0.29735565185546875, 0.3172454833984375, 0.33713531494140625, 0.357025146484375, 0.37691497802734375, 0.3968048095703125, 0.41669464111328125, 0.43658447265625, 0.45647430419921875, 0.4763641357421875, 0.49625396728515625, 0.516143798828125, 0.5360336303710938, 0.5559234619140625, 0.5758132934570312, 0.595703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 6.0, 13.0, 19.0, 20.0, 36.0, 57.0, 118.0, 208.0, 466.0, 1408.0, 7093.0, 552672.0, 477241.0, 6860.0, 1326.0, 479.0, 213.0, 112.0, 66.0, 30.0, 27.0, 14.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.628173828125, -7.39697265625, -7.165771484375, -6.9345703125, -6.703369140625, -6.47216796875, -6.240966796875, -6.009765625, -5.778564453125, -5.54736328125, -5.316162109375, -5.0849609375, -4.853759765625, -4.62255859375, -4.391357421875, -4.16015625, -3.928955078125, -3.69775390625, -3.466552734375, -3.2353515625, -3.004150390625, -2.77294921875, -2.541748046875, -2.310546875, -2.079345703125, -1.84814453125, -1.616943359375, -1.3857421875, -1.154541015625, -0.92333984375, -0.692138671875, -0.4609375, -0.229736328125, 0.00146484375, 0.232666015625, 0.4638671875, 0.695068359375, 0.92626953125, 1.157470703125, 1.388671875, 1.619873046875, 1.85107421875, 2.082275390625, 2.3134765625, 2.544677734375, 2.77587890625, 3.007080078125, 3.23828125, 3.469482421875, 3.70068359375, 3.931884765625, 4.1630859375, 4.394287109375, 4.62548828125, 4.856689453125, 5.087890625, 5.319091796875, 5.55029296875, 5.781494140625, 6.0126953125, 6.243896484375, 6.47509765625, 6.706298828125, 6.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 4.0, 7.0, 11.0, 9.0, 12.0, 17.0, 20.0, 24.0, 35.0, 29.0, 35.0, 41.0, 47.0, 33.0, 50.0, 74.0, 54.0, 60.0, 56.0, 46.0, 59.0, 35.0, 31.0, 28.0, 38.0, 31.0, 23.0, 24.0, 17.0, 8.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.80859375, -3.7078857421875, -3.607177734375, -3.5064697265625, -3.40576171875, -3.3050537109375, -3.204345703125, -3.1036376953125, -3.0029296875, -2.9022216796875, -2.801513671875, -2.7008056640625, -2.60009765625, -2.4993896484375, -2.398681640625, -2.2979736328125, -2.197265625, -2.0965576171875, -1.995849609375, -1.8951416015625, -1.79443359375, -1.6937255859375, -1.593017578125, -1.4923095703125, -1.3916015625, -1.2908935546875, -1.190185546875, -1.0894775390625, -0.98876953125, -0.8880615234375, -0.787353515625, -0.6866455078125, -0.5859375, -0.4852294921875, -0.384521484375, -0.2838134765625, -0.18310546875, -0.0823974609375, 0.018310546875, 0.1190185546875, 0.2197265625, 0.3204345703125, 0.421142578125, 0.5218505859375, 0.62255859375, 0.7232666015625, 0.823974609375, 0.9246826171875, 1.025390625, 1.1260986328125, 1.226806640625, 1.3275146484375, 1.42822265625, 1.5289306640625, 1.629638671875, 1.7303466796875, 1.8310546875, 1.9317626953125, 2.032470703125, 2.1331787109375, 2.23388671875, 2.3345947265625, 2.435302734375, 2.5360107421875, 2.63671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 5.0, 10.0, 7.0, 21.0, 27.0, 46.0, 69.0, 146.0, 340.0, 1105.0, 4832.0, 49834.0, 908080.0, 75512.0, 6416.0, 1283.0, 401.0, 183.0, 92.0, 41.0, 25.0, 28.0, 13.0, 6.0, 10.0, 6.0, 3.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.91015625, -2.83660888671875, -2.7630615234375, -2.68951416015625, -2.615966796875, -2.54241943359375, -2.4688720703125, -2.39532470703125, -2.32177734375, -2.24822998046875, -2.1746826171875, -2.10113525390625, -2.027587890625, -1.95404052734375, -1.8804931640625, -1.80694580078125, -1.7333984375, -1.65985107421875, -1.5863037109375, -1.51275634765625, -1.439208984375, -1.36566162109375, -1.2921142578125, -1.21856689453125, -1.14501953125, -1.07147216796875, -0.9979248046875, -0.92437744140625, -0.850830078125, -0.77728271484375, -0.7037353515625, -0.63018798828125, -0.556640625, -0.48309326171875, -0.4095458984375, -0.33599853515625, -0.262451171875, -0.18890380859375, -0.1153564453125, -0.04180908203125, 0.03173828125, 0.10528564453125, 0.1788330078125, 0.25238037109375, 0.325927734375, 0.39947509765625, 0.4730224609375, 0.54656982421875, 0.6201171875, 0.69366455078125, 0.7672119140625, 0.84075927734375, 0.914306640625, 0.98785400390625, 1.0614013671875, 1.13494873046875, 1.20849609375, 1.28204345703125, 1.3555908203125, 1.42913818359375, 1.502685546875, 1.57623291015625, 1.6497802734375, 1.72332763671875, 1.796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 11.0, 6.0, 11.0, 23.0, 20.0, 44.0, 63.0, 121.0, 315.0, 172.0, 64.0, 39.0, 41.0, 28.0, 16.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004794597625732422, -0.0004647783935070038, -0.0004500970244407654, -0.000435415655374527, -0.0004207342863082886, -0.00040605291724205017, -0.00039137154817581177, -0.00037669017910957336, -0.00036200881004333496, -0.00034732744097709656, -0.00033264607191085815, -0.00031796470284461975, -0.00030328333377838135, -0.00028860196471214294, -0.00027392059564590454, -0.00025923922657966614, -0.00024455785751342773, -0.00022987648844718933, -0.00021519511938095093, -0.00020051375031471252, -0.00018583238124847412, -0.00017115101218223572, -0.00015646964311599731, -0.0001417882740497589, -0.0001271069049835205, -0.0001124255359172821, -9.77441668510437e-05, -8.30627977848053e-05, -6.83814287185669e-05, -5.370005965232849e-05, -3.901869058609009e-05, -2.4337321519851685e-05, -9.655952453613281e-06, 5.025416612625122e-06, 1.9706785678863525e-05, 3.438815474510193e-05, 4.906952381134033e-05, 6.375089287757874e-05, 7.843226194381714e-05, 9.311363101005554e-05, 0.00010779500007629395, 0.00012247636914253235, 0.00013715773820877075, 0.00015183910727500916, 0.00016652047634124756, 0.00018120184540748596, 0.00019588321447372437, 0.00021056458353996277, 0.00022524595260620117, 0.00023992732167243958, 0.000254608690738678, 0.0002692900598049164, 0.0002839714288711548, 0.0002986527979373932, 0.0003133341670036316, 0.00032801553606987, 0.0003426969051361084, 0.0003573782742023468, 0.0003720596432685852, 0.0003867410123348236, 0.000401422381401062, 0.0004161037504673004, 0.0004307851195335388, 0.0004454664885997772, 0.0004601478576660156]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 14.0, 8.0, 21.0, 27.0, 24.0, 51.0, 83.0, 105.0, 216.0, 390.0, 801.0, 1993.0, 6864.0, 42237.0, 722885.0, 245059.0, 20395.0, 4396.0, 1517.0, 617.0, 327.0, 197.0, 96.0, 65.0, 45.0, 39.0, 18.0, 13.0, 14.0, 6.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5986328125, -1.54840087890625, -1.4981689453125, -1.44793701171875, -1.397705078125, -1.34747314453125, -1.2972412109375, -1.24700927734375, -1.19677734375, -1.14654541015625, -1.0963134765625, -1.04608154296875, -0.995849609375, -0.94561767578125, -0.8953857421875, -0.84515380859375, -0.794921875, -0.74468994140625, -0.6944580078125, -0.64422607421875, -0.593994140625, -0.54376220703125, -0.4935302734375, -0.44329833984375, -0.39306640625, -0.34283447265625, -0.2926025390625, -0.24237060546875, -0.192138671875, -0.14190673828125, -0.0916748046875, -0.04144287109375, 0.0087890625, 0.05902099609375, 0.1092529296875, 0.15948486328125, 0.209716796875, 0.25994873046875, 0.3101806640625, 0.36041259765625, 0.41064453125, 0.46087646484375, 0.5111083984375, 0.56134033203125, 0.611572265625, 0.66180419921875, 0.7120361328125, 0.76226806640625, 0.8125, 0.86273193359375, 0.9129638671875, 0.96319580078125, 1.013427734375, 1.06365966796875, 1.1138916015625, 1.16412353515625, 1.21435546875, 1.26458740234375, 1.3148193359375, 1.36505126953125, 1.415283203125, 1.46551513671875, 1.5157470703125, 1.56597900390625, 1.6162109375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 4.0, 3.0, 10.0, 14.0, 23.0, 34.0, 33.0, 53.0, 55.0, 90.0, 132.0, 144.0, 105.0, 81.0, 56.0, 36.0, 33.0, 21.0, 9.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2060699462890625, -1.163116455078125, -1.1201629638671875, -1.07720947265625, -1.0342559814453125, -0.991302490234375, -0.9483489990234375, -0.9053955078125, -0.8624420166015625, -0.819488525390625, -0.7765350341796875, -0.73358154296875, -0.6906280517578125, -0.647674560546875, -0.6047210693359375, -0.561767578125, -0.5188140869140625, -0.475860595703125, -0.4329071044921875, -0.38995361328125, -0.3470001220703125, -0.304046630859375, -0.2610931396484375, -0.2181396484375, -0.1751861572265625, -0.132232666015625, -0.0892791748046875, -0.04632568359375, -0.0033721923828125, 0.039581298828125, 0.0825347900390625, 0.12548828125, 0.1684417724609375, 0.211395263671875, 0.2543487548828125, 0.29730224609375, 0.3402557373046875, 0.383209228515625, 0.4261627197265625, 0.4691162109375, 0.5120697021484375, 0.555023193359375, 0.5979766845703125, 0.64093017578125, 0.6838836669921875, 0.726837158203125, 0.7697906494140625, 0.812744140625, 0.8556976318359375, 0.898651123046875, 0.9416046142578125, 0.98455810546875, 1.0275115966796875, 1.070465087890625, 1.1134185791015625, 1.1563720703125, 1.1993255615234375, 1.242279052734375, 1.2852325439453125, 1.32818603515625, 1.3711395263671875, 1.414093017578125, 1.4570465087890625, 1.5]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 2.0, 5.0, 19.0, 37.0, 62.0, 146.0, 232.0, 195.0, 150.0, 68.0, 31.0, 14.0, 7.0, 10.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.755178451538086, -13.96750545501709, -13.17983341217041, -12.392160415649414, -11.604488372802734, -10.816815376281738, -10.029142379760742, -9.241470336914062, -8.453797340393066, -7.6661248207092285, -6.878452301025391, -6.0907793045043945, -5.303106784820557, -4.515434265136719, -3.7277612686157227, -2.9400887489318848, -2.152416229248047, -1.3647435903549194, -0.577070951461792, 0.210601806640625, 0.9982743263244629, 1.7859468460083008, 2.573619842529297, 3.3612923622131348, 4.148964881896973, 4.9366374015808105, 5.724309921264648, 6.5119829177856445, 7.299655437469482, 8.08732795715332, 8.875000953674316, 9.662673950195312, 10.45034408569336, 11.238017082214355, 12.025689125061035, 12.813362121582031, 13.601034164428711, 14.388707160949707, 15.176380157470703, 15.964052200317383, 16.751724243164062, 17.539396286010742, 18.327070236206055, 19.114742279052734, 19.902414321899414, 20.690086364746094, 21.477760314941406, 22.265432357788086, 23.0531063079834, 23.840778350830078, 24.62845230102539, 25.41612434387207, 26.20379638671875, 26.991470336914062, 27.779142379760742, 28.566814422607422, 29.354488372802734, 30.142160415649414, 30.929834365844727, 31.717506408691406, 32.50518035888672, 33.292850494384766, 34.08052444458008, 34.86819839477539, 35.65586853027344]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 9.0, 13.0, 14.0, 9.0, 22.0, 25.0, 27.0, 28.0, 41.0, 29.0, 39.0, 47.0, 36.0, 53.0, 57.0, 67.0, 51.0, 55.0, 44.0, 45.0, 43.0, 33.0, 22.0, 28.0, 20.0, 22.0, 22.0, 16.0, 13.0, 16.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.940229415893555, -11.576400756835938, -11.21257209777832, -10.848743438720703, -10.484914779663086, -10.121086120605469, -9.757257461547852, -9.393428802490234, -9.029600143432617, -8.665771484375, -8.301942825317383, -7.938114166259766, -7.574285507202148, -7.210456848144531, -6.846628189086914, -6.482799530029297, -6.118971347808838, -5.755142688751221, -5.3913140296936035, -5.027485370635986, -4.663656711578369, -4.299828052520752, -3.935999631881714, -3.5721709728240967, -3.2083423137664795, -2.8445136547088623, -2.480684995651245, -2.116856575012207, -1.7530277967453003, -1.389199137687683, -1.0253705978393555, -0.6615419387817383, -0.2977132797241211, 0.0661153495311737, 0.4299439787864685, 0.7937725782394409, 1.157601237297058, 1.5214298963546753, 1.885258436203003, 2.24908709526062, 2.6129157543182373, 2.9767444133758545, 3.3405730724334717, 3.7044014930725098, 4.068230152130127, 4.432058811187744, 4.795887470245361, 5.1597161293029785, 5.523544788360596, 5.887373447418213, 6.25120210647583, 6.615030765533447, 6.9788594245910645, 7.342688083648682, 7.706516265869141, 8.070344924926758, 8.434173583984375, 8.798002243041992, 9.16183090209961, 9.525659561157227, 9.889488220214844, 10.253316879272461, 10.617145538330078, 10.980974197387695, 11.344802856445312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 9.0, 13.0, 14.0, 28.0, 47.0, 52.0, 104.0, 226.0, 818.0, 22559.0, 4139402.0, 29655.0, 869.0, 209.0, 100.0, 48.0, 45.0, 28.0, 18.0, 16.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.9129638671875, -4.712646484375, -4.5123291015625, -4.31201171875, -4.1116943359375, -3.911376953125, -3.7110595703125, -3.5107421875, -3.3104248046875, -3.110107421875, -2.9097900390625, -2.70947265625, -2.5091552734375, -2.308837890625, -2.1085205078125, -1.908203125, -1.7078857421875, -1.507568359375, -1.3072509765625, -1.10693359375, -0.9066162109375, -0.706298828125, -0.5059814453125, -0.3056640625, -0.1053466796875, 0.094970703125, 0.2952880859375, 0.49560546875, 0.6959228515625, 0.896240234375, 1.0965576171875, 1.296875, 1.4971923828125, 1.697509765625, 1.8978271484375, 2.09814453125, 2.2984619140625, 2.498779296875, 2.6990966796875, 2.8994140625, 3.0997314453125, 3.300048828125, 3.5003662109375, 3.70068359375, 3.9010009765625, 4.101318359375, 4.3016357421875, 4.501953125, 4.7022705078125, 4.902587890625, 5.1029052734375, 5.30322265625, 5.5035400390625, 5.703857421875, 5.9041748046875, 6.1044921875, 6.3048095703125, 6.505126953125, 6.7054443359375, 6.90576171875, 7.1060791015625, 7.306396484375, 7.5067138671875, 7.70703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 12.0, 14.0, 20.0, 18.0, 27.0, 35.0, 29.0, 51.0, 53.0, 58.0, 65.0, 77.0, 74.0, 77.0, 64.0, 67.0, 52.0, 50.0, 30.0, 32.0, 25.0, 17.0, 12.0, 14.0, 11.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1552734375, -1.12725830078125, -1.0992431640625, -1.07122802734375, -1.043212890625, -1.01519775390625, -0.9871826171875, -0.95916748046875, -0.93115234375, -0.90313720703125, -0.8751220703125, -0.84710693359375, -0.819091796875, -0.79107666015625, -0.7630615234375, -0.73504638671875, -0.70703125, -0.67901611328125, -0.6510009765625, -0.62298583984375, -0.594970703125, -0.56695556640625, -0.5389404296875, -0.51092529296875, -0.48291015625, -0.45489501953125, -0.4268798828125, -0.39886474609375, -0.370849609375, -0.34283447265625, -0.3148193359375, -0.28680419921875, -0.2587890625, -0.23077392578125, -0.2027587890625, -0.17474365234375, -0.146728515625, -0.11871337890625, -0.0906982421875, -0.06268310546875, -0.03466796875, -0.00665283203125, 0.0213623046875, 0.04937744140625, 0.077392578125, 0.10540771484375, 0.1334228515625, 0.16143798828125, 0.189453125, 0.21746826171875, 0.2454833984375, 0.27349853515625, 0.301513671875, 0.32952880859375, 0.3575439453125, 0.38555908203125, 0.41357421875, 0.44158935546875, 0.4696044921875, 0.49761962890625, 0.525634765625, 0.55364990234375, 0.5816650390625, 0.60968017578125, 0.6376953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 3.0, 10.0, 13.0, 19.0, 15.0, 40.0, 37.0, 77.0, 117.0, 145.0, 268.0, 511.0, 908.0, 1694.0, 3597.0, 8757.0, 22782.0, 74264.0, 418929.0, 2938698.0, 590646.0, 90557.0, 25883.0, 9273.0, 3692.0, 1576.0, 756.0, 419.0, 222.0, 121.0, 76.0, 43.0, 40.0, 25.0, 17.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4501953125, -1.4082489013671875, -1.366302490234375, -1.3243560791015625, -1.28240966796875, -1.2404632568359375, -1.198516845703125, -1.1565704345703125, -1.1146240234375, -1.0726776123046875, -1.030731201171875, -0.9887847900390625, -0.94683837890625, -0.9048919677734375, -0.862945556640625, -0.8209991455078125, -0.779052734375, -0.7371063232421875, -0.695159912109375, -0.6532135009765625, -0.61126708984375, -0.5693206787109375, -0.527374267578125, -0.4854278564453125, -0.4434814453125, -0.4015350341796875, -0.359588623046875, -0.3176422119140625, -0.27569580078125, -0.2337493896484375, -0.191802978515625, -0.1498565673828125, -0.10791015625, -0.0659637451171875, -0.024017333984375, 0.0179290771484375, 0.05987548828125, 0.1018218994140625, 0.143768310546875, 0.1857147216796875, 0.2276611328125, 0.2696075439453125, 0.311553955078125, 0.3535003662109375, 0.39544677734375, 0.4373931884765625, 0.479339599609375, 0.5212860107421875, 0.563232421875, 0.6051788330078125, 0.647125244140625, 0.6890716552734375, 0.73101806640625, 0.7729644775390625, 0.814910888671875, 0.8568572998046875, 0.8988037109375, 0.9407501220703125, 0.982696533203125, 1.0246429443359375, 1.06658935546875, 1.1085357666015625, 1.150482177734375, 1.1924285888671875, 1.234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 13.0, 5.0, 12.0, 15.0, 22.0, 28.0, 47.0, 62.0, 85.0, 138.0, 241.0, 412.0, 695.0, 801.0, 590.0, 309.0, 185.0, 120.0, 79.0, 40.0, 42.0, 23.0, 20.0, 18.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.9755859375, -1.9277496337890625, -1.879913330078125, -1.8320770263671875, -1.78424072265625, -1.7364044189453125, -1.688568115234375, -1.6407318115234375, -1.5928955078125, -1.5450592041015625, -1.497222900390625, -1.4493865966796875, -1.40155029296875, -1.3537139892578125, -1.305877685546875, -1.2580413818359375, -1.210205078125, -1.1623687744140625, -1.114532470703125, -1.0666961669921875, -1.01885986328125, -0.9710235595703125, -0.923187255859375, -0.8753509521484375, -0.8275146484375, -0.7796783447265625, -0.731842041015625, -0.6840057373046875, -0.63616943359375, -0.5883331298828125, -0.540496826171875, -0.4926605224609375, -0.44482421875, -0.3969879150390625, -0.349151611328125, -0.3013153076171875, -0.25347900390625, -0.2056427001953125, -0.157806396484375, -0.1099700927734375, -0.0621337890625, -0.0142974853515625, 0.033538818359375, 0.0813751220703125, 0.12921142578125, 0.1770477294921875, 0.224884033203125, 0.2727203369140625, 0.320556640625, 0.3683929443359375, 0.416229248046875, 0.4640655517578125, 0.51190185546875, 0.5597381591796875, 0.607574462890625, 0.6554107666015625, 0.7032470703125, 0.7510833740234375, 0.798919677734375, 0.8467559814453125, 0.89459228515625, 0.9424285888671875, 0.990264892578125, 1.0381011962890625, 1.0859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 15.0, 51.0, 84.0, 193.0, 232.0, 191.0, 109.0, 57.0, 16.0, 6.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.047576904296875, -15.441932678222656, -14.836287498474121, -14.230642318725586, -13.624998092651367, -13.019353866577148, -12.413708686828613, -11.808063507080078, -11.20241928100586, -10.59677505493164, -9.991129875183105, -9.38548469543457, -8.779840469360352, -8.174196243286133, -7.568551063537598, -6.962906360626221, -6.357261657714844, -5.751616954803467, -5.14597225189209, -4.540327548980713, -3.934682846069336, -3.329038143157959, -2.723393440246582, -2.117748737335205, -1.5121040344238281, -0.9064593315124512, -0.3008146286010742, 0.30483007431030273, 0.9104747772216797, 1.5161194801330566, 2.1217641830444336, 2.7274088859558105, 3.3330535888671875, 3.9386982917785645, 4.544342994689941, 5.149987697601318, 5.755632400512695, 6.361277103424072, 6.966921806335449, 7.572566509246826, 8.178211212158203, 8.783855438232422, 9.389500617980957, 9.995145797729492, 10.600790023803711, 11.20643424987793, 11.812079429626465, 12.417724609375, 13.023368835449219, 13.629013061523438, 14.234658241271973, 14.840303421020508, 15.445947647094727, 16.051591873168945, 16.657238006591797, 17.262882232666016, 17.868526458740234, 18.474170684814453, 19.079814910888672, 19.685461044311523, 20.291105270385742, 20.89674949645996, 21.502395629882812, 22.10803985595703, 22.71368408203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 13.0, 8.0, 10.0, 15.0, 11.0, 17.0, 19.0, 28.0, 43.0, 33.0, 52.0, 35.0, 45.0, 48.0, 62.0, 66.0, 49.0, 56.0, 57.0, 34.0, 47.0, 43.0, 35.0, 30.0, 22.0, 26.0, 28.0, 14.0, 14.0, 16.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.916929244995117, -10.637404441833496, -10.357879638671875, -10.078353881835938, -9.798829078674316, -9.519304275512695, -9.239779472351074, -8.960254669189453, -8.680729866027832, -8.401205062866211, -8.12168025970459, -7.8421549797058105, -7.5626301765441895, -7.28310489654541, -7.003580093383789, -6.724055290222168, -6.444530010223389, -6.165005207061768, -5.885479927062988, -5.605955123901367, -5.326430320739746, -5.046905517578125, -4.767380237579346, -4.487855434417725, -4.208330154418945, -3.928805112838745, -3.649280309677124, -3.369755268096924, -3.0902304649353027, -2.8107054233551025, -2.5311803817749023, -2.2516555786132812, -1.9721307754516602, -1.6926058530807495, -1.4130809307098389, -1.1335558891296387, -0.854030966758728, -0.5745060443878174, -0.2949810028076172, -0.015456080436706543, 0.2640688419342041, 0.5435937643051147, 0.8231187462806702, 1.1026437282562256, 1.3821686506271362, 1.6616935729980469, 1.941218614578247, 2.2207436561584473, 2.5002684593200684, 2.7797935009002686, 3.0593183040618896, 3.33884334564209, 3.618368148803711, 3.897893190383911, 4.177418231964111, 4.456943035125732, 4.736468315124512, 5.015993118286133, 5.295518398284912, 5.575043201446533, 5.854568004608154, 6.134093284606934, 6.413618087768555, 6.693142890930176, 6.972667694091797]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 8.0, 3.0, 10.0, 10.0, 13.0, 9.0, 20.0, 30.0, 37.0, 65.0, 74.0, 121.0, 201.0, 320.0, 504.0, 778.0, 1467.0, 2499.0, 5045.0, 10663.0, 25166.0, 70875.0, 283482.0, 460373.0, 119792.0, 37640.0, 14904.0, 6586.0, 3332.0, 1781.0, 1048.0, 580.0, 340.0, 248.0, 144.0, 112.0, 82.0, 54.0, 40.0, 27.0, 25.0, 14.0, 8.0, 5.0, 10.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2138671875, -1.16925048828125, -1.1246337890625, -1.08001708984375, -1.035400390625, -0.99078369140625, -0.9461669921875, -0.90155029296875, -0.85693359375, -0.81231689453125, -0.7677001953125, -0.72308349609375, -0.678466796875, -0.63385009765625, -0.5892333984375, -0.54461669921875, -0.5, -0.45538330078125, -0.4107666015625, -0.36614990234375, -0.321533203125, -0.27691650390625, -0.2322998046875, -0.18768310546875, -0.14306640625, -0.09844970703125, -0.0538330078125, -0.00921630859375, 0.035400390625, 0.08001708984375, 0.1246337890625, 0.16925048828125, 0.2138671875, 0.25848388671875, 0.3031005859375, 0.34771728515625, 0.392333984375, 0.43695068359375, 0.4815673828125, 0.52618408203125, 0.57080078125, 0.61541748046875, 0.6600341796875, 0.70465087890625, 0.749267578125, 0.79388427734375, 0.8385009765625, 0.88311767578125, 0.927734375, 0.97235107421875, 1.0169677734375, 1.06158447265625, 1.106201171875, 1.15081787109375, 1.1954345703125, 1.24005126953125, 1.28466796875, 1.32928466796875, 1.3739013671875, 1.41851806640625, 1.463134765625, 1.50775146484375, 1.5523681640625, 1.59698486328125, 1.6416015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 12.0, 10.0, 17.0, 18.0, 19.0, 24.0, 31.0, 38.0, 37.0, 47.0, 46.0, 64.0, 63.0, 54.0, 72.0, 52.0, 64.0, 64.0, 46.0, 44.0, 28.0, 37.0, 21.0, 20.0, 14.0, 12.0, 13.0, 11.0, 5.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.98583984375, -0.9606170654296875, -0.935394287109375, -0.9101715087890625, -0.88494873046875, -0.8597259521484375, -0.834503173828125, -0.8092803955078125, -0.7840576171875, -0.7588348388671875, -0.733612060546875, -0.7083892822265625, -0.68316650390625, -0.6579437255859375, -0.632720947265625, -0.6074981689453125, -0.582275390625, -0.5570526123046875, -0.531829833984375, -0.5066070556640625, -0.48138427734375, -0.4561614990234375, -0.430938720703125, -0.4057159423828125, -0.3804931640625, -0.3552703857421875, -0.330047607421875, -0.3048248291015625, -0.27960205078125, -0.2543792724609375, -0.229156494140625, -0.2039337158203125, -0.1787109375, -0.1534881591796875, -0.128265380859375, -0.1030426025390625, -0.07781982421875, -0.0525970458984375, -0.027374267578125, -0.0021514892578125, 0.0230712890625, 0.0482940673828125, 0.073516845703125, 0.0987396240234375, 0.12396240234375, 0.1491851806640625, 0.174407958984375, 0.1996307373046875, 0.224853515625, 0.2500762939453125, 0.275299072265625, 0.3005218505859375, 0.32574462890625, 0.3509674072265625, 0.376190185546875, 0.4014129638671875, 0.4266357421875, 0.4518585205078125, 0.477081298828125, 0.5023040771484375, 0.52752685546875, 0.5527496337890625, 0.577972412109375, 0.6031951904296875, 0.62841796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 5.0, 12.0, 13.0, 26.0, 42.0, 72.0, 114.0, 182.0, 308.0, 646.0, 1587.0, 4992.0, 25557.0, 394245.0, 582283.0, 29559.0, 5588.0, 1751.0, 731.0, 353.0, 195.0, 89.0, 71.0, 42.0, 31.0, 16.0, 15.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.81390380859375, -2.7098388671875, -2.60577392578125, -2.501708984375, -2.39764404296875, -2.2935791015625, -2.18951416015625, -2.08544921875, -1.98138427734375, -1.8773193359375, -1.77325439453125, -1.669189453125, -1.56512451171875, -1.4610595703125, -1.35699462890625, -1.2529296875, -1.14886474609375, -1.0447998046875, -0.94073486328125, -0.836669921875, -0.73260498046875, -0.6285400390625, -0.52447509765625, -0.42041015625, -0.31634521484375, -0.2122802734375, -0.10821533203125, -0.004150390625, 0.09991455078125, 0.2039794921875, 0.30804443359375, 0.412109375, 0.51617431640625, 0.6202392578125, 0.72430419921875, 0.828369140625, 0.93243408203125, 1.0364990234375, 1.14056396484375, 1.24462890625, 1.34869384765625, 1.4527587890625, 1.55682373046875, 1.660888671875, 1.76495361328125, 1.8690185546875, 1.97308349609375, 2.0771484375, 2.18121337890625, 2.2852783203125, 2.38934326171875, 2.493408203125, 2.59747314453125, 2.7015380859375, 2.80560302734375, 2.90966796875, 3.01373291015625, 3.1177978515625, 3.22186279296875, 3.325927734375, 3.42999267578125, 3.5340576171875, 3.63812255859375, 3.7421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 7.0, 13.0, 10.0, 18.0, 12.0, 15.0, 23.0, 26.0, 20.0, 37.0, 31.0, 43.0, 47.0, 42.0, 37.0, 46.0, 44.0, 48.0, 54.0, 41.0, 49.0, 54.0, 42.0, 33.0, 32.0, 22.0, 29.0, 16.0, 13.0, 13.0, 15.0, 10.0, 12.0, 10.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.96875, -2.88690185546875, -2.8050537109375, -2.72320556640625, -2.641357421875, -2.55950927734375, -2.4776611328125, -2.39581298828125, -2.31396484375, -2.23211669921875, -2.1502685546875, -2.06842041015625, -1.986572265625, -1.90472412109375, -1.8228759765625, -1.74102783203125, -1.6591796875, -1.57733154296875, -1.4954833984375, -1.41363525390625, -1.331787109375, -1.24993896484375, -1.1680908203125, -1.08624267578125, -1.00439453125, -0.92254638671875, -0.8406982421875, -0.75885009765625, -0.677001953125, -0.59515380859375, -0.5133056640625, -0.43145751953125, -0.349609375, -0.26776123046875, -0.1859130859375, -0.10406494140625, -0.022216796875, 0.05963134765625, 0.1414794921875, 0.22332763671875, 0.30517578125, 0.38702392578125, 0.4688720703125, 0.55072021484375, 0.632568359375, 0.71441650390625, 0.7962646484375, 0.87811279296875, 0.9599609375, 1.04180908203125, 1.1236572265625, 1.20550537109375, 1.287353515625, 1.36920166015625, 1.4510498046875, 1.53289794921875, 1.61474609375, 1.69659423828125, 1.7784423828125, 1.86029052734375, 1.942138671875, 2.02398681640625, 2.1058349609375, 2.18768310546875, 2.26953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 10.0, 8.0, 11.0, 12.0, 22.0, 34.0, 51.0, 76.0, 137.0, 335.0, 1019.0, 4699.0, 39688.0, 830633.0, 157752.0, 11058.0, 2000.0, 525.0, 203.0, 98.0, 60.0, 33.0, 18.0, 22.0, 14.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.02734375, -1.96539306640625, -1.9034423828125, -1.84149169921875, -1.779541015625, -1.71759033203125, -1.6556396484375, -1.59368896484375, -1.53173828125, -1.46978759765625, -1.4078369140625, -1.34588623046875, -1.283935546875, -1.22198486328125, -1.1600341796875, -1.09808349609375, -1.0361328125, -0.97418212890625, -0.9122314453125, -0.85028076171875, -0.788330078125, -0.72637939453125, -0.6644287109375, -0.60247802734375, -0.54052734375, -0.47857666015625, -0.4166259765625, -0.35467529296875, -0.292724609375, -0.23077392578125, -0.1688232421875, -0.10687255859375, -0.044921875, 0.01702880859375, 0.0789794921875, 0.14093017578125, 0.202880859375, 0.26483154296875, 0.3267822265625, 0.38873291015625, 0.45068359375, 0.51263427734375, 0.5745849609375, 0.63653564453125, 0.698486328125, 0.76043701171875, 0.8223876953125, 0.88433837890625, 0.9462890625, 1.00823974609375, 1.0701904296875, 1.13214111328125, 1.194091796875, 1.25604248046875, 1.3179931640625, 1.37994384765625, 1.44189453125, 1.50384521484375, 1.5657958984375, 1.62774658203125, 1.689697265625, 1.75164794921875, 1.8135986328125, 1.87554931640625, 1.9375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 12.0, 20.0, 38.0, 40.0, 84.0, 206.0, 321.0, 129.0, 55.0, 32.0, 17.0, 12.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034356117248535156, -0.00032738223671913147, -0.0003112033009529114, -0.0002950243651866913, -0.0002788454294204712, -0.0002626664936542511, -0.000246487557888031, -0.0002303086221218109, -0.00021412968635559082, -0.00019795075058937073, -0.00018177181482315063, -0.00016559287905693054, -0.00014941394329071045, -0.00013323500752449036, -0.00011705607175827026, -0.00010087713599205017, -8.469820022583008e-05, -6.851926445960999e-05, -5.234032869338989e-05, -3.61613929271698e-05, -1.9982457160949707e-05, -3.8035213947296143e-06, 1.2375414371490479e-05, 2.855435013771057e-05, 4.4733285903930664e-05, 6.091222167015076e-05, 7.709115743637085e-05, 9.327009320259094e-05, 0.00010944902896881104, 0.00012562796473503113, 0.00014180690050125122, 0.0001579858362674713, 0.0001741647720336914, 0.0001903437077999115, 0.0002065226435661316, 0.00022270157933235168, 0.00023888051509857178, 0.00025505945086479187, 0.00027123838663101196, 0.00028741732239723206, 0.00030359625816345215, 0.00031977519392967224, 0.00033595412969589233, 0.0003521330654621124, 0.0003683120012283325, 0.0003844909369945526, 0.0004006698727607727, 0.0004168488085269928, 0.0004330277442932129, 0.000449206680059433, 0.0004653856158256531, 0.00048156455159187317, 0.0004977434873580933, 0.0005139224231243134, 0.0005301013588905334, 0.0005462802946567535, 0.0005624592304229736, 0.0005786381661891937, 0.0005948171019554138, 0.0006109960377216339, 0.000627174973487854, 0.0006433539092540741, 0.0006595328450202942, 0.0006757117807865143, 0.0006918907165527344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 4.0, 19.0, 14.0, 32.0, 57.0, 70.0, 128.0, 248.0, 477.0, 1076.0, 2567.0, 7646.0, 32759.0, 240377.0, 661993.0, 79172.0, 14585.0, 4243.0, 1550.0, 703.0, 364.0, 186.0, 120.0, 60.0, 38.0, 20.0, 9.0, 6.0, 9.0, 5.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.844085693359375, -0.80926513671875, -0.774444580078125, -0.7396240234375, -0.704803466796875, -0.66998291015625, -0.635162353515625, -0.600341796875, -0.565521240234375, -0.53070068359375, -0.495880126953125, -0.4610595703125, -0.426239013671875, -0.39141845703125, -0.356597900390625, -0.32177734375, -0.286956787109375, -0.25213623046875, -0.217315673828125, -0.1824951171875, -0.147674560546875, -0.11285400390625, -0.078033447265625, -0.043212890625, -0.008392333984375, 0.02642822265625, 0.061248779296875, 0.0960693359375, 0.130889892578125, 0.16571044921875, 0.200531005859375, 0.2353515625, 0.270172119140625, 0.30499267578125, 0.339813232421875, 0.3746337890625, 0.409454345703125, 0.44427490234375, 0.479095458984375, 0.513916015625, 0.548736572265625, 0.58355712890625, 0.618377685546875, 0.6531982421875, 0.688018798828125, 0.72283935546875, 0.757659912109375, 0.79248046875, 0.827301025390625, 0.86212158203125, 0.896942138671875, 0.9317626953125, 0.966583251953125, 1.00140380859375, 1.036224365234375, 1.071044921875, 1.105865478515625, 1.14068603515625, 1.175506591796875, 1.2103271484375, 1.245147705078125, 1.27996826171875, 1.314788818359375, 1.349609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 14.0, 11.0, 9.0, 24.0, 30.0, 36.0, 51.0, 45.0, 78.0, 93.0, 96.0, 104.0, 78.0, 77.0, 61.0, 40.0, 32.0, 34.0, 11.0, 15.0, 14.0, 4.0, 10.0, 9.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2193756103515625, -1.189727783203125, -1.1600799560546875, -1.13043212890625, -1.1007843017578125, -1.071136474609375, -1.0414886474609375, -1.0118408203125, -0.9821929931640625, -0.952545166015625, -0.9228973388671875, -0.89324951171875, -0.8636016845703125, -0.833953857421875, -0.8043060302734375, -0.774658203125, -0.7450103759765625, -0.715362548828125, -0.6857147216796875, -0.65606689453125, -0.6264190673828125, -0.596771240234375, -0.5671234130859375, -0.5374755859375, -0.5078277587890625, -0.478179931640625, -0.4485321044921875, -0.41888427734375, -0.3892364501953125, -0.359588623046875, -0.3299407958984375, -0.30029296875, -0.2706451416015625, -0.240997314453125, -0.2113494873046875, -0.18170166015625, -0.1520538330078125, -0.122406005859375, -0.0927581787109375, -0.0631103515625, -0.0334625244140625, -0.003814697265625, 0.0258331298828125, 0.05548095703125, 0.0851287841796875, 0.114776611328125, 0.1444244384765625, 0.174072265625, 0.2037200927734375, 0.233367919921875, 0.2630157470703125, 0.29266357421875, 0.3223114013671875, 0.351959228515625, 0.3816070556640625, 0.4112548828125, 0.4409027099609375, 0.470550537109375, 0.5001983642578125, 0.52984619140625, 0.5594940185546875, 0.589141845703125, 0.6187896728515625, 0.6484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 20.0, 52.0, 141.0, 264.0, 277.0, 145.0, 48.0, 15.0, 11.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.679428100585938, -28.75617790222168, -27.832927703857422, -26.909677505493164, -25.986427307128906, -25.06317710876465, -24.13992691040039, -23.2166748046875, -22.293426513671875, -21.370176315307617, -20.44692611694336, -19.5236759185791, -18.600425720214844, -17.677175521850586, -16.753925323486328, -15.830674171447754, -14.90742301940918, -13.984172821044922, -13.060922622680664, -12.137672424316406, -11.214422225952148, -10.29117202758789, -9.367920875549316, -8.444670677185059, -7.521420478820801, -6.598170280456543, -5.674920082092285, -4.751669406890869, -3.8284192085266113, -2.9051690101623535, -1.9819183349609375, -1.0586681365966797, -0.1354198455810547, 0.7878304719924927, 1.71108078956604, 2.634331226348877, 3.5575814247131348, 4.480831623077393, 5.404082298278809, 6.327332496643066, 7.250582695007324, 8.173832893371582, 9.09708309173584, 10.020334243774414, 10.943584442138672, 11.86683464050293, 12.790084838867188, 13.713335037231445, 14.636585235595703, 15.559835433959961, 16.48308563232422, 17.406335830688477, 18.329586029052734, 19.252836227416992, 20.17608642578125, 21.09933853149414, 22.022586822509766, 22.945837020874023, 23.86908721923828, 24.79233741760254, 25.715587615966797, 26.638837814331055, 27.562088012695312, 28.485340118408203, 29.40859031677246]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 20.0, 13.0, 16.0, 19.0, 23.0, 24.0, 23.0, 30.0, 31.0, 35.0, 38.0, 38.0, 34.0, 43.0, 55.0, 60.0, 50.0, 53.0, 47.0, 36.0, 28.0, 37.0, 28.0, 18.0, 28.0, 19.0, 19.0, 18.0, 17.0, 14.0, 13.0, 13.0, 8.0, 3.0, 8.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.617690086364746, -10.309447288513184, -10.001205444335938, -9.692962646484375, -9.384719848632812, -9.076478004455566, -8.768235206604004, -8.459993362426758, -8.151750564575195, -7.843508243560791, -7.535265922546387, -7.227023124694824, -6.91878080368042, -6.610538482666016, -6.302295684814453, -5.994053363800049, -5.6858110427856445, -5.37756872177124, -5.069326400756836, -4.761083602905273, -4.452841281890869, -4.144598960876465, -3.8363564014434814, -3.528113842010498, -3.2198715209960938, -2.9116291999816895, -2.603386640548706, -2.2951440811157227, -1.9869017601013184, -1.6786593198776245, -1.3704168796539307, -1.0621743202209473, -0.7539329528808594, -0.4456905126571655, -0.13744807243347168, 0.17079436779022217, 0.479036808013916, 0.7872792482376099, 1.0955216884613037, 1.403764247894287, 1.7120065689086914, 2.0202488899230957, 2.328491449356079, 2.6367340087890625, 2.944976329803467, 3.253218650817871, 3.5614612102508545, 3.869703769683838, 4.177946090698242, 4.4861884117126465, 4.794430732727051, 5.102673530578613, 5.410915851593018, 5.719158172607422, 6.027400970458984, 6.335643291473389, 6.643885612487793, 6.952127933502197, 7.260370254516602, 7.568613052368164, 7.876855373382568, 8.185097694396973, 8.493340492248535, 8.801582336425781, 9.109825134277344]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 49.0, 92.0, 300.0, 1683.0, 14581.0, 312918.0, 3662206.0, 190393.0, 10401.0, 1224.0, 252.0, 90.0, 40.0, 19.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.140716552734375, -2.06268310546875, -1.984649658203125, -1.9066162109375, -1.828582763671875, -1.75054931640625, -1.672515869140625, -1.594482421875, -1.516448974609375, -1.43841552734375, -1.360382080078125, -1.2823486328125, -1.204315185546875, -1.12628173828125, -1.048248291015625, -0.97021484375, -0.892181396484375, -0.81414794921875, -0.736114501953125, -0.6580810546875, -0.580047607421875, -0.50201416015625, -0.423980712890625, -0.345947265625, -0.267913818359375, -0.18988037109375, -0.111846923828125, -0.0338134765625, 0.044219970703125, 0.12225341796875, 0.200286865234375, 0.2783203125, 0.356353759765625, 0.43438720703125, 0.512420654296875, 0.5904541015625, 0.668487548828125, 0.74652099609375, 0.824554443359375, 0.902587890625, 0.980621337890625, 1.05865478515625, 1.136688232421875, 1.2147216796875, 1.292755126953125, 1.37078857421875, 1.448822021484375, 1.52685546875, 1.604888916015625, 1.68292236328125, 1.760955810546875, 1.8389892578125, 1.917022705078125, 1.99505615234375, 2.073089599609375, 2.151123046875, 2.229156494140625, 2.30718994140625, 2.385223388671875, 2.4632568359375, 2.541290283203125, 2.61932373046875, 2.697357177734375, 2.775390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 9.0, 7.0, 11.0, 16.0, 18.0, 25.0, 28.0, 37.0, 53.0, 51.0, 64.0, 76.0, 61.0, 60.0, 77.0, 75.0, 53.0, 55.0, 53.0, 44.0, 33.0, 36.0, 22.0, 15.0, 6.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.220703125, -1.1933059692382812, -1.1659088134765625, -1.1385116577148438, -1.111114501953125, -1.0837173461914062, -1.0563201904296875, -1.0289230346679688, -1.00152587890625, -0.9741287231445312, -0.9467315673828125, -0.9193344116210938, -0.891937255859375, -0.8645401000976562, -0.8371429443359375, -0.8097457885742188, -0.7823486328125, -0.7549514770507812, -0.7275543212890625, -0.7001571655273438, -0.672760009765625, -0.6453628540039062, -0.6179656982421875, -0.5905685424804688, -0.56317138671875, -0.5357742309570312, -0.5083770751953125, -0.48097991943359375, -0.453582763671875, -0.42618560791015625, -0.3987884521484375, -0.37139129638671875, -0.343994140625, -0.31659698486328125, -0.2891998291015625, -0.26180267333984375, -0.234405517578125, -0.20700836181640625, -0.1796112060546875, -0.15221405029296875, -0.12481689453125, -0.09741973876953125, -0.0700225830078125, -0.04262542724609375, -0.015228271484375, 0.01216888427734375, 0.0395660400390625, 0.06696319580078125, 0.0943603515625, 0.12175750732421875, 0.1491546630859375, 0.17655181884765625, 0.203948974609375, 0.23134613037109375, 0.2587432861328125, 0.28614044189453125, 0.31353759765625, 0.34093475341796875, 0.3683319091796875, 0.39572906494140625, 0.423126220703125, 0.45052337646484375, 0.4779205322265625, 0.5053176879882812, 0.53271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 11.0, 11.0, 12.0, 27.0, 34.0, 60.0, 84.0, 130.0, 260.0, 375.0, 709.0, 1446.0, 3359.0, 9659.0, 32762.0, 154350.0, 1412826.0, 2272710.0, 234331.0, 47935.0, 14013.0, 4864.0, 2052.0, 968.0, 494.0, 288.0, 193.0, 92.0, 59.0, 55.0, 32.0, 15.0, 13.0, 15.0, 9.0, 5.0, 5.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.23828125, -1.1926116943359375, -1.146942138671875, -1.1012725830078125, -1.05560302734375, -1.0099334716796875, -0.964263916015625, -0.9185943603515625, -0.8729248046875, -0.8272552490234375, -0.781585693359375, -0.7359161376953125, -0.69024658203125, -0.6445770263671875, -0.598907470703125, -0.5532379150390625, -0.507568359375, -0.4618988037109375, -0.416229248046875, -0.3705596923828125, -0.32489013671875, -0.2792205810546875, -0.233551025390625, -0.1878814697265625, -0.1422119140625, -0.0965423583984375, -0.050872802734375, -0.0052032470703125, 0.04046630859375, 0.0861358642578125, 0.131805419921875, 0.1774749755859375, 0.22314453125, 0.2688140869140625, 0.314483642578125, 0.3601531982421875, 0.40582275390625, 0.4514923095703125, 0.497161865234375, 0.5428314208984375, 0.5885009765625, 0.6341705322265625, 0.679840087890625, 0.7255096435546875, 0.77117919921875, 0.8168487548828125, 0.862518310546875, 0.9081878662109375, 0.953857421875, 0.9995269775390625, 1.045196533203125, 1.0908660888671875, 1.13653564453125, 1.1822052001953125, 1.227874755859375, 1.2735443115234375, 1.3192138671875, 1.3648834228515625, 1.410552978515625, 1.4562225341796875, 1.50189208984375, 1.5475616455078125, 1.593231201171875, 1.6389007568359375, 1.6845703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 12.0, 5.0, 14.0, 24.0, 24.0, 43.0, 76.0, 92.0, 175.0, 257.0, 442.0, 621.0, 736.0, 557.0, 343.0, 219.0, 127.0, 89.0, 63.0, 40.0, 27.0, 24.0, 11.0, 10.0, 7.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.951385498046875, -1.88909912109375, -1.826812744140625, -1.7645263671875, -1.702239990234375, -1.63995361328125, -1.577667236328125, -1.515380859375, -1.453094482421875, -1.39080810546875, -1.328521728515625, -1.2662353515625, -1.203948974609375, -1.14166259765625, -1.079376220703125, -1.01708984375, -0.954803466796875, -0.89251708984375, -0.830230712890625, -0.7679443359375, -0.705657958984375, -0.64337158203125, -0.581085205078125, -0.518798828125, -0.456512451171875, -0.39422607421875, -0.331939697265625, -0.2696533203125, -0.207366943359375, -0.14508056640625, -0.082794189453125, -0.0205078125, 0.041778564453125, 0.10406494140625, 0.166351318359375, 0.2286376953125, 0.290924072265625, 0.35321044921875, 0.415496826171875, 0.477783203125, 0.540069580078125, 0.60235595703125, 0.664642333984375, 0.7269287109375, 0.789215087890625, 0.85150146484375, 0.913787841796875, 0.97607421875, 1.038360595703125, 1.10064697265625, 1.162933349609375, 1.2252197265625, 1.287506103515625, 1.34979248046875, 1.412078857421875, 1.474365234375, 1.536651611328125, 1.59893798828125, 1.661224365234375, 1.7235107421875, 1.785797119140625, 1.84808349609375, 1.910369873046875, 1.97265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 29.0, 81.0, 188.0, 271.0, 203.0, 131.0, 34.0, 18.0, 10.0, 7.0, 3.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.060928344726562, -27.200525283813477, -26.34012222290039, -25.479721069335938, -24.61931800842285, -23.758914947509766, -22.89851188659668, -22.038108825683594, -21.177705764770508, -20.317302703857422, -19.456899642944336, -18.59649658203125, -17.736095428466797, -16.87569236755371, -16.015289306640625, -15.154886245727539, -14.29448413848877, -13.434081077575684, -12.573678970336914, -11.713275909423828, -10.852872848510742, -9.992469787597656, -9.132067680358887, -8.2716646194458, -7.411262035369873, -6.550859451293945, -5.690456390380859, -4.830053806304932, -3.969650983810425, -3.109248161315918, -2.2488455772399902, -1.3884425163269043, -0.5280399322509766, 0.3323628306388855, 1.1927655935287476, 2.053168296813965, 2.9135711193084717, 3.7739739418029785, 4.634376525878906, 5.494779586791992, 6.35518217086792, 7.215584754943848, 8.075987815856934, 8.936389923095703, 9.796792984008789, 10.657196044921875, 11.517599105834961, 12.378002166748047, 13.238404273986816, 14.098807334899902, 14.959209442138672, 15.819612503051758, 16.680015563964844, 17.54041862487793, 18.400821685791016, 19.26122283935547, 20.121625900268555, 20.98202896118164, 21.842432022094727, 22.702835083007812, 23.563236236572266, 24.42363929748535, 25.284042358398438, 26.144445419311523, 27.00484848022461]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 11.0, 20.0, 24.0, 30.0, 14.0, 27.0, 29.0, 36.0, 27.0, 34.0, 44.0, 30.0, 35.0, 31.0, 47.0, 51.0, 37.0, 36.0, 42.0, 48.0, 35.0, 35.0, 43.0, 28.0, 25.0, 24.0, 21.0, 17.0, 14.0, 18.0, 13.0, 12.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.075824737548828, -6.839612007141113, -6.603399276733398, -6.367186546325684, -6.130973815917969, -5.894761085510254, -5.658548355102539, -5.422335624694824, -5.186122894287109, -4.9499101638793945, -4.71369743347168, -4.477484703063965, -4.24127197265625, -4.005059242248535, -3.7688465118408203, -3.5326337814331055, -3.2964212894439697, -3.060208559036255, -2.82399582862854, -2.587783098220825, -2.3515703678131104, -2.1153578758239746, -1.8791450262069702, -1.6429322957992554, -1.4067195653915405, -1.1705068349838257, -0.9342941045761108, -0.6980814337730408, -0.4618687033653259, -0.22565603256225586, 0.010556697845458984, 0.24676942825317383, 0.48298215866088867, 0.7191948890686035, 0.9554076194763184, 1.1916203498840332, 1.427833080291748, 1.6640456914901733, 1.9002584218978882, 2.1364712715148926, 2.3726840019226074, 2.6088967323303223, 2.845109462738037, 3.081322193145752, 3.317534923553467, 3.5537476539611816, 3.7899603843688965, 4.026173114776611, 4.262385368347168, 4.498598098754883, 4.734810829162598, 4.9710235595703125, 5.207236289978027, 5.443449020385742, 5.679661750793457, 5.915874481201172, 6.152087211608887, 6.388299942016602, 6.624512672424316, 6.860725402832031, 7.096938133239746, 7.333150863647461, 7.569363594055176, 7.805576324462891, 8.041789054870605]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 14.0, 13.0, 18.0, 22.0, 49.0, 56.0, 106.0, 171.0, 263.0, 419.0, 877.0, 1633.0, 3065.0, 6388.0, 14770.0, 34247.0, 84749.0, 247269.0, 406364.0, 148334.0, 56420.0, 23456.0, 10056.0, 4643.0, 2343.0, 1221.0, 613.0, 357.0, 245.0, 120.0, 65.0, 60.0, 38.0, 23.0, 15.0, 11.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.513671875, -1.469512939453125, -1.42535400390625, -1.381195068359375, -1.3370361328125, -1.292877197265625, -1.24871826171875, -1.204559326171875, -1.160400390625, -1.116241455078125, -1.07208251953125, -1.027923583984375, -0.9837646484375, -0.939605712890625, -0.89544677734375, -0.851287841796875, -0.80712890625, -0.762969970703125, -0.71881103515625, -0.674652099609375, -0.6304931640625, -0.586334228515625, -0.54217529296875, -0.498016357421875, -0.453857421875, -0.409698486328125, -0.36553955078125, -0.321380615234375, -0.2772216796875, -0.233062744140625, -0.18890380859375, -0.144744873046875, -0.1005859375, -0.056427001953125, -0.01226806640625, 0.031890869140625, 0.0760498046875, 0.120208740234375, 0.16436767578125, 0.208526611328125, 0.252685546875, 0.296844482421875, 0.34100341796875, 0.385162353515625, 0.4293212890625, 0.473480224609375, 0.51763916015625, 0.561798095703125, 0.60595703125, 0.650115966796875, 0.69427490234375, 0.738433837890625, 0.7825927734375, 0.826751708984375, 0.87091064453125, 0.915069580078125, 0.959228515625, 1.003387451171875, 1.04754638671875, 1.091705322265625, 1.1358642578125, 1.180023193359375, 1.22418212890625, 1.268341064453125, 1.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 10.0, 9.0, 26.0, 27.0, 34.0, 50.0, 57.0, 51.0, 72.0, 79.0, 71.0, 68.0, 75.0, 58.0, 66.0, 73.0, 46.0, 35.0, 21.0, 21.0, 9.0, 14.0, 9.0, 4.0, 5.0, 6.0, 0.0, 3.0], "bins": [-1.447265625, -1.4164276123046875, -1.385589599609375, -1.3547515869140625, -1.32391357421875, -1.2930755615234375, -1.262237548828125, -1.2313995361328125, -1.2005615234375, -1.1697235107421875, -1.138885498046875, -1.1080474853515625, -1.07720947265625, -1.0463714599609375, -1.015533447265625, -0.9846954345703125, -0.953857421875, -0.9230194091796875, -0.892181396484375, -0.8613433837890625, -0.83050537109375, -0.7996673583984375, -0.768829345703125, -0.7379913330078125, -0.7071533203125, -0.6763153076171875, -0.645477294921875, -0.6146392822265625, -0.58380126953125, -0.5529632568359375, -0.522125244140625, -0.4912872314453125, -0.46044921875, -0.4296112060546875, -0.398773193359375, -0.3679351806640625, -0.33709716796875, -0.3062591552734375, -0.275421142578125, -0.2445831298828125, -0.2137451171875, -0.1829071044921875, -0.152069091796875, -0.1212310791015625, -0.09039306640625, -0.0595550537109375, -0.028717041015625, 0.0021209716796875, 0.032958984375, 0.0637969970703125, 0.094635009765625, 0.1254730224609375, 0.15631103515625, 0.1871490478515625, 0.217987060546875, 0.2488250732421875, 0.2796630859375, 0.3105010986328125, 0.341339111328125, 0.3721771240234375, 0.40301513671875, 0.4338531494140625, 0.464691162109375, 0.4955291748046875, 0.5263671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 35.0, 49.0, 86.0, 167.0, 292.0, 587.0, 1320.0, 3705.0, 17571.0, 365910.0, 630920.0, 20913.0, 4101.0, 1474.0, 671.0, 296.0, 172.0, 109.0, 49.0, 39.0, 22.0, 15.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.36767578125, -4.2119140625, -4.05615234375, -3.900390625, -3.74462890625, -3.5888671875, -3.43310546875, -3.27734375, -3.12158203125, -2.9658203125, -2.81005859375, -2.654296875, -2.49853515625, -2.3427734375, -2.18701171875, -2.03125, -1.87548828125, -1.7197265625, -1.56396484375, -1.408203125, -1.25244140625, -1.0966796875, -0.94091796875, -0.78515625, -0.62939453125, -0.4736328125, -0.31787109375, -0.162109375, -0.00634765625, 0.1494140625, 0.30517578125, 0.4609375, 0.61669921875, 0.7724609375, 0.92822265625, 1.083984375, 1.23974609375, 1.3955078125, 1.55126953125, 1.70703125, 1.86279296875, 2.0185546875, 2.17431640625, 2.330078125, 2.48583984375, 2.6416015625, 2.79736328125, 2.953125, 3.10888671875, 3.2646484375, 3.42041015625, 3.576171875, 3.73193359375, 3.8876953125, 4.04345703125, 4.19921875, 4.35498046875, 4.5107421875, 4.66650390625, 4.822265625, 4.97802734375, 5.1337890625, 5.28955078125, 5.4453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 13.0, 12.0, 16.0, 16.0, 15.0, 31.0, 30.0, 40.0, 41.0, 40.0, 49.0, 51.0, 58.0, 60.0, 63.0, 56.0, 48.0, 49.0, 49.0, 37.0, 41.0, 31.0, 31.0, 28.0, 20.0, 16.0, 7.0, 14.0, 3.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.924163818359375, -2.81707763671875, -2.709991455078125, -2.6029052734375, -2.495819091796875, -2.38873291015625, -2.281646728515625, -2.174560546875, -2.067474365234375, -1.96038818359375, -1.853302001953125, -1.7462158203125, -1.639129638671875, -1.53204345703125, -1.424957275390625, -1.31787109375, -1.210784912109375, -1.10369873046875, -0.996612548828125, -0.8895263671875, -0.782440185546875, -0.67535400390625, -0.568267822265625, -0.461181640625, -0.354095458984375, -0.24700927734375, -0.139923095703125, -0.0328369140625, 0.074249267578125, 0.18133544921875, 0.288421630859375, 0.3955078125, 0.502593994140625, 0.60968017578125, 0.716766357421875, 0.8238525390625, 0.930938720703125, 1.03802490234375, 1.145111083984375, 1.252197265625, 1.359283447265625, 1.46636962890625, 1.573455810546875, 1.6805419921875, 1.787628173828125, 1.89471435546875, 2.001800537109375, 2.10888671875, 2.215972900390625, 2.32305908203125, 2.430145263671875, 2.5372314453125, 2.644317626953125, 2.75140380859375, 2.858489990234375, 2.965576171875, 3.072662353515625, 3.17974853515625, 3.286834716796875, 3.3939208984375, 3.501007080078125, 3.60809326171875, 3.715179443359375, 3.822265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 12.0, 14.0, 23.0, 41.0, 54.0, 110.0, 153.0, 277.0, 592.0, 1355.0, 3710.0, 13393.0, 66769.0, 636350.0, 270929.0, 41046.0, 9035.0, 2515.0, 1007.0, 502.0, 248.0, 127.0, 57.0, 53.0, 41.0, 25.0, 26.0, 11.0, 11.0, 6.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.087890625, -1.053741455078125, -1.01959228515625, -0.985443115234375, -0.9512939453125, -0.917144775390625, -0.88299560546875, -0.848846435546875, -0.814697265625, -0.780548095703125, -0.74639892578125, -0.712249755859375, -0.6781005859375, -0.643951416015625, -0.60980224609375, -0.575653076171875, -0.54150390625, -0.507354736328125, -0.47320556640625, -0.439056396484375, -0.4049072265625, -0.370758056640625, -0.33660888671875, -0.302459716796875, -0.268310546875, -0.234161376953125, -0.20001220703125, -0.165863037109375, -0.1317138671875, -0.097564697265625, -0.06341552734375, -0.029266357421875, 0.0048828125, 0.039031982421875, 0.07318115234375, 0.107330322265625, 0.1414794921875, 0.175628662109375, 0.20977783203125, 0.243927001953125, 0.278076171875, 0.312225341796875, 0.34637451171875, 0.380523681640625, 0.4146728515625, 0.448822021484375, 0.48297119140625, 0.517120361328125, 0.55126953125, 0.585418701171875, 0.61956787109375, 0.653717041015625, 0.6878662109375, 0.722015380859375, 0.75616455078125, 0.790313720703125, 0.824462890625, 0.858612060546875, 0.89276123046875, 0.926910400390625, 0.9610595703125, 0.995208740234375, 1.02935791015625, 1.063507080078125, 1.09765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 11.0, 14.0, 13.0, 18.0, 24.0, 20.0, 24.0, 31.0, 52.0, 55.0, 93.0, 141.0, 139.0, 63.0, 62.0, 49.0, 33.0, 26.0, 19.0, 17.0, 24.0, 13.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002503395080566406, -0.00024197623133659363, -0.00023361295461654663, -0.00022524967789649963, -0.00021688640117645264, -0.00020852312445640564, -0.00020015984773635864, -0.00019179657101631165, -0.00018343329429626465, -0.00017507001757621765, -0.00016670674085617065, -0.00015834346413612366, -0.00014998018741607666, -0.00014161691069602966, -0.00013325363397598267, -0.00012489035725593567, -0.00011652708053588867, -0.00010816380381584167, -9.980052709579468e-05, -9.143725037574768e-05, -8.307397365570068e-05, -7.471069693565369e-05, -6.634742021560669e-05, -5.798414349555969e-05, -4.9620866775512695e-05, -4.12575900554657e-05, -3.28943133354187e-05, -2.4531036615371704e-05, -1.6167759895324707e-05, -7.80448317527771e-06, 5.587935447692871e-07, 8.922070264816284e-06, 1.728534698486328e-05, 2.564862370491028e-05, 3.4011900424957275e-05, 4.237517714500427e-05, 5.073845386505127e-05, 5.9101730585098267e-05, 6.746500730514526e-05, 7.582828402519226e-05, 8.419156074523926e-05, 9.255483746528625e-05, 0.00010091811418533325, 0.00010928139090538025, 0.00011764466762542725, 0.00012600794434547424, 0.00013437122106552124, 0.00014273449778556824, 0.00015109777450561523, 0.00015946105122566223, 0.00016782432794570923, 0.00017618760466575623, 0.00018455088138580322, 0.00019291415810585022, 0.00020127743482589722, 0.00020964071154594421, 0.0002180039882659912, 0.0002263672649860382, 0.0002347305417060852, 0.0002430938184261322, 0.0002514570951461792, 0.0002598203718662262, 0.0002681836485862732, 0.0002765469253063202, 0.0002849102020263672]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 6.0, 7.0, 10.0, 11.0, 33.0, 40.0, 51.0, 112.0, 272.0, 570.0, 1471.0, 4481.0, 23499.0, 351243.0, 628656.0, 29981.0, 5251.0, 1680.0, 602.0, 284.0, 133.0, 74.0, 39.0, 19.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.105377197265625, -1.05743408203125, -1.009490966796875, -0.9615478515625, -0.913604736328125, -0.86566162109375, -0.817718505859375, -0.769775390625, -0.721832275390625, -0.67388916015625, -0.625946044921875, -0.5780029296875, -0.530059814453125, -0.48211669921875, -0.434173583984375, -0.38623046875, -0.338287353515625, -0.29034423828125, -0.242401123046875, -0.1944580078125, -0.146514892578125, -0.09857177734375, -0.050628662109375, -0.002685546875, 0.045257568359375, 0.09320068359375, 0.141143798828125, 0.1890869140625, 0.237030029296875, 0.28497314453125, 0.332916259765625, 0.380859375, 0.428802490234375, 0.47674560546875, 0.524688720703125, 0.5726318359375, 0.620574951171875, 0.66851806640625, 0.716461181640625, 0.764404296875, 0.812347412109375, 0.86029052734375, 0.908233642578125, 0.9561767578125, 1.004119873046875, 1.05206298828125, 1.100006103515625, 1.14794921875, 1.195892333984375, 1.24383544921875, 1.291778564453125, 1.3397216796875, 1.387664794921875, 1.43560791015625, 1.483551025390625, 1.531494140625, 1.579437255859375, 1.62738037109375, 1.675323486328125, 1.7232666015625, 1.771209716796875, 1.81915283203125, 1.867095947265625, 1.9150390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 13.0, 17.0, 13.0, 25.0, 53.0, 33.0, 55.0, 55.0, 68.0, 75.0, 98.0, 83.0, 81.0, 56.0, 52.0, 48.0, 30.0, 26.0, 16.0, 19.0, 18.0, 6.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7885971069335938, -0.7593231201171875, -0.7300491333007812, -0.700775146484375, -0.6715011596679688, -0.6422271728515625, -0.6129531860351562, -0.58367919921875, -0.5544052124023438, -0.5251312255859375, -0.49585723876953125, -0.466583251953125, -0.43730926513671875, -0.4080352783203125, -0.37876129150390625, -0.3494873046875, -0.32021331787109375, -0.2909393310546875, -0.26166534423828125, -0.232391357421875, -0.20311737060546875, -0.1738433837890625, -0.14456939697265625, -0.11529541015625, -0.08602142333984375, -0.0567474365234375, -0.02747344970703125, 0.001800537109375, 0.03107452392578125, 0.0603485107421875, 0.08962249755859375, 0.118896484375, 0.14817047119140625, 0.1774444580078125, 0.20671844482421875, 0.235992431640625, 0.26526641845703125, 0.2945404052734375, 0.32381439208984375, 0.35308837890625, 0.38236236572265625, 0.4116363525390625, 0.44091033935546875, 0.470184326171875, 0.49945831298828125, 0.5287322998046875, 0.5580062866210938, 0.5872802734375, 0.6165542602539062, 0.6458282470703125, 0.6751022338867188, 0.704376220703125, 0.7336502075195312, 0.7629241943359375, 0.7921981811523438, 0.82147216796875, 0.8507461547851562, 0.8800201416015625, 0.9092941284179688, 0.938568115234375, 0.9678421020507812, 0.9971160888671875, 1.0263900756835938, 1.0556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 13.0, 28.0, 59.0, 136.0, 231.0, 245.0, 138.0, 63.0, 31.0, 15.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.754072189331055, -26.940380096435547, -26.12668800354004, -25.31299591064453, -24.499305725097656, -23.68561363220215, -22.87192153930664, -22.058229446411133, -21.244537353515625, -20.430845260620117, -19.61715316772461, -18.803462982177734, -17.989770889282227, -17.17607879638672, -16.36238670349121, -15.548694610595703, -14.735003471374512, -13.921311378479004, -13.107620239257812, -12.293928146362305, -11.480236053466797, -10.666543960571289, -9.852852821350098, -9.03916072845459, -8.225469589233398, -7.411777973175049, -6.598085880279541, -5.784394264221191, -4.970702171325684, -4.157010555267334, -3.3433189392089844, -2.5296268463134766, -1.7159347534179688, -0.9022429585456848, -0.08855116367340088, 0.7251405715942383, 1.538832426071167, 2.3525242805480957, 3.1662158966064453, 3.979907989501953, 4.793599605560303, 5.607291221618652, 6.42098331451416, 7.23467493057251, 8.04836654663086, 8.862058639526367, 9.675750732421875, 10.489442825317383, 11.303133964538574, 12.116826057434082, 12.930517196655273, 13.744209289550781, 14.557901382446289, 15.371593475341797, 16.185283660888672, 16.998977661132812, 17.812667846679688, 18.626359939575195, 19.440052032470703, 20.253742218017578, 21.067434310913086, 21.881126403808594, 22.6948184967041, 23.50851058959961, 24.322202682495117]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 7.0, 3.0, 8.0, 10.0, 10.0, 15.0, 10.0, 23.0, 17.0, 20.0, 20.0, 17.0, 21.0, 21.0, 31.0, 35.0, 30.0, 32.0, 41.0, 53.0, 45.0, 54.0, 52.0, 47.0, 32.0, 44.0, 37.0, 25.0, 30.0, 27.0, 21.0, 23.0, 21.0, 15.0, 10.0, 8.0, 11.0, 13.0, 13.0, 5.0, 4.0, 5.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-10.03938102722168, -9.736881256103516, -9.434381484985352, -9.131881713867188, -8.829381942749023, -8.52688217163086, -8.224382400512695, -7.921882629394531, -7.619382858276367, -7.316883087158203, -7.014383316040039, -6.711883544921875, -6.409383773803711, -6.106884002685547, -5.804384231567383, -5.501884460449219, -5.199384689331055, -4.896884918212891, -4.594385147094727, -4.2918853759765625, -3.9893856048583984, -3.6868858337402344, -3.3843860626220703, -3.0818862915039062, -2.779386520385742, -2.476886749267578, -2.174386978149414, -1.87188720703125, -1.569387435913086, -1.2668876647949219, -0.9643878936767578, -0.6618881225585938, -0.3593883514404297, -0.056888580322265625, 0.24561119079589844, 0.5481109619140625, 0.8506107330322266, 1.1531105041503906, 1.4556102752685547, 1.7581100463867188, 2.060609817504883, 2.363109588623047, 2.665609359741211, 2.968109130859375, 3.270608901977539, 3.573108673095703, 3.875608444213867, 4.178108215332031, 4.480607986450195, 4.783107757568359, 5.085607528686523, 5.3881072998046875, 5.690607070922852, 5.993106842041016, 6.29560661315918, 6.598106384277344, 6.900606155395508, 7.203105926513672, 7.505605697631836, 7.80810546875, 8.110605239868164, 8.413105010986328, 8.715604782104492, 9.018104553222656, 9.32060432434082]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 15.0, 29.0, 64.0, 102.0, 230.0, 673.0, 2035.0, 9413.0, 67907.0, 1320856.0, 2641013.0, 130439.0, 16614.0, 3398.0, 918.0, 311.0, 138.0, 65.0, 26.0, 15.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.455078125, -2.4006805419921875, -2.346282958984375, -2.2918853759765625, -2.23748779296875, -2.1830902099609375, -2.128692626953125, -2.0742950439453125, -2.0198974609375, -1.9654998779296875, -1.911102294921875, -1.8567047119140625, -1.80230712890625, -1.7479095458984375, -1.693511962890625, -1.6391143798828125, -1.584716796875, -1.5303192138671875, -1.475921630859375, -1.4215240478515625, -1.36712646484375, -1.3127288818359375, -1.258331298828125, -1.2039337158203125, -1.1495361328125, -1.0951385498046875, -1.040740966796875, -0.9863433837890625, -0.93194580078125, -0.8775482177734375, -0.823150634765625, -0.7687530517578125, -0.71435546875, -0.6599578857421875, -0.605560302734375, -0.5511627197265625, -0.49676513671875, -0.4423675537109375, -0.387969970703125, -0.3335723876953125, -0.2791748046875, -0.2247772216796875, -0.170379638671875, -0.1159820556640625, -0.06158447265625, -0.0071868896484375, 0.047210693359375, 0.1016082763671875, 0.156005859375, 0.2104034423828125, 0.264801025390625, 0.3191986083984375, 0.37359619140625, 0.4279937744140625, 0.482391357421875, 0.5367889404296875, 0.5911865234375, 0.6455841064453125, 0.699981689453125, 0.7543792724609375, 0.80877685546875, 0.8631744384765625, 0.917572021484375, 0.9719696044921875, 1.0263671875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 7.0, 14.0, 16.0, 23.0, 39.0, 45.0, 59.0, 81.0, 88.0, 88.0, 105.0, 100.0, 86.0, 78.0, 50.0, 44.0, 24.0, 25.0, 18.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.8583984375, -1.820556640625, -1.78271484375, -1.744873046875, -1.70703125, -1.669189453125, -1.63134765625, -1.593505859375, -1.5556640625, -1.517822265625, -1.47998046875, -1.442138671875, -1.404296875, -1.366455078125, -1.32861328125, -1.290771484375, -1.2529296875, -1.215087890625, -1.17724609375, -1.139404296875, -1.1015625, -1.063720703125, -1.02587890625, -0.988037109375, -0.9501953125, -0.912353515625, -0.87451171875, -0.836669921875, -0.798828125, -0.760986328125, -0.72314453125, -0.685302734375, -0.6474609375, -0.609619140625, -0.57177734375, -0.533935546875, -0.49609375, -0.458251953125, -0.42041015625, -0.382568359375, -0.3447265625, -0.306884765625, -0.26904296875, -0.231201171875, -0.193359375, -0.155517578125, -0.11767578125, -0.079833984375, -0.0419921875, -0.004150390625, 0.03369140625, 0.071533203125, 0.109375, 0.147216796875, 0.18505859375, 0.222900390625, 0.2607421875, 0.298583984375, 0.33642578125, 0.374267578125, 0.412109375, 0.449951171875, 0.48779296875, 0.525634765625, 0.5634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 13.0, 31.0, 36.0, 52.0, 105.0, 164.0, 309.0, 605.0, 1298.0, 3045.0, 9848.0, 42044.0, 313868.0, 3130023.0, 609647.0, 62795.0, 13426.0, 3966.0, 1494.0, 685.0, 345.0, 197.0, 96.0, 61.0, 41.0, 15.0, 17.0, 16.0, 12.0, 2.0, 3.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.8303375244140625, -1.775909423828125, -1.7214813232421875, -1.66705322265625, -1.6126251220703125, -1.558197021484375, -1.5037689208984375, -1.4493408203125, -1.3949127197265625, -1.340484619140625, -1.2860565185546875, -1.23162841796875, -1.1772003173828125, -1.122772216796875, -1.0683441162109375, -1.013916015625, -0.9594879150390625, -0.905059814453125, -0.8506317138671875, -0.79620361328125, -0.7417755126953125, -0.687347412109375, -0.6329193115234375, -0.5784912109375, -0.5240631103515625, -0.469635009765625, -0.4152069091796875, -0.36077880859375, -0.3063507080078125, -0.251922607421875, -0.1974945068359375, -0.14306640625, -0.0886383056640625, -0.034210205078125, 0.0202178955078125, 0.07464599609375, 0.1290740966796875, 0.183502197265625, 0.2379302978515625, 0.2923583984375, 0.3467864990234375, 0.401214599609375, 0.4556427001953125, 0.51007080078125, 0.5644989013671875, 0.618927001953125, 0.6733551025390625, 0.727783203125, 0.7822113037109375, 0.836639404296875, 0.8910675048828125, 0.94549560546875, 0.9999237060546875, 1.054351806640625, 1.1087799072265625, 1.1632080078125, 1.2176361083984375, 1.272064208984375, 1.3264923095703125, 1.38092041015625, 1.4353485107421875, 1.489776611328125, 1.5442047119140625, 1.5986328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 7.0, 11.0, 13.0, 21.0, 27.0, 47.0, 61.0, 96.0, 133.0, 253.0, 318.0, 531.0, 682.0, 637.0, 455.0, 269.0, 143.0, 108.0, 86.0, 38.0, 30.0, 21.0, 26.0, 16.0, 10.0, 6.0, 9.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3656463623046875, -1.308441162109375, -1.2512359619140625, -1.19403076171875, -1.1368255615234375, -1.079620361328125, -1.0224151611328125, -0.9652099609375, -0.9080047607421875, -0.850799560546875, -0.7935943603515625, -0.73638916015625, -0.6791839599609375, -0.621978759765625, -0.5647735595703125, -0.507568359375, -0.4503631591796875, -0.393157958984375, -0.3359527587890625, -0.27874755859375, -0.2215423583984375, -0.164337158203125, -0.1071319580078125, -0.0499267578125, 0.0072784423828125, 0.064483642578125, 0.1216888427734375, 0.17889404296875, 0.2360992431640625, 0.293304443359375, 0.3505096435546875, 0.40771484375, 0.4649200439453125, 0.522125244140625, 0.5793304443359375, 0.63653564453125, 0.6937408447265625, 0.750946044921875, 0.8081512451171875, 0.8653564453125, 0.9225616455078125, 0.979766845703125, 1.0369720458984375, 1.09417724609375, 1.1513824462890625, 1.208587646484375, 1.2657928466796875, 1.322998046875, 1.3802032470703125, 1.437408447265625, 1.4946136474609375, 1.55181884765625, 1.6090240478515625, 1.666229248046875, 1.7234344482421875, 1.7806396484375, 1.8378448486328125, 1.895050048828125, 1.9522552490234375, 2.00946044921875, 2.0666656494140625, 2.123870849609375, 2.1810760498046875, 2.23828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 13.0, 15.0, 50.0, 121.0, 198.0, 262.0, 156.0, 96.0, 37.0, 18.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.47132110595703, -34.741455078125, -34.01158905029297, -33.2817268371582, -32.55186080932617, -31.82199478149414, -31.09212875366211, -30.36226463317871, -29.632400512695312, -28.90253448486328, -28.172670364379883, -27.44280433654785, -26.712940216064453, -25.983074188232422, -25.25320816040039, -24.523344039916992, -23.79347801208496, -23.06361198425293, -22.33374786376953, -21.6038818359375, -20.8740177154541, -20.14415168762207, -19.414287567138672, -18.68442153930664, -17.95455551147461, -17.224689483642578, -16.49482536315918, -15.764959335327148, -15.03509521484375, -14.305229187011719, -13.575364112854004, -12.845499038696289, -12.11563491821289, -11.385769844055176, -10.655904769897461, -9.92603874206543, -9.196174621582031, -8.46630859375, -7.736443519592285, -7.00657844543457, -6.2767133712768555, -5.546848297119141, -4.816983222961426, -4.087117671966553, -3.357252597808838, -2.627387523651123, -1.89752197265625, -1.1676568984985352, -0.4377918243408203, 0.2920733690261841, 1.0219385623931885, 1.7518038749694824, 2.4816689491271973, 3.211534023284912, 3.941399574279785, 4.6712646484375, 5.401129722595215, 6.13099479675293, 6.8608598709106445, 7.590725421905518, 8.32059097290039, 9.050455093383789, 9.78032112121582, 10.510186195373535, 11.24005126953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 8.0, 16.0, 21.0, 19.0, 28.0, 28.0, 26.0, 32.0, 38.0, 36.0, 40.0, 52.0, 44.0, 48.0, 56.0, 42.0, 47.0, 63.0, 48.0, 57.0, 44.0, 35.0, 30.0, 26.0, 28.0, 22.0, 12.0, 14.0, 8.0, 9.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.01160717010498, -7.712160110473633, -7.412713050842285, -7.1132659912109375, -6.81381893157959, -6.514371871948242, -6.214925289154053, -5.915478229522705, -5.616031169891357, -5.31658411026001, -5.017137050628662, -4.7176899909973145, -4.418243408203125, -4.118796348571777, -3.8193492889404297, -3.519902229309082, -3.2204551696777344, -2.9210081100463867, -2.621561050415039, -2.3221142292022705, -2.022667169570923, -1.7232201099395752, -1.423773169517517, -1.124326229095459, -0.8248791694641113, -0.5254321694374084, -0.22598516941070557, 0.07346183061599731, 0.3729088306427002, 0.6723558902740479, 0.971802830696106, 1.271249771118164, 1.5706968307495117, 1.8701438903808594, 2.169590950012207, 2.4690377712249756, 2.7684848308563232, 3.067931890487671, 3.3673787117004395, 3.666825771331787, 3.9662728309631348, 4.265719890594482, 4.56516695022583, 4.864614009857178, 5.164060592651367, 5.463507652282715, 5.7629547119140625, 6.06240177154541, 6.361848831176758, 6.6612958908081055, 6.960742950439453, 7.260190010070801, 7.559637069702148, 7.859084129333496, 8.158531188964844, 8.457977294921875, 8.757425308227539, 9.056872367858887, 9.356319427490234, 9.655766487121582, 9.95521354675293, 10.254660606384277, 10.554107666015625, 10.853553771972656, 11.153000831604004]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 10.0, 6.0, 10.0, 6.0, 25.0, 32.0, 28.0, 59.0, 107.0, 136.0, 240.0, 430.0, 641.0, 1163.0, 2403.0, 4715.0, 10366.0, 24827.0, 77797.0, 359946.0, 422184.0, 92818.0, 28273.0, 11446.0, 5182.0, 2627.0, 1324.0, 697.0, 413.0, 241.0, 114.0, 107.0, 61.0, 35.0, 34.0, 15.0, 7.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.66015625, -1.611419677734375, -1.56268310546875, -1.513946533203125, -1.4652099609375, -1.416473388671875, -1.36773681640625, -1.319000244140625, -1.270263671875, -1.221527099609375, -1.17279052734375, -1.124053955078125, -1.0753173828125, -1.026580810546875, -0.97784423828125, -0.929107666015625, -0.88037109375, -0.831634521484375, -0.78289794921875, -0.734161376953125, -0.6854248046875, -0.636688232421875, -0.58795166015625, -0.539215087890625, -0.490478515625, -0.441741943359375, -0.39300537109375, -0.344268798828125, -0.2955322265625, -0.246795654296875, -0.19805908203125, -0.149322509765625, -0.1005859375, -0.051849365234375, -0.00311279296875, 0.045623779296875, 0.0943603515625, 0.143096923828125, 0.19183349609375, 0.240570068359375, 0.289306640625, 0.338043212890625, 0.38677978515625, 0.435516357421875, 0.4842529296875, 0.532989501953125, 0.58172607421875, 0.630462646484375, 0.67919921875, 0.727935791015625, 0.77667236328125, 0.825408935546875, 0.8741455078125, 0.922882080078125, 0.97161865234375, 1.020355224609375, 1.069091796875, 1.117828369140625, 1.16656494140625, 1.215301513671875, 1.2640380859375, 1.312774658203125, 1.36151123046875, 1.410247802734375, 1.458984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 14.0, 13.0, 22.0, 21.0, 19.0, 28.0, 27.0, 30.0, 41.0, 44.0, 55.0, 56.0, 41.0, 46.0, 53.0, 54.0, 63.0, 57.0, 42.0, 45.0, 27.0, 38.0, 31.0, 19.0, 20.0, 18.0, 15.0, 11.0, 9.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.8974609375, -0.875457763671875, -0.85345458984375, -0.831451416015625, -0.8094482421875, -0.787445068359375, -0.76544189453125, -0.743438720703125, -0.721435546875, -0.699432373046875, -0.67742919921875, -0.655426025390625, -0.6334228515625, -0.611419677734375, -0.58941650390625, -0.567413330078125, -0.54541015625, -0.523406982421875, -0.50140380859375, -0.479400634765625, -0.4573974609375, -0.435394287109375, -0.41339111328125, -0.391387939453125, -0.369384765625, -0.347381591796875, -0.32537841796875, -0.303375244140625, -0.2813720703125, -0.259368896484375, -0.23736572265625, -0.215362548828125, -0.193359375, -0.171356201171875, -0.14935302734375, -0.127349853515625, -0.1053466796875, -0.083343505859375, -0.06134033203125, -0.039337158203125, -0.017333984375, 0.004669189453125, 0.02667236328125, 0.048675537109375, 0.0706787109375, 0.092681884765625, 0.11468505859375, 0.136688232421875, 0.15869140625, 0.180694580078125, 0.20269775390625, 0.224700927734375, 0.2467041015625, 0.268707275390625, 0.29071044921875, 0.312713623046875, 0.334716796875, 0.356719970703125, 0.37872314453125, 0.400726318359375, 0.4227294921875, 0.444732666015625, 0.46673583984375, 0.488739013671875, 0.5107421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 20.0, 20.0, 44.0, 81.0, 126.0, 244.0, 493.0, 1095.0, 3356.0, 18355.0, 598389.0, 404311.0, 16683.0, 3159.0, 1053.0, 502.0, 253.0, 150.0, 76.0, 41.0, 24.0, 23.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.58746337890625, -4.4483642578125, -4.30926513671875, -4.170166015625, -4.03106689453125, -3.8919677734375, -3.75286865234375, -3.61376953125, -3.47467041015625, -3.3355712890625, -3.19647216796875, -3.057373046875, -2.91827392578125, -2.7791748046875, -2.64007568359375, -2.5009765625, -2.36187744140625, -2.2227783203125, -2.08367919921875, -1.944580078125, -1.80548095703125, -1.6663818359375, -1.52728271484375, -1.38818359375, -1.24908447265625, -1.1099853515625, -0.97088623046875, -0.831787109375, -0.69268798828125, -0.5535888671875, -0.41448974609375, -0.275390625, -0.13629150390625, 0.0028076171875, 0.14190673828125, 0.281005859375, 0.42010498046875, 0.5592041015625, 0.69830322265625, 0.83740234375, 0.97650146484375, 1.1156005859375, 1.25469970703125, 1.393798828125, 1.53289794921875, 1.6719970703125, 1.81109619140625, 1.9501953125, 2.08929443359375, 2.2283935546875, 2.36749267578125, 2.506591796875, 2.64569091796875, 2.7847900390625, 2.92388916015625, 3.06298828125, 3.20208740234375, 3.3411865234375, 3.48028564453125, 3.619384765625, 3.75848388671875, 3.8975830078125, 4.03668212890625, 4.17578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 7.0, 6.0, 5.0, 11.0, 12.0, 16.0, 14.0, 27.0, 27.0, 24.0, 29.0, 35.0, 30.0, 46.0, 53.0, 42.0, 48.0, 45.0, 49.0, 52.0, 57.0, 49.0, 35.0, 39.0, 31.0, 30.0, 36.0, 21.0, 19.0, 13.0, 18.0, 12.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.595703125, -2.51434326171875, -2.4329833984375, -2.35162353515625, -2.270263671875, -2.18890380859375, -2.1075439453125, -2.02618408203125, -1.94482421875, -1.86346435546875, -1.7821044921875, -1.70074462890625, -1.619384765625, -1.53802490234375, -1.4566650390625, -1.37530517578125, -1.2939453125, -1.21258544921875, -1.1312255859375, -1.04986572265625, -0.968505859375, -0.88714599609375, -0.8057861328125, -0.72442626953125, -0.64306640625, -0.56170654296875, -0.4803466796875, -0.39898681640625, -0.317626953125, -0.23626708984375, -0.1549072265625, -0.07354736328125, 0.0078125, 0.08917236328125, 0.1705322265625, 0.25189208984375, 0.333251953125, 0.41461181640625, 0.4959716796875, 0.57733154296875, 0.65869140625, 0.74005126953125, 0.8214111328125, 0.90277099609375, 0.984130859375, 1.06549072265625, 1.1468505859375, 1.22821044921875, 1.3095703125, 1.39093017578125, 1.4722900390625, 1.55364990234375, 1.635009765625, 1.71636962890625, 1.7977294921875, 1.87908935546875, 1.96044921875, 2.04180908203125, 2.1231689453125, 2.20452880859375, 2.285888671875, 2.36724853515625, 2.4486083984375, 2.52996826171875, 2.611328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 8.0, 8.0, 20.0, 20.0, 57.0, 91.0, 169.0, 396.0, 973.0, 4099.0, 23121.0, 233116.0, 728832.0, 47914.0, 7029.0, 1656.0, 541.0, 234.0, 109.0, 65.0, 25.0, 15.0, 18.0, 7.0, 12.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4810791015625, -1.437744140625, -1.3944091796875, -1.35107421875, -1.3077392578125, -1.264404296875, -1.2210693359375, -1.177734375, -1.1343994140625, -1.091064453125, -1.0477294921875, -1.00439453125, -0.9610595703125, -0.917724609375, -0.8743896484375, -0.8310546875, -0.7877197265625, -0.744384765625, -0.7010498046875, -0.65771484375, -0.6143798828125, -0.571044921875, -0.5277099609375, -0.484375, -0.4410400390625, -0.397705078125, -0.3543701171875, -0.31103515625, -0.2677001953125, -0.224365234375, -0.1810302734375, -0.1376953125, -0.0943603515625, -0.051025390625, -0.0076904296875, 0.03564453125, 0.0789794921875, 0.122314453125, 0.1656494140625, 0.208984375, 0.2523193359375, 0.295654296875, 0.3389892578125, 0.38232421875, 0.4256591796875, 0.468994140625, 0.5123291015625, 0.5556640625, 0.5989990234375, 0.642333984375, 0.6856689453125, 0.72900390625, 0.7723388671875, 0.815673828125, 0.8590087890625, 0.90234375, 0.9456787109375, 0.989013671875, 1.0323486328125, 1.07568359375, 1.1190185546875, 1.162353515625, 1.2056884765625, 1.2490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 3.0, 5.0, 7.0, 7.0, 9.0, 13.0, 20.0, 23.0, 28.0, 20.0, 46.0, 75.0, 112.0, 144.0, 135.0, 85.0, 67.0, 38.0, 36.0, 17.0, 25.0, 12.0, 6.0, 12.0, 7.0, 8.0, 5.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026607513427734375, -0.0002579689025878906, -0.0002498626708984375, -0.00024175643920898438, -0.00023365020751953125, -0.00022554397583007812, -0.000217437744140625, -0.00020933151245117188, -0.00020122528076171875, -0.00019311904907226562, -0.0001850128173828125, -0.00017690658569335938, -0.00016880035400390625, -0.00016069412231445312, -0.000152587890625, -0.00014448165893554688, -0.00013637542724609375, -0.00012826919555664062, -0.0001201629638671875, -0.00011205673217773438, -0.00010395050048828125, -9.584426879882812e-05, -8.7738037109375e-05, -7.963180541992188e-05, -7.152557373046875e-05, -6.341934204101562e-05, -5.53131103515625e-05, -4.7206878662109375e-05, -3.910064697265625e-05, -3.0994415283203125e-05, -2.288818359375e-05, -1.4781951904296875e-05, -6.67572021484375e-06, 1.430511474609375e-06, 9.5367431640625e-06, 1.7642974853515625e-05, 2.574920654296875e-05, 3.3855438232421875e-05, 4.1961669921875e-05, 5.0067901611328125e-05, 5.817413330078125e-05, 6.628036499023438e-05, 7.43865966796875e-05, 8.249282836914062e-05, 9.059906005859375e-05, 9.870529174804688e-05, 0.0001068115234375, 0.00011491775512695312, 0.00012302398681640625, 0.00013113021850585938, 0.0001392364501953125, 0.00014734268188476562, 0.00015544891357421875, 0.00016355514526367188, 0.000171661376953125, 0.00017976760864257812, 0.00018787384033203125, 0.00019598007202148438, 0.0002040863037109375, 0.00021219253540039062, 0.00022029876708984375, 0.00022840499877929688, 0.00023651123046875, 0.0002446174621582031, 0.00025272369384765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 10.0, 16.0, 24.0, 32.0, 46.0, 87.0, 124.0, 193.0, 344.0, 686.0, 1158.0, 2549.0, 6665.0, 23055.0, 108089.0, 688765.0, 169311.0, 32165.0, 8869.0, 3075.0, 1402.0, 752.0, 427.0, 226.0, 148.0, 115.0, 65.0, 41.0, 31.0, 23.0, 8.0, 11.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7242584228515625, -0.697052001953125, -0.6698455810546875, -0.64263916015625, -0.6154327392578125, -0.588226318359375, -0.5610198974609375, -0.5338134765625, -0.5066070556640625, -0.479400634765625, -0.4521942138671875, -0.42498779296875, -0.3977813720703125, -0.370574951171875, -0.3433685302734375, -0.316162109375, -0.2889556884765625, -0.261749267578125, -0.2345428466796875, -0.20733642578125, -0.1801300048828125, -0.152923583984375, -0.1257171630859375, -0.0985107421875, -0.0713043212890625, -0.044097900390625, -0.0168914794921875, 0.01031494140625, 0.0375213623046875, 0.064727783203125, 0.0919342041015625, 0.119140625, 0.1463470458984375, 0.173553466796875, 0.2007598876953125, 0.22796630859375, 0.2551727294921875, 0.282379150390625, 0.3095855712890625, 0.3367919921875, 0.3639984130859375, 0.391204833984375, 0.4184112548828125, 0.44561767578125, 0.4728240966796875, 0.500030517578125, 0.5272369384765625, 0.554443359375, 0.5816497802734375, 0.608856201171875, 0.6360626220703125, 0.66326904296875, 0.6904754638671875, 0.717681884765625, 0.7448883056640625, 0.7720947265625, 0.7993011474609375, 0.826507568359375, 0.8537139892578125, 0.88092041015625, 0.9081268310546875, 0.935333251953125, 0.9625396728515625, 0.98974609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 8.0, 12.0, 8.0, 7.0, 17.0, 25.0, 31.0, 38.0, 50.0, 62.0, 78.0, 94.0, 86.0, 85.0, 86.0, 63.0, 48.0, 32.0, 26.0, 27.0, 24.0, 18.0, 18.0, 12.0, 6.0, 4.0, 11.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73193359375, -0.7071914672851562, -0.6824493408203125, -0.6577072143554688, -0.632965087890625, -0.6082229614257812, -0.5834808349609375, -0.5587387084960938, -0.53399658203125, -0.5092544555664062, -0.4845123291015625, -0.45977020263671875, -0.435028076171875, -0.41028594970703125, -0.3855438232421875, -0.36080169677734375, -0.3360595703125, -0.31131744384765625, -0.2865753173828125, -0.26183319091796875, -0.237091064453125, -0.21234893798828125, -0.1876068115234375, -0.16286468505859375, -0.13812255859375, -0.11338043212890625, -0.0886383056640625, -0.06389617919921875, -0.039154052734375, -0.01441192626953125, 0.0103302001953125, 0.03507232666015625, 0.059814453125, 0.08455657958984375, 0.1092987060546875, 0.13404083251953125, 0.158782958984375, 0.18352508544921875, 0.2082672119140625, 0.23300933837890625, 0.25775146484375, 0.28249359130859375, 0.3072357177734375, 0.33197784423828125, 0.356719970703125, 0.38146209716796875, 0.4062042236328125, 0.43094635009765625, 0.4556884765625, 0.48043060302734375, 0.5051727294921875, 0.5299148559570312, 0.554656982421875, 0.5793991088867188, 0.6041412353515625, 0.6288833618164062, 0.65362548828125, 0.6783676147460938, 0.7031097412109375, 0.7278518676757812, 0.752593994140625, 0.7773361206054688, 0.8020782470703125, 0.8268203735351562, 0.8515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 10.0, 17.0, 64.0, 166.0, 432.0, 196.0, 67.0, 26.0, 8.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.84894561767578, -36.7847785949707, -35.720611572265625, -34.65644073486328, -33.5922737121582, -32.528106689453125, -31.463937759399414, -30.399768829345703, -29.335601806640625, -28.271434783935547, -27.207265853881836, -26.143096923828125, -25.078929901123047, -24.01476287841797, -22.950593948364258, -21.886425018310547, -20.82225799560547, -19.75809097290039, -18.69392204284668, -17.62975311279297, -16.56558609008789, -15.501418113708496, -14.437250137329102, -13.373082160949707, -12.308914184570312, -11.244746208190918, -10.180578231811523, -9.116410255432129, -8.052242279052734, -6.98807430267334, -5.923906326293945, -4.859738349914551, -3.795574188232422, -2.7314062118530273, -1.6672382354736328, -0.6030702590942383, 0.46109771728515625, 1.5252656936645508, 2.5894336700439453, 3.65360164642334, 4.717769622802734, 5.781937599182129, 6.846105575561523, 7.910273551940918, 8.974441528320312, 10.038609504699707, 11.102777481079102, 12.166945457458496, 13.23111343383789, 14.295281410217285, 15.35944938659668, 16.42361831665039, 17.48778533935547, 18.551952362060547, 19.616121292114258, 20.68029022216797, 21.744457244873047, 22.808624267578125, 23.872793197631836, 24.936962127685547, 26.001129150390625, 27.065296173095703, 28.129465103149414, 29.193634033203125, 30.257801055908203]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 12.0, 16.0, 9.0, 9.0, 14.0, 21.0, 30.0, 33.0, 30.0, 49.0, 47.0, 34.0, 71.0, 60.0, 71.0, 77.0, 69.0, 40.0, 38.0, 35.0, 42.0, 18.0, 34.0, 23.0, 22.0, 14.0, 11.0, 12.0, 11.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.929452896118164, -9.5798978805542, -9.230341911315918, -8.880786895751953, -8.531230926513672, -8.181675910949707, -7.832120418548584, -7.482564926147461, -7.133009910583496, -6.783454418182373, -6.43389892578125, -6.084343910217285, -5.734788417816162, -5.385232925415039, -5.035677433013916, -4.686121940612793, -4.33656644821167, -3.987010955810547, -3.637455701828003, -3.28790020942688, -2.938344955444336, -2.588789463043213, -2.23923397064209, -1.889678716659546, -1.5401232242584229, -1.1905678510665894, -0.8410124182701111, -0.4914569854736328, -0.14190161228179932, 0.20765376091003418, 0.5572092533111572, 0.9067645072937012, 1.2563199996948242, 1.6058753728866577, 1.9554307460784912, 2.3049862384796143, 2.654541492462158, 3.0040969848632812, 3.3536524772644043, 3.7032077312469482, 4.052762985229492, 4.402318477630615, 4.751873970031738, 5.101428985595703, 5.450984477996826, 5.800539970397949, 6.150095462799072, 6.499650955200195, 6.849206447601318, 7.198761940002441, 7.5483174324035645, 7.8978729248046875, 8.247427940368652, 8.596982955932617, 8.946538925170898, 9.296093940734863, 9.645649909973145, 9.99520492553711, 10.34476089477539, 10.694315910339355, 11.043871879577637, 11.393426895141602, 11.742982864379883, 12.092537879943848, 12.442092895507812]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 19.0, 13.0, 26.0, 44.0, 95.0, 186.0, 405.0, 1184.0, 4361.0, 24405.0, 338349.0, 3553119.0, 245353.0, 20902.0, 3990.0, 1078.0, 396.0, 161.0, 86.0, 41.0, 20.0, 15.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.9644622802734375, -1.907440185546875, -1.8504180908203125, -1.79339599609375, -1.7363739013671875, -1.679351806640625, -1.6223297119140625, -1.5653076171875, -1.5082855224609375, -1.451263427734375, -1.3942413330078125, -1.33721923828125, -1.2801971435546875, -1.223175048828125, -1.1661529541015625, -1.109130859375, -1.0521087646484375, -0.995086669921875, -0.9380645751953125, -0.88104248046875, -0.8240203857421875, -0.766998291015625, -0.7099761962890625, -0.6529541015625, -0.5959320068359375, -0.538909912109375, -0.4818878173828125, -0.42486572265625, -0.3678436279296875, -0.310821533203125, -0.2537994384765625, -0.19677734375, -0.1397552490234375, -0.082733154296875, -0.0257110595703125, 0.03131103515625, 0.0883331298828125, 0.145355224609375, 0.2023773193359375, 0.2593994140625, 0.3164215087890625, 0.373443603515625, 0.4304656982421875, 0.48748779296875, 0.5445098876953125, 0.601531982421875, 0.6585540771484375, 0.715576171875, 0.7725982666015625, 0.829620361328125, 0.8866424560546875, 0.94366455078125, 1.0006866455078125, 1.057708740234375, 1.1147308349609375, 1.1717529296875, 1.2287750244140625, 1.285797119140625, 1.3428192138671875, 1.39984130859375, 1.4568634033203125, 1.513885498046875, 1.5709075927734375, 1.6279296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 18.0, 18.0, 24.0, 27.0, 44.0, 41.0, 41.0, 70.0, 64.0, 81.0, 69.0, 73.0, 71.0, 75.0, 64.0, 59.0, 39.0, 26.0, 31.0, 15.0, 13.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.359375, -1.3295745849609375, -1.299774169921875, -1.2699737548828125, -1.24017333984375, -1.2103729248046875, -1.180572509765625, -1.1507720947265625, -1.1209716796875, -1.0911712646484375, -1.061370849609375, -1.0315704345703125, -1.00177001953125, -0.9719696044921875, -0.942169189453125, -0.9123687744140625, -0.882568359375, -0.8527679443359375, -0.822967529296875, -0.7931671142578125, -0.76336669921875, -0.7335662841796875, -0.703765869140625, -0.6739654541015625, -0.6441650390625, -0.6143646240234375, -0.584564208984375, -0.5547637939453125, -0.52496337890625, -0.4951629638671875, -0.465362548828125, -0.4355621337890625, -0.40576171875, -0.3759613037109375, -0.346160888671875, -0.3163604736328125, -0.28656005859375, -0.2567596435546875, -0.226959228515625, -0.1971588134765625, -0.1673583984375, -0.1375579833984375, -0.107757568359375, -0.0779571533203125, -0.04815673828125, -0.0183563232421875, 0.011444091796875, 0.0412445068359375, 0.071044921875, 0.1008453369140625, 0.130645751953125, 0.1604461669921875, 0.19024658203125, 0.2200469970703125, 0.249847412109375, 0.2796478271484375, 0.3094482421875, 0.3392486572265625, 0.369049072265625, 0.3988494873046875, 0.42864990234375, 0.4584503173828125, 0.488250732421875, 0.5180511474609375, 0.5478515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 15.0, 35.0, 61.0, 88.0, 168.0, 379.0, 789.0, 2099.0, 6085.0, 29776.0, 549361.0, 3481500.0, 105856.0, 12708.0, 3265.0, 1173.0, 416.0, 230.0, 100.0, 59.0, 28.0, 14.0, 17.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.8797607421875, -2.802490234375, -2.7252197265625, -2.64794921875, -2.5706787109375, -2.493408203125, -2.4161376953125, -2.3388671875, -2.2615966796875, -2.184326171875, -2.1070556640625, -2.02978515625, -1.9525146484375, -1.875244140625, -1.7979736328125, -1.720703125, -1.6434326171875, -1.566162109375, -1.4888916015625, -1.41162109375, -1.3343505859375, -1.257080078125, -1.1798095703125, -1.1025390625, -1.0252685546875, -0.947998046875, -0.8707275390625, -0.79345703125, -0.7161865234375, -0.638916015625, -0.5616455078125, -0.484375, -0.4071044921875, -0.329833984375, -0.2525634765625, -0.17529296875, -0.0980224609375, -0.020751953125, 0.0565185546875, 0.1337890625, 0.2110595703125, 0.288330078125, 0.3656005859375, 0.44287109375, 0.5201416015625, 0.597412109375, 0.6746826171875, 0.751953125, 0.8292236328125, 0.906494140625, 0.9837646484375, 1.06103515625, 1.1383056640625, 1.215576171875, 1.2928466796875, 1.3701171875, 1.4473876953125, 1.524658203125, 1.6019287109375, 1.67919921875, 1.7564697265625, 1.833740234375, 1.9110107421875, 1.98828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 4.0, 18.0, 16.0, 32.0, 64.0, 93.0, 165.0, 306.0, 700.0, 974.0, 795.0, 402.0, 201.0, 96.0, 69.0, 38.0, 24.0, 20.0, 4.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.703399658203125, -2.63531494140625, -2.567230224609375, -2.4991455078125, -2.431060791015625, -2.36297607421875, -2.294891357421875, -2.226806640625, -2.158721923828125, -2.09063720703125, -2.022552490234375, -1.9544677734375, -1.886383056640625, -1.81829833984375, -1.750213623046875, -1.68212890625, -1.614044189453125, -1.54595947265625, -1.477874755859375, -1.4097900390625, -1.341705322265625, -1.27362060546875, -1.205535888671875, -1.137451171875, -1.069366455078125, -1.00128173828125, -0.933197021484375, -0.8651123046875, -0.797027587890625, -0.72894287109375, -0.660858154296875, -0.5927734375, -0.524688720703125, -0.45660400390625, -0.388519287109375, -0.3204345703125, -0.252349853515625, -0.18426513671875, -0.116180419921875, -0.048095703125, 0.019989013671875, 0.08807373046875, 0.156158447265625, 0.2242431640625, 0.292327880859375, 0.36041259765625, 0.428497314453125, 0.49658203125, 0.564666748046875, 0.63275146484375, 0.700836181640625, 0.7689208984375, 0.837005615234375, 0.90509033203125, 0.973175048828125, 1.041259765625, 1.109344482421875, 1.17742919921875, 1.245513916015625, 1.3135986328125, 1.381683349609375, 1.44976806640625, 1.517852783203125, 1.5859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 4.0, 7.0, 20.0, 63.0, 215.0, 390.0, 214.0, 48.0, 18.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.615047454833984, -43.541160583496094, -42.46727752685547, -41.39339065551758, -40.31950759887695, -39.24562072753906, -38.17173767089844, -37.09785079956055, -36.02396774291992, -34.95008087158203, -33.876197814941406, -32.802310943603516, -31.72842788696289, -30.654542922973633, -29.580657958984375, -28.506771087646484, -27.432886123657227, -26.35900115966797, -25.28511619567871, -24.211231231689453, -23.137346267700195, -22.063461303710938, -20.989574432373047, -19.915691375732422, -18.84180450439453, -17.767919540405273, -16.694034576416016, -15.620149612426758, -14.5462646484375, -13.472379684448242, -12.398493766784668, -11.32460880279541, -10.250724792480469, -9.176839828491211, -8.102954864501953, -7.029069423675537, -5.955184459686279, -4.8812994956970215, -3.8074140548706055, -2.7335290908813477, -1.6596441268920898, -0.5857590436935425, 0.4881260395050049, 1.5620112419128418, 2.6358962059020996, 3.7097811698913574, 4.783666610717773, 5.857551574707031, 6.931436538696289, 8.005321502685547, 9.079206466674805, 10.153091430664062, 11.22697639465332, 12.300861358642578, 13.374747276306152, 14.44863224029541, 15.522517204284668, 16.596403121948242, 17.6702880859375, 18.744173049926758, 19.818058013916016, 20.891942977905273, 21.96582794189453, 23.03971290588379, 24.113597869873047]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 11.0, 6.0, 14.0, 16.0, 20.0, 31.0, 32.0, 41.0, 42.0, 57.0, 55.0, 60.0, 67.0, 65.0, 69.0, 67.0, 60.0, 67.0, 41.0, 38.0, 27.0, 25.0, 27.0, 14.0, 14.0, 8.0, 9.0, 3.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.014646530151367, -8.716702461242676, -8.418757438659668, -8.120813369750977, -7.822869300842285, -7.5249247550964355, -7.226980209350586, -6.9290361404418945, -6.631091594696045, -6.333147048950195, -6.035202980041504, -5.737258434295654, -5.439313888549805, -5.141369819641113, -4.843425273895264, -4.545480728149414, -4.247536659240723, -3.949592351913452, -3.6516480445861816, -3.353703498840332, -3.0557591915130615, -2.757814884185791, -2.4598703384399414, -2.161926031112671, -1.8639817237854004, -1.5660374164581299, -1.2680929899215698, -0.9701486229896545, -0.6722042560577393, -0.37425994873046875, -0.07631552219390869, 0.22162890434265137, 0.5195732116699219, 0.8175175786018372, 1.1154619455337524, 1.4134063720703125, 1.711350679397583, 2.0092949867248535, 2.307239532470703, 2.6051838397979736, 2.903128147125244, 3.2010724544525146, 3.499016761779785, 3.7969613075256348, 4.094905853271484, 4.392849922180176, 4.690794467926025, 4.988739013671875, 5.286683082580566, 5.584627628326416, 5.882571697235107, 6.180516242980957, 6.478460311889648, 6.776404857635498, 7.074349403381348, 7.372293472290039, 7.670238018035889, 7.968182563781738, 8.26612663269043, 8.564070701599121, 8.862015724182129, 9.15995979309082, 9.457903861999512, 9.75584888458252, 10.053792953491211]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 8.0, 13.0, 20.0, 39.0, 37.0, 93.0, 190.0, 338.0, 877.0, 2121.0, 6428.0, 27219.0, 213558.0, 646271.0, 125099.0, 18198.0, 4970.0, 1684.0, 694.0, 306.0, 143.0, 75.0, 34.0, 35.0, 25.0, 14.0, 11.0, 10.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5157928466796875, -1.464202880859375, -1.4126129150390625, -1.36102294921875, -1.3094329833984375, -1.257843017578125, -1.2062530517578125, -1.1546630859375, -1.1030731201171875, -1.051483154296875, -0.9998931884765625, -0.94830322265625, -0.8967132568359375, -0.845123291015625, -0.7935333251953125, -0.741943359375, -0.6903533935546875, -0.638763427734375, -0.5871734619140625, -0.53558349609375, -0.4839935302734375, -0.432403564453125, -0.3808135986328125, -0.3292236328125, -0.2776336669921875, -0.226043701171875, -0.1744537353515625, -0.12286376953125, -0.0712738037109375, -0.019683837890625, 0.0319061279296875, 0.08349609375, 0.1350860595703125, 0.186676025390625, 0.2382659912109375, 0.28985595703125, 0.3414459228515625, 0.393035888671875, 0.4446258544921875, 0.4962158203125, 0.5478057861328125, 0.599395751953125, 0.6509857177734375, 0.70257568359375, 0.7541656494140625, 0.805755615234375, 0.8573455810546875, 0.908935546875, 0.9605255126953125, 1.012115478515625, 1.0637054443359375, 1.11529541015625, 1.1668853759765625, 1.218475341796875, 1.2700653076171875, 1.3216552734375, 1.3732452392578125, 1.424835205078125, 1.4764251708984375, 1.52801513671875, 1.5796051025390625, 1.631195068359375, 1.6827850341796875, 1.734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 10.0, 15.0, 28.0, 20.0, 36.0, 32.0, 53.0, 62.0, 59.0, 67.0, 77.0, 68.0, 70.0, 78.0, 60.0, 51.0, 59.0, 53.0, 29.0, 26.0, 11.0, 12.0, 11.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3310546875, -1.2988510131835938, -1.2666473388671875, -1.2344436645507812, -1.202239990234375, -1.1700363159179688, -1.1378326416015625, -1.1056289672851562, -1.07342529296875, -1.0412216186523438, -1.0090179443359375, -0.9768142700195312, -0.944610595703125, -0.9124069213867188, -0.8802032470703125, -0.8479995727539062, -0.8157958984375, -0.7835922241210938, -0.7513885498046875, -0.7191848754882812, -0.686981201171875, -0.6547775268554688, -0.6225738525390625, -0.5903701782226562, -0.55816650390625, -0.5259628295898438, -0.4937591552734375, -0.46155548095703125, -0.429351806640625, -0.39714813232421875, -0.3649444580078125, -0.33274078369140625, -0.300537109375, -0.26833343505859375, -0.2361297607421875, -0.20392608642578125, -0.171722412109375, -0.13951873779296875, -0.1073150634765625, -0.07511138916015625, -0.04290771484375, -0.01070404052734375, 0.0214996337890625, 0.05370330810546875, 0.085906982421875, 0.11811065673828125, 0.1503143310546875, 0.18251800537109375, 0.2147216796875, 0.24692535400390625, 0.2791290283203125, 0.31133270263671875, 0.343536376953125, 0.37574005126953125, 0.4079437255859375, 0.44014739990234375, 0.47235107421875, 0.5045547485351562, 0.5367584228515625, 0.5689620971679688, 0.601165771484375, 0.6333694458007812, 0.6655731201171875, 0.6977767944335938, 0.72998046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 13.0, 24.0, 24.0, 39.0, 48.0, 71.0, 121.0, 221.0, 343.0, 689.0, 1566.0, 3795.0, 13313.0, 85441.0, 669559.0, 232385.0, 29858.0, 6559.0, 2302.0, 981.0, 467.0, 254.0, 147.0, 75.0, 66.0, 45.0, 27.0, 28.0, 15.0, 8.0, 11.0, 11.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.59375, -1.5465087890625, -1.499267578125, -1.4520263671875, -1.40478515625, -1.3575439453125, -1.310302734375, -1.2630615234375, -1.2158203125, -1.1685791015625, -1.121337890625, -1.0740966796875, -1.02685546875, -0.9796142578125, -0.932373046875, -0.8851318359375, -0.837890625, -0.7906494140625, -0.743408203125, -0.6961669921875, -0.64892578125, -0.6016845703125, -0.554443359375, -0.5072021484375, -0.4599609375, -0.4127197265625, -0.365478515625, -0.3182373046875, -0.27099609375, -0.2237548828125, -0.176513671875, -0.1292724609375, -0.08203125, -0.0347900390625, 0.012451171875, 0.0596923828125, 0.10693359375, 0.1541748046875, 0.201416015625, 0.2486572265625, 0.2958984375, 0.3431396484375, 0.390380859375, 0.4376220703125, 0.48486328125, 0.5321044921875, 0.579345703125, 0.6265869140625, 0.673828125, 0.7210693359375, 0.768310546875, 0.8155517578125, 0.86279296875, 0.9100341796875, 0.957275390625, 1.0045166015625, 1.0517578125, 1.0989990234375, 1.146240234375, 1.1934814453125, 1.24072265625, 1.2879638671875, 1.335205078125, 1.3824462890625, 1.4296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 9.0, 8.0, 18.0, 20.0, 25.0, 16.0, 39.0, 42.0, 56.0, 47.0, 43.0, 50.0, 63.0, 55.0, 75.0, 54.0, 55.0, 56.0, 38.0, 46.0, 35.0, 30.0, 28.0, 27.0, 18.0, 5.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.241455078125, -2.15087890625, -2.060302734375, -1.9697265625, -1.879150390625, -1.78857421875, -1.697998046875, -1.607421875, -1.516845703125, -1.42626953125, -1.335693359375, -1.2451171875, -1.154541015625, -1.06396484375, -0.973388671875, -0.8828125, -0.792236328125, -0.70166015625, -0.611083984375, -0.5205078125, -0.429931640625, -0.33935546875, -0.248779296875, -0.158203125, -0.067626953125, 0.02294921875, 0.113525390625, 0.2041015625, 0.294677734375, 0.38525390625, 0.475830078125, 0.56640625, 0.656982421875, 0.74755859375, 0.838134765625, 0.9287109375, 1.019287109375, 1.10986328125, 1.200439453125, 1.291015625, 1.381591796875, 1.47216796875, 1.562744140625, 1.6533203125, 1.743896484375, 1.83447265625, 1.925048828125, 2.015625, 2.106201171875, 2.19677734375, 2.287353515625, 2.3779296875, 2.468505859375, 2.55908203125, 2.649658203125, 2.740234375, 2.830810546875, 2.92138671875, 3.011962890625, 3.1025390625, 3.193115234375, 3.28369140625, 3.374267578125, 3.46484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 9.0, 15.0, 19.0, 25.0, 19.0, 36.0, 82.0, 135.0, 250.0, 610.0, 1288.0, 3138.0, 8527.0, 28152.0, 124765.0, 639004.0, 185569.0, 38701.0, 11171.0, 3912.0, 1633.0, 710.0, 362.0, 171.0, 86.0, 55.0, 38.0, 20.0, 15.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5498046875, -0.5334510803222656, -0.5170974731445312, -0.5007438659667969, -0.4843902587890625, -0.4680366516113281, -0.45168304443359375, -0.4353294372558594, -0.418975830078125, -0.4026222229003906, -0.38626861572265625, -0.3699150085449219, -0.3535614013671875, -0.3372077941894531, -0.32085418701171875, -0.3045005798339844, -0.28814697265625, -0.2717933654785156, -0.25543975830078125, -0.23908615112304688, -0.2227325439453125, -0.20637893676757812, -0.19002532958984375, -0.17367172241210938, -0.157318115234375, -0.14096450805664062, -0.12461090087890625, -0.10825729370117188, -0.0919036865234375, -0.07555007934570312, -0.05919647216796875, -0.042842864990234375, -0.0264892578125, -0.010135650634765625, 0.00621795654296875, 0.022571563720703125, 0.0389251708984375, 0.055278778076171875, 0.07163238525390625, 0.08798599243164062, 0.104339599609375, 0.12069320678710938, 0.13704681396484375, 0.15340042114257812, 0.1697540283203125, 0.18610763549804688, 0.20246124267578125, 0.21881484985351562, 0.23516845703125, 0.2515220642089844, 0.26787567138671875, 0.2842292785644531, 0.3005828857421875, 0.3169364929199219, 0.33329010009765625, 0.3496437072753906, 0.365997314453125, 0.3823509216308594, 0.39870452880859375, 0.4150581359863281, 0.4314117431640625, 0.4477653503417969, 0.46411895751953125, 0.4804725646972656, 0.496826171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 12.0, 18.0, 16.0, 35.0, 57.0, 93.0, 144.0, 175.0, 176.0, 102.0, 73.0, 32.0, 22.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000270843505859375, -0.0002632215619087219, -0.00025559961795806885, -0.00024797767400741577, -0.0002403557300567627, -0.00023273378610610962, -0.00022511184215545654, -0.00021748989820480347, -0.0002098679542541504, -0.00020224601030349731, -0.00019462406635284424, -0.00018700212240219116, -0.00017938017845153809, -0.000171758234500885, -0.00016413629055023193, -0.00015651434659957886, -0.00014889240264892578, -0.0001412704586982727, -0.00013364851474761963, -0.00012602657079696655, -0.00011840462684631348, -0.0001107826828956604, -0.00010316073894500732, -9.553879499435425e-05, -8.791685104370117e-05, -8.02949070930481e-05, -7.267296314239502e-05, -6.505101919174194e-05, -5.742907524108887e-05, -4.980713129043579e-05, -4.2185187339782715e-05, -3.456324338912964e-05, -2.6941299438476562e-05, -1.9319355487823486e-05, -1.169741153717041e-05, -4.075467586517334e-06, 3.546476364135742e-06, 1.1168420314788818e-05, 1.8790364265441895e-05, 2.641230821609497e-05, 3.403425216674805e-05, 4.165619611740112e-05, 4.92781400680542e-05, 5.6900084018707275e-05, 6.452202796936035e-05, 7.214397192001343e-05, 7.97659158706665e-05, 8.738785982131958e-05, 9.500980377197266e-05, 0.00010263174772262573, 0.00011025369167327881, 0.00011787563562393188, 0.00012549757957458496, 0.00013311952352523804, 0.0001407414674758911, 0.0001483634114265442, 0.00015598535537719727, 0.00016360729932785034, 0.00017122924327850342, 0.0001788511872291565, 0.00018647313117980957, 0.00019409507513046265, 0.00020171701908111572, 0.0002093389630317688, 0.00021696090698242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 17.0, 17.0, 26.0, 24.0, 36.0, 68.0, 99.0, 200.0, 328.0, 637.0, 1554.0, 3890.0, 11349.0, 41087.0, 189892.0, 622983.0, 131790.0, 30084.0, 8838.0, 3077.0, 1245.0, 526.0, 307.0, 153.0, 103.0, 61.0, 42.0, 31.0, 17.0, 20.0, 14.0, 7.0, 5.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.607421875, -0.5902557373046875, -0.573089599609375, -0.5559234619140625, -0.53875732421875, -0.5215911865234375, -0.504425048828125, -0.4872589111328125, -0.4700927734375, -0.4529266357421875, -0.435760498046875, -0.4185943603515625, -0.40142822265625, -0.3842620849609375, -0.367095947265625, -0.3499298095703125, -0.332763671875, -0.3155975341796875, -0.298431396484375, -0.2812652587890625, -0.26409912109375, -0.2469329833984375, -0.229766845703125, -0.2126007080078125, -0.1954345703125, -0.1782684326171875, -0.161102294921875, -0.1439361572265625, -0.12677001953125, -0.1096038818359375, -0.092437744140625, -0.0752716064453125, -0.05810546875, -0.0409393310546875, -0.023773193359375, -0.0066070556640625, 0.01055908203125, 0.0277252197265625, 0.044891357421875, 0.0620574951171875, 0.0792236328125, 0.0963897705078125, 0.113555908203125, 0.1307220458984375, 0.14788818359375, 0.1650543212890625, 0.182220458984375, 0.1993865966796875, 0.216552734375, 0.2337188720703125, 0.250885009765625, 0.2680511474609375, 0.28521728515625, 0.3023834228515625, 0.319549560546875, 0.3367156982421875, 0.3538818359375, 0.3710479736328125, 0.388214111328125, 0.4053802490234375, 0.42254638671875, 0.4397125244140625, 0.456878662109375, 0.4740447998046875, 0.4912109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 7.0, 14.0, 24.0, 22.0, 39.0, 44.0, 65.0, 97.0, 110.0, 103.0, 111.0, 95.0, 62.0, 58.0, 33.0, 37.0, 17.0, 18.0, 9.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.942718505859375, -0.92059326171875, -0.898468017578125, -0.8763427734375, -0.854217529296875, -0.83209228515625, -0.809967041015625, -0.787841796875, -0.765716552734375, -0.74359130859375, -0.721466064453125, -0.6993408203125, -0.677215576171875, -0.65509033203125, -0.632965087890625, -0.61083984375, -0.588714599609375, -0.56658935546875, -0.544464111328125, -0.5223388671875, -0.500213623046875, -0.47808837890625, -0.455963134765625, -0.433837890625, -0.411712646484375, -0.38958740234375, -0.367462158203125, -0.3453369140625, -0.323211669921875, -0.30108642578125, -0.278961181640625, -0.2568359375, -0.234710693359375, -0.21258544921875, -0.190460205078125, -0.1683349609375, -0.146209716796875, -0.12408447265625, -0.101959228515625, -0.079833984375, -0.057708740234375, -0.03558349609375, -0.013458251953125, 0.0086669921875, 0.030792236328125, 0.05291748046875, 0.075042724609375, 0.09716796875, 0.119293212890625, 0.14141845703125, 0.163543701171875, 0.1856689453125, 0.207794189453125, 0.22991943359375, 0.252044677734375, 0.274169921875, 0.296295166015625, 0.31842041015625, 0.340545654296875, 0.3626708984375, 0.384796142578125, 0.40692138671875, 0.429046630859375, 0.451171875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 18.0, 29.0, 70.0, 174.0, 319.0, 210.0, 97.0, 28.0, 16.0, 13.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.155841827392578, -24.617198944091797, -24.078556060791016, -23.539913177490234, -23.001270294189453, -22.462627410888672, -21.92398452758789, -21.385339736938477, -20.846696853637695, -20.308053970336914, -19.769411087036133, -19.23076820373535, -18.69212532043457, -18.153480529785156, -17.614837646484375, -17.076194763183594, -16.537551879882812, -15.998908996582031, -15.46026611328125, -14.921623229980469, -14.382979393005371, -13.84433650970459, -13.305693626403809, -12.767050743103027, -12.228408813476562, -11.689765930175781, -11.151123046875, -10.612480163574219, -10.073836326599121, -9.53519344329834, -8.996550559997559, -8.457907676696777, -7.91926383972168, -7.380620956420898, -6.841977596282959, -6.303334712982178, -5.764691352844238, -5.226048469543457, -4.687405586242676, -4.1487627029418945, -3.610119342803955, -3.0714762210845947, -2.5328330993652344, -1.9941902160644531, -1.4555470943450928, -0.9169039726257324, -0.37826108932495117, 0.16038203239440918, 0.6990251541137695, 1.2376682758331299, 1.7763112783432007, 2.3149542808532715, 2.853597402572632, 3.392240524291992, 3.9308834075927734, 4.469526290893555, 5.008169651031494, 5.546812534332275, 6.085455894470215, 6.624098777770996, 7.162741661071777, 7.701385021209717, 8.240028381347656, 8.778671264648438, 9.317314147949219]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 16.0, 17.0, 18.0, 15.0, 31.0, 25.0, 36.0, 35.0, 47.0, 53.0, 61.0, 92.0, 81.0, 75.0, 55.0, 41.0, 48.0, 33.0, 35.0, 29.0, 34.0, 25.0, 15.0, 15.0, 10.0, 10.0, 11.0, 11.0, 4.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9634370803833, -9.612728118896484, -9.262018203735352, -8.911308288574219, -8.560599327087402, -8.209890365600586, -7.859180450439453, -7.5084710121154785, -7.157761573791504, -6.807052135467529, -6.456342697143555, -6.10563325881958, -5.7549238204956055, -5.404214382171631, -5.053504943847656, -4.702795505523682, -4.352086067199707, -4.001376628875732, -3.650667190551758, -3.299957752227783, -2.9492483139038086, -2.598538875579834, -2.2478294372558594, -1.8971199989318848, -1.5464105606079102, -1.1957011222839355, -0.8449916839599609, -0.49428224563598633, -0.14357280731201172, 0.2071366310119629, 0.5578460693359375, 0.9085555076599121, 1.2592658996582031, 1.6099753379821777, 1.9606847763061523, 2.311394214630127, 2.6621036529541016, 3.012813091278076, 3.363522529602051, 3.7142319679260254, 4.06494140625, 4.415650844573975, 4.766360282897949, 5.117069721221924, 5.467779159545898, 5.818488597869873, 6.169198036193848, 6.519907474517822, 6.870616912841797, 7.2213263511657715, 7.572035789489746, 7.922745227813721, 8.273454666137695, 8.624164581298828, 8.974873542785645, 9.325582504272461, 9.676292419433594, 10.027002334594727, 10.377711296081543, 10.72842025756836, 11.079130172729492, 11.429840087890625, 11.780549049377441, 12.131258010864258, 12.48196792602539]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 15.0, 15.0, 26.0, 33.0, 48.0, 70.0, 84.0, 174.0, 245.0, 428.0, 687.0, 1344.0, 2680.0, 5547.0, 13351.0, 38956.0, 160786.0, 1070569.0, 2348903.0, 431282.0, 79517.0, 23009.0, 8520.0, 3869.0, 1832.0, 921.0, 459.0, 318.0, 191.0, 112.0, 77.0, 59.0, 38.0, 21.0, 9.0, 15.0, 11.0, 9.0, 9.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.81005859375, -0.784149169921875, -0.75823974609375, -0.732330322265625, -0.7064208984375, -0.680511474609375, -0.65460205078125, -0.628692626953125, -0.602783203125, -0.576873779296875, -0.55096435546875, -0.525054931640625, -0.4991455078125, -0.473236083984375, -0.44732666015625, -0.421417236328125, -0.3955078125, -0.369598388671875, -0.34368896484375, -0.317779541015625, -0.2918701171875, -0.265960693359375, -0.24005126953125, -0.214141845703125, -0.188232421875, -0.162322998046875, -0.13641357421875, -0.110504150390625, -0.0845947265625, -0.058685302734375, -0.03277587890625, -0.006866455078125, 0.01904296875, 0.044952392578125, 0.07086181640625, 0.096771240234375, 0.1226806640625, 0.148590087890625, 0.17449951171875, 0.200408935546875, 0.226318359375, 0.252227783203125, 0.27813720703125, 0.304046630859375, 0.3299560546875, 0.355865478515625, 0.38177490234375, 0.407684326171875, 0.43359375, 0.459503173828125, 0.48541259765625, 0.511322021484375, 0.5372314453125, 0.563140869140625, 0.58905029296875, 0.614959716796875, 0.640869140625, 0.666778564453125, 0.69268798828125, 0.718597412109375, 0.7445068359375, 0.770416259765625, 0.79632568359375, 0.822235107421875, 0.84814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 10.0, 13.0, 13.0, 15.0, 18.0, 18.0, 19.0, 19.0, 25.0, 22.0, 28.0, 34.0, 30.0, 35.0, 39.0, 40.0, 32.0, 32.0, 40.0, 46.0, 47.0, 38.0, 37.0, 39.0, 31.0, 28.0, 31.0, 30.0, 31.0, 27.0, 17.0, 12.0, 16.0, 19.0, 8.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.5185546875, -0.5024642944335938, -0.4863739013671875, -0.47028350830078125, -0.454193115234375, -0.43810272216796875, -0.4220123291015625, -0.40592193603515625, -0.38983154296875, -0.37374114990234375, -0.3576507568359375, -0.34156036376953125, -0.325469970703125, -0.30937957763671875, -0.2932891845703125, -0.27719879150390625, -0.2611083984375, -0.24501800537109375, -0.2289276123046875, -0.21283721923828125, -0.196746826171875, -0.18065643310546875, -0.1645660400390625, -0.14847564697265625, -0.13238525390625, -0.11629486083984375, -0.1002044677734375, -0.08411407470703125, -0.068023681640625, -0.05193328857421875, -0.0358428955078125, -0.01975250244140625, -0.003662109375, 0.01242828369140625, 0.0285186767578125, 0.04460906982421875, 0.060699462890625, 0.07678985595703125, 0.0928802490234375, 0.10897064208984375, 0.12506103515625, 0.14115142822265625, 0.1572418212890625, 0.17333221435546875, 0.189422607421875, 0.20551300048828125, 0.2216033935546875, 0.23769378662109375, 0.2537841796875, 0.26987457275390625, 0.2859649658203125, 0.30205535888671875, 0.318145751953125, 0.33423614501953125, 0.3503265380859375, 0.36641693115234375, 0.38250732421875, 0.39859771728515625, 0.4146881103515625, 0.43077850341796875, 0.446868896484375, 0.46295928955078125, 0.4790496826171875, 0.49514007568359375, 0.51123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 16.0, 24.0, 65.0, 165.0, 647.0, 5410.0, 1341400.0, 2838023.0, 7389.0, 767.0, 225.0, 79.0, 34.0, 22.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.98883056640625, -4.8331298828125, -4.67742919921875, -4.521728515625, -4.36602783203125, -4.2103271484375, -4.05462646484375, -3.89892578125, -3.74322509765625, -3.5875244140625, -3.43182373046875, -3.276123046875, -3.12042236328125, -2.9647216796875, -2.80902099609375, -2.6533203125, -2.49761962890625, -2.3419189453125, -2.18621826171875, -2.030517578125, -1.87481689453125, -1.7191162109375, -1.56341552734375, -1.40771484375, -1.25201416015625, -1.0963134765625, -0.94061279296875, -0.784912109375, -0.62921142578125, -0.4735107421875, -0.31781005859375, -0.162109375, -0.00640869140625, 0.1492919921875, 0.30499267578125, 0.460693359375, 0.61639404296875, 0.7720947265625, 0.92779541015625, 1.08349609375, 1.23919677734375, 1.3948974609375, 1.55059814453125, 1.706298828125, 1.86199951171875, 2.0177001953125, 2.17340087890625, 2.3291015625, 2.48480224609375, 2.6405029296875, 2.79620361328125, 2.951904296875, 3.10760498046875, 3.2633056640625, 3.41900634765625, 3.57470703125, 3.73040771484375, 3.8861083984375, 4.04180908203125, 4.197509765625, 4.35321044921875, 4.5089111328125, 4.66461181640625, 4.8203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 13.0, 20.0, 22.0, 35.0, 55.0, 95.0, 123.0, 262.0, 412.0, 668.0, 790.0, 582.0, 364.0, 228.0, 105.0, 91.0, 59.0, 40.0, 21.0, 18.0, 13.0, 6.0, 7.0, 7.0, 2.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.271484375, -1.2232666015625, -1.175048828125, -1.1268310546875, -1.07861328125, -1.0303955078125, -0.982177734375, -0.9339599609375, -0.8857421875, -0.8375244140625, -0.789306640625, -0.7410888671875, -0.69287109375, -0.6446533203125, -0.596435546875, -0.5482177734375, -0.5, -0.4517822265625, -0.403564453125, -0.3553466796875, -0.30712890625, -0.2589111328125, -0.210693359375, -0.1624755859375, -0.1142578125, -0.0660400390625, -0.017822265625, 0.0303955078125, 0.07861328125, 0.1268310546875, 0.175048828125, 0.2232666015625, 0.271484375, 0.3197021484375, 0.367919921875, 0.4161376953125, 0.46435546875, 0.5125732421875, 0.560791015625, 0.6090087890625, 0.6572265625, 0.7054443359375, 0.753662109375, 0.8018798828125, 0.85009765625, 0.8983154296875, 0.946533203125, 0.9947509765625, 1.04296875, 1.0911865234375, 1.139404296875, 1.1876220703125, 1.23583984375, 1.2840576171875, 1.332275390625, 1.3804931640625, 1.4287109375, 1.4769287109375, 1.525146484375, 1.5733642578125, 1.62158203125, 1.6697998046875, 1.718017578125, 1.7662353515625, 1.814453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 14.0, 52.0, 142.0, 354.0, 296.0, 112.0, 20.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.669219970703125, -29.66935920715332, -28.669498443603516, -27.669639587402344, -26.66977882385254, -25.669918060302734, -24.67005729675293, -23.670196533203125, -22.670337677001953, -21.67047691345215, -20.670616149902344, -19.670757293701172, -18.670896530151367, -17.671035766601562, -16.671175003051758, -15.671314239501953, -14.671453475952148, -13.671592712402344, -12.671732902526855, -11.67187213897705, -10.672012329101562, -9.672151565551758, -8.672290802001953, -7.672430515289307, -6.67257022857666, -5.672709941864014, -4.672849655151367, -3.6729888916015625, -2.673128604888916, -1.6732683181762695, -0.6734075546264648, 0.32645273208618164, 1.3263130187988281, 2.3261733055114746, 3.3260338306427, 4.325894355773926, 5.325754642486572, 6.325614929199219, 7.325475692749023, 8.325336456298828, 9.325196266174316, 10.325057029724121, 11.32491683959961, 12.324777603149414, 13.324638366699219, 14.324498176574707, 15.324358940124512, 16.32421875, 17.324079513549805, 18.32394027709961, 19.323801040649414, 20.32366180419922, 21.32352066040039, 22.323381423950195, 23.3232421875, 24.323102951049805, 25.32296371459961, 26.322824478149414, 27.32268524169922, 28.32254409790039, 29.322404861450195, 30.322265625, 31.322126388549805, 32.32198715209961, 33.32184600830078]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 15.0, 13.0, 29.0, 26.0, 31.0, 33.0, 54.0, 53.0, 54.0, 57.0, 60.0, 72.0, 65.0, 50.0, 52.0, 66.0, 39.0, 44.0, 48.0, 30.0, 27.0, 21.0, 7.0, 10.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.64519214630127, -8.379648208618164, -8.114103317260742, -7.848559379577637, -7.583015441894531, -7.317471027374268, -7.051926612854004, -6.786382675170898, -6.520838260650635, -6.255293846130371, -5.989749908447266, -5.724205493927002, -5.458661079406738, -5.193117141723633, -4.927572727203369, -4.6620283126831055, -4.396484375, -4.130939960479736, -3.865396022796631, -3.599851608276367, -3.3343074321746826, -3.068763256072998, -2.8032188415527344, -2.53767466545105, -2.2721304893493652, -2.0065863132476807, -1.7410420179367065, -1.4754977226257324, -1.2099535465240479, -0.9444093704223633, -0.6788650751113892, -0.41332077980041504, -0.14777755737304688, 0.11776667833328247, 0.3833109140396118, 0.6488551497459412, 0.9143993854522705, 1.179943561553955, 1.4454878568649292, 1.7110321521759033, 1.976576328277588, 2.2421205043792725, 2.507664680480957, 2.7732090950012207, 3.0387532711029053, 3.30429744720459, 3.5698418617248535, 3.835386037826538, 4.100930213928223, 4.366474628448486, 4.632018566131592, 4.8975629806518555, 5.163106918334961, 5.428651332855225, 5.694195747375488, 5.959739685058594, 6.225284099578857, 6.490828514099121, 6.756372451782227, 7.02191686630249, 7.287461280822754, 7.553005218505859, 7.818549633026123, 8.084094047546387, 8.349637985229492]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 10.0, 29.0, 48.0, 94.0, 194.0, 447.0, 1141.0, 3238.0, 11911.0, 72207.0, 570419.0, 338744.0, 38603.0, 7639.0, 2287.0, 818.0, 386.0, 161.0, 86.0, 28.0, 20.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.36126708984375, -1.3123779296875, -1.26348876953125, -1.214599609375, -1.16571044921875, -1.1168212890625, -1.06793212890625, -1.01904296875, -0.97015380859375, -0.9212646484375, -0.87237548828125, -0.823486328125, -0.77459716796875, -0.7257080078125, -0.67681884765625, -0.6279296875, -0.57904052734375, -0.5301513671875, -0.48126220703125, -0.432373046875, -0.38348388671875, -0.3345947265625, -0.28570556640625, -0.23681640625, -0.18792724609375, -0.1390380859375, -0.09014892578125, -0.041259765625, 0.00762939453125, 0.0565185546875, 0.10540771484375, 0.154296875, 0.20318603515625, 0.2520751953125, 0.30096435546875, 0.349853515625, 0.39874267578125, 0.4476318359375, 0.49652099609375, 0.54541015625, 0.59429931640625, 0.6431884765625, 0.69207763671875, 0.740966796875, 0.78985595703125, 0.8387451171875, 0.88763427734375, 0.9365234375, 0.98541259765625, 1.0343017578125, 1.08319091796875, 1.132080078125, 1.18096923828125, 1.2298583984375, 1.27874755859375, 1.32763671875, 1.37652587890625, 1.4254150390625, 1.47430419921875, 1.523193359375, 1.57208251953125, 1.6209716796875, 1.66986083984375, 1.71875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 9.0, 12.0, 19.0, 21.0, 25.0, 20.0, 26.0, 23.0, 28.0, 40.0, 37.0, 36.0, 43.0, 43.0, 48.0, 45.0, 41.0, 43.0, 44.0, 45.0, 52.0, 57.0, 33.0, 32.0, 29.0, 24.0, 24.0, 9.0, 17.0, 8.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.74072265625, -0.720123291015625, -0.69952392578125, -0.678924560546875, -0.6583251953125, -0.637725830078125, -0.61712646484375, -0.596527099609375, -0.575927734375, -0.555328369140625, -0.53472900390625, -0.514129638671875, -0.4935302734375, -0.472930908203125, -0.45233154296875, -0.431732177734375, -0.4111328125, -0.390533447265625, -0.36993408203125, -0.349334716796875, -0.3287353515625, -0.308135986328125, -0.28753662109375, -0.266937255859375, -0.246337890625, -0.225738525390625, -0.20513916015625, -0.184539794921875, -0.1639404296875, -0.143341064453125, -0.12274169921875, -0.102142333984375, -0.08154296875, -0.060943603515625, -0.04034423828125, -0.019744873046875, 0.0008544921875, 0.021453857421875, 0.04205322265625, 0.062652587890625, 0.083251953125, 0.103851318359375, 0.12445068359375, 0.145050048828125, 0.1656494140625, 0.186248779296875, 0.20684814453125, 0.227447509765625, 0.248046875, 0.268646240234375, 0.28924560546875, 0.309844970703125, 0.3304443359375, 0.351043701171875, 0.37164306640625, 0.392242431640625, 0.412841796875, 0.433441162109375, 0.45404052734375, 0.474639892578125, 0.4952392578125, 0.515838623046875, 0.53643798828125, 0.557037353515625, 0.57763671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 10.0, 17.0, 15.0, 22.0, 27.0, 39.0, 53.0, 82.0, 97.0, 152.0, 237.0, 390.0, 700.0, 1588.0, 4394.0, 17131.0, 101611.0, 720895.0, 166258.0, 24860.0, 5920.0, 1975.0, 827.0, 448.0, 269.0, 139.0, 100.0, 69.0, 69.0, 47.0, 25.0, 23.0, 10.0, 12.0, 6.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.338592529296875, -1.29339599609375, -1.248199462890625, -1.2030029296875, -1.157806396484375, -1.11260986328125, -1.067413330078125, -1.022216796875, -0.977020263671875, -0.93182373046875, -0.886627197265625, -0.8414306640625, -0.796234130859375, -0.75103759765625, -0.705841064453125, -0.66064453125, -0.615447998046875, -0.57025146484375, -0.525054931640625, -0.4798583984375, -0.434661865234375, -0.38946533203125, -0.344268798828125, -0.299072265625, -0.253875732421875, -0.20867919921875, -0.163482666015625, -0.1182861328125, -0.073089599609375, -0.02789306640625, 0.017303466796875, 0.0625, 0.107696533203125, 0.15289306640625, 0.198089599609375, 0.2432861328125, 0.288482666015625, 0.33367919921875, 0.378875732421875, 0.424072265625, 0.469268798828125, 0.51446533203125, 0.559661865234375, 0.6048583984375, 0.650054931640625, 0.69525146484375, 0.740447998046875, 0.78564453125, 0.830841064453125, 0.87603759765625, 0.921234130859375, 0.9664306640625, 1.011627197265625, 1.05682373046875, 1.102020263671875, 1.147216796875, 1.192413330078125, 1.23760986328125, 1.282806396484375, 1.3280029296875, 1.373199462890625, 1.41839599609375, 1.463592529296875, 1.5087890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 6.0, 5.0, 10.0, 12.0, 16.0, 11.0, 22.0, 22.0, 19.0, 26.0, 30.0, 28.0, 40.0, 51.0, 52.0, 45.0, 65.0, 66.0, 45.0, 54.0, 51.0, 48.0, 38.0, 46.0, 26.0, 24.0, 21.0, 17.0, 13.0, 15.0, 13.0, 10.0, 6.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.296875, -2.212890625, -2.12890625, -2.044921875, -1.9609375, -1.876953125, -1.79296875, -1.708984375, -1.625, -1.541015625, -1.45703125, -1.373046875, -1.2890625, -1.205078125, -1.12109375, -1.037109375, -0.953125, -0.869140625, -0.78515625, -0.701171875, -0.6171875, -0.533203125, -0.44921875, -0.365234375, -0.28125, -0.197265625, -0.11328125, -0.029296875, 0.0546875, 0.138671875, 0.22265625, 0.306640625, 0.390625, 0.474609375, 0.55859375, 0.642578125, 0.7265625, 0.810546875, 0.89453125, 0.978515625, 1.0625, 1.146484375, 1.23046875, 1.314453125, 1.3984375, 1.482421875, 1.56640625, 1.650390625, 1.734375, 1.818359375, 1.90234375, 1.986328125, 2.0703125, 2.154296875, 2.23828125, 2.322265625, 2.40625, 2.490234375, 2.57421875, 2.658203125, 2.7421875, 2.826171875, 2.91015625, 2.994140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 15.0, 9.0, 11.0, 25.0, 42.0, 56.0, 55.0, 122.0, 178.0, 303.0, 496.0, 1035.0, 2064.0, 4782.0, 12347.0, 37188.0, 149478.0, 668852.0, 120543.0, 31736.0, 10793.0, 4244.0, 1914.0, 896.0, 553.0, 287.0, 181.0, 121.0, 61.0, 59.0, 30.0, 24.0, 14.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.415771484375, -0.4016456604003906, -0.38751983642578125, -0.3733940124511719, -0.3592681884765625, -0.3451423645019531, -0.33101654052734375, -0.3168907165527344, -0.302764892578125, -0.2886390686035156, -0.27451324462890625, -0.2603874206542969, -0.2462615966796875, -0.23213577270507812, -0.21800994873046875, -0.20388412475585938, -0.18975830078125, -0.17563247680664062, -0.16150665283203125, -0.14738082885742188, -0.1332550048828125, -0.11912918090820312, -0.10500335693359375, -0.09087753295898438, -0.076751708984375, -0.06262588500976562, -0.04850006103515625, -0.034374237060546875, -0.0202484130859375, -0.006122589111328125, 0.00800323486328125, 0.022129058837890625, 0.0362548828125, 0.050380706787109375, 0.06450653076171875, 0.07863235473632812, 0.0927581787109375, 0.10688400268554688, 0.12100982666015625, 0.13513565063476562, 0.149261474609375, 0.16338729858398438, 0.17751312255859375, 0.19163894653320312, 0.2057647705078125, 0.21989059448242188, 0.23401641845703125, 0.24814224243164062, 0.26226806640625, 0.2763938903808594, 0.29051971435546875, 0.3046455383300781, 0.3187713623046875, 0.3328971862792969, 0.34702301025390625, 0.3611488342285156, 0.375274658203125, 0.3894004821777344, 0.40352630615234375, 0.4176521301269531, 0.4317779541015625, 0.4459037780761719, 0.46002960205078125, 0.4741554260253906, 0.48828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 3.0, 13.0, 14.0, 15.0, 32.0, 29.0, 44.0, 67.0, 102.0, 111.0, 139.0, 137.0, 83.0, 52.0, 29.0, 26.0, 24.0, 14.0, 11.0, 12.0, 5.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014495849609375, -0.000140337273478508, -0.000135716050863266, -0.000131094828248024, -0.00012647360563278198, -0.00012185238301753998, -0.00011723116040229797, -0.00011260993778705597, -0.00010798871517181396, -0.00010336749255657196, -9.874626994132996e-05, -9.412504732608795e-05, -8.950382471084595e-05, -8.488260209560394e-05, -8.026137948036194e-05, -7.564015686511993e-05, -7.101893424987793e-05, -6.639771163463593e-05, -6.177648901939392e-05, -5.7155266404151917e-05, -5.253404378890991e-05, -4.791282117366791e-05, -4.32915985584259e-05, -3.86703759431839e-05, -3.4049153327941895e-05, -2.942793071269989e-05, -2.4806708097457886e-05, -2.018548548221588e-05, -1.5564262866973877e-05, -1.0943040251731873e-05, -6.321817636489868e-06, -1.7005950212478638e-06, 2.9206275939941406e-06, 7.541850209236145e-06, 1.216307282447815e-05, 1.6784295439720154e-05, 2.1405518054962158e-05, 2.6026740670204163e-05, 3.064796328544617e-05, 3.526918590068817e-05, 3.9890408515930176e-05, 4.451163113117218e-05, 4.9132853746414185e-05, 5.375407636165619e-05, 5.837529897689819e-05, 6.29965215921402e-05, 6.76177442073822e-05, 7.22389668226242e-05, 7.686018943786621e-05, 8.148141205310822e-05, 8.610263466835022e-05, 9.072385728359222e-05, 9.534507989883423e-05, 9.996630251407623e-05, 0.00010458752512931824, 0.00010920874774456024, 0.00011382997035980225, 0.00011845119297504425, 0.00012307241559028625, 0.00012769363820552826, 0.00013231486082077026, 0.00013693608343601227, 0.00014155730605125427, 0.00014617852866649628, 0.00015079975128173828]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 12.0, 12.0, 8.0, 14.0, 19.0, 32.0, 33.0, 62.0, 103.0, 204.0, 387.0, 812.0, 1799.0, 4480.0, 14641.0, 68001.0, 710150.0, 202353.0, 31755.0, 8391.0, 2887.0, 1155.0, 527.0, 295.0, 155.0, 92.0, 58.0, 32.0, 36.0, 8.0, 13.0, 8.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6530914306640625, -0.631866455078125, -0.6106414794921875, -0.58941650390625, -0.5681915283203125, -0.546966552734375, -0.5257415771484375, -0.5045166015625, -0.4832916259765625, -0.462066650390625, -0.4408416748046875, -0.41961669921875, -0.3983917236328125, -0.377166748046875, -0.3559417724609375, -0.334716796875, -0.3134918212890625, -0.292266845703125, -0.2710418701171875, -0.24981689453125, -0.2285919189453125, -0.207366943359375, -0.1861419677734375, -0.1649169921875, -0.1436920166015625, -0.122467041015625, -0.1012420654296875, -0.08001708984375, -0.0587921142578125, -0.037567138671875, -0.0163421630859375, 0.0048828125, 0.0261077880859375, 0.047332763671875, 0.0685577392578125, 0.08978271484375, 0.1110076904296875, 0.132232666015625, 0.1534576416015625, 0.1746826171875, 0.1959075927734375, 0.217132568359375, 0.2383575439453125, 0.25958251953125, 0.2808074951171875, 0.302032470703125, 0.3232574462890625, 0.344482421875, 0.3657073974609375, 0.386932373046875, 0.4081573486328125, 0.42938232421875, 0.4506072998046875, 0.471832275390625, 0.4930572509765625, 0.5142822265625, 0.5355072021484375, 0.556732177734375, 0.5779571533203125, 0.59918212890625, 0.6204071044921875, 0.641632080078125, 0.6628570556640625, 0.68408203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 5.0, 12.0, 14.0, 15.0, 11.0, 13.0, 20.0, 24.0, 36.0, 31.0, 48.0, 69.0, 86.0, 135.0, 104.0, 88.0, 58.0, 57.0, 37.0, 26.0, 19.0, 20.0, 8.0, 8.0, 8.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5988998413085938, -0.5801239013671875, -0.5613479614257812, -0.542572021484375, -0.5237960815429688, -0.5050201416015625, -0.48624420166015625, -0.46746826171875, -0.44869232177734375, -0.4299163818359375, -0.41114044189453125, -0.392364501953125, -0.37358856201171875, -0.3548126220703125, -0.33603668212890625, -0.3172607421875, -0.29848480224609375, -0.2797088623046875, -0.26093292236328125, -0.242156982421875, -0.22338104248046875, -0.2046051025390625, -0.18582916259765625, -0.16705322265625, -0.14827728271484375, -0.1295013427734375, -0.11072540283203125, -0.091949462890625, -0.07317352294921875, -0.0543975830078125, -0.03562164306640625, -0.016845703125, 0.00193023681640625, 0.0207061767578125, 0.03948211669921875, 0.058258056640625, 0.07703399658203125, 0.0958099365234375, 0.11458587646484375, 0.13336181640625, 0.15213775634765625, 0.1709136962890625, 0.18968963623046875, 0.208465576171875, 0.22724151611328125, 0.2460174560546875, 0.26479339599609375, 0.2835693359375, 0.30234527587890625, 0.3211212158203125, 0.33989715576171875, 0.358673095703125, 0.37744903564453125, 0.3962249755859375, 0.41500091552734375, 0.43377685546875, 0.45255279541015625, 0.4713287353515625, 0.49010467529296875, 0.508880615234375, 0.5276565551757812, 0.5464324951171875, 0.5652084350585938, 0.583984375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 19.0, 38.0, 104.0, 240.0, 315.0, 142.0, 61.0, 31.0, 15.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.366168022155762, -14.780821800231934, -14.195475578308105, -13.610129356384277, -13.024782180786133, -12.439435958862305, -11.854089736938477, -11.268743515014648, -10.68339729309082, -10.098051071166992, -9.512704849243164, -8.927358627319336, -8.342012405395508, -7.7566657066345215, -7.171319007873535, -6.585972785949707, -6.000626564025879, -5.415280342102051, -4.829934120178223, -4.244587421417236, -3.659241199493408, -3.07389497756958, -2.488548517227173, -1.9032020568847656, -1.3178558349609375, -0.7325094938278198, -0.14716315269470215, 0.4381831884384155, 1.0235295295715332, 1.6088757514953613, 2.1942222118377686, 2.779568672180176, 3.3649158477783203, 3.9502620697021484, 4.535608291625977, 5.120954990386963, 5.706301212310791, 6.291647434234619, 6.8769941329956055, 7.462340354919434, 8.047686576843262, 8.63303279876709, 9.218379020690918, 9.803725242614746, 10.38907241821289, 10.974418640136719, 11.559764862060547, 12.145111083984375, 12.730457305908203, 13.315803527832031, 13.90114974975586, 14.486495971679688, 15.071842193603516, 15.657188415527344, 16.242534637451172, 16.827880859375, 17.413227081298828, 17.998573303222656, 18.583919525146484, 19.169265747070312, 19.75461196899414, 20.33995819091797, 20.925304412841797, 21.510650634765625, 22.095998764038086]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 5.0, 3.0, 14.0, 6.0, 11.0, 9.0, 10.0, 14.0, 12.0, 17.0, 22.0, 20.0, 17.0, 29.0, 39.0, 32.0, 38.0, 58.0, 77.0, 71.0, 69.0, 55.0, 50.0, 40.0, 33.0, 33.0, 40.0, 22.0, 24.0, 14.0, 14.0, 18.0, 13.0, 11.0, 11.0, 6.0, 11.0, 4.0, 9.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.99497127532959, -9.699907302856445, -9.404842376708984, -9.109777450561523, -8.814713478088379, -8.519649505615234, -8.224584579467773, -7.929520130157471, -7.634455680847168, -7.339391231536865, -7.0443267822265625, -6.74926233291626, -6.454197883605957, -6.159133434295654, -5.864068984985352, -5.569004535675049, -5.273940086364746, -4.978875637054443, -4.683811187744141, -4.388746738433838, -4.093682289123535, -3.7986178398132324, -3.5035533905029297, -3.208488941192627, -2.913424491882324, -2.6183600425720215, -2.3232955932617188, -2.028231143951416, -1.7331666946411133, -1.4381022453308105, -1.1430377960205078, -0.8479733467102051, -0.5529098510742188, -0.257845401763916, 0.03721904754638672, 0.33228349685668945, 0.6273479461669922, 0.9224123954772949, 1.2174768447875977, 1.5125412940979004, 1.8076057434082031, 2.102670192718506, 2.3977346420288086, 2.6927990913391113, 2.987863540649414, 3.282927989959717, 3.5779924392700195, 3.8730568885803223, 4.168121337890625, 4.463185787200928, 4.7582502365112305, 5.053314685821533, 5.348379135131836, 5.643443584442139, 5.938508033752441, 6.233572483062744, 6.528636932373047, 6.82370138168335, 7.118765830993652, 7.413830280303955, 7.708894729614258, 8.003959655761719, 8.299023628234863, 8.594087600708008, 8.889152526855469]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 13.0, 9.0, 8.0, 12.0, 13.0, 10.0, 24.0, 19.0, 32.0, 26.0, 51.0, 69.0, 100.0, 158.0, 321.0, 753.0, 2174.0, 8404.0, 57914.0, 1185987.0, 2792140.0, 126995.0, 13925.0, 3091.0, 969.0, 439.0, 220.0, 109.0, 78.0, 40.0, 38.0, 22.0, 20.0, 17.0, 21.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.465362548828125, -1.41510009765625, -1.364837646484375, -1.3145751953125, -1.264312744140625, -1.21405029296875, -1.163787841796875, -1.113525390625, -1.063262939453125, -1.01300048828125, -0.962738037109375, -0.9124755859375, -0.862213134765625, -0.81195068359375, -0.761688232421875, -0.71142578125, -0.661163330078125, -0.61090087890625, -0.560638427734375, -0.5103759765625, -0.460113525390625, -0.40985107421875, -0.359588623046875, -0.309326171875, -0.259063720703125, -0.20880126953125, -0.158538818359375, -0.1082763671875, -0.058013916015625, -0.00775146484375, 0.042510986328125, 0.0927734375, 0.143035888671875, 0.19329833984375, 0.243560791015625, 0.2938232421875, 0.344085693359375, 0.39434814453125, 0.444610595703125, 0.494873046875, 0.545135498046875, 0.59539794921875, 0.645660400390625, 0.6959228515625, 0.746185302734375, 0.79644775390625, 0.846710205078125, 0.89697265625, 0.947235107421875, 0.99749755859375, 1.047760009765625, 1.0980224609375, 1.148284912109375, 1.19854736328125, 1.248809814453125, 1.299072265625, 1.349334716796875, 1.39959716796875, 1.449859619140625, 1.5001220703125, 1.550384521484375, 1.60064697265625, 1.650909423828125, 1.701171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 9.0, 11.0, 18.0, 16.0, 17.0, 30.0, 25.0, 32.0, 31.0, 36.0, 32.0, 59.0, 53.0, 50.0, 46.0, 51.0, 45.0, 35.0, 53.0, 43.0, 32.0, 48.0, 32.0, 25.0, 24.0, 22.0, 12.0, 24.0, 5.0, 19.0, 8.0, 10.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.611328125, -0.5904693603515625, -0.569610595703125, -0.5487518310546875, -0.52789306640625, -0.5070343017578125, -0.486175537109375, -0.4653167724609375, -0.4444580078125, -0.4235992431640625, -0.402740478515625, -0.3818817138671875, -0.36102294921875, -0.3401641845703125, -0.319305419921875, -0.2984466552734375, -0.277587890625, -0.2567291259765625, -0.235870361328125, -0.2150115966796875, -0.19415283203125, -0.1732940673828125, -0.152435302734375, -0.1315765380859375, -0.1107177734375, -0.0898590087890625, -0.069000244140625, -0.0481414794921875, -0.02728271484375, -0.0064239501953125, 0.014434814453125, 0.0352935791015625, 0.05615234375, 0.0770111083984375, 0.097869873046875, 0.1187286376953125, 0.13958740234375, 0.1604461669921875, 0.181304931640625, 0.2021636962890625, 0.2230224609375, 0.2438812255859375, 0.264739990234375, 0.2855987548828125, 0.30645751953125, 0.3273162841796875, 0.348175048828125, 0.3690338134765625, 0.389892578125, 0.4107513427734375, 0.431610107421875, 0.4524688720703125, 0.47332763671875, 0.4941864013671875, 0.515045166015625, 0.5359039306640625, 0.5567626953125, 0.5776214599609375, 0.598480224609375, 0.6193389892578125, 0.64019775390625, 0.6610565185546875, 0.681915283203125, 0.7027740478515625, 0.7236328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 14.0, 18.0, 37.0, 144.0, 398.0, 1819.0, 89450.0, 4088537.0, 12378.0, 1035.0, 281.0, 100.0, 40.0, 10.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.19293212890625, -2.0147705078125, -1.83660888671875, -1.658447265625, -1.48028564453125, -1.3021240234375, -1.12396240234375, -0.94580078125, -0.76763916015625, -0.5894775390625, -0.41131591796875, -0.233154296875, -0.05499267578125, 0.1231689453125, 0.30133056640625, 0.4794921875, 0.65765380859375, 0.8358154296875, 1.01397705078125, 1.192138671875, 1.37030029296875, 1.5484619140625, 1.72662353515625, 1.90478515625, 2.08294677734375, 2.2611083984375, 2.43927001953125, 2.617431640625, 2.79559326171875, 2.9737548828125, 3.15191650390625, 3.330078125, 3.50823974609375, 3.6864013671875, 3.86456298828125, 4.042724609375, 4.22088623046875, 4.3990478515625, 4.57720947265625, 4.75537109375, 4.93353271484375, 5.1116943359375, 5.28985595703125, 5.468017578125, 5.64617919921875, 5.8243408203125, 6.00250244140625, 6.1806640625, 6.35882568359375, 6.5369873046875, 6.71514892578125, 6.893310546875, 7.07147216796875, 7.2496337890625, 7.42779541015625, 7.60595703125, 7.78411865234375, 7.9622802734375, 8.14044189453125, 8.318603515625, 8.49676513671875, 8.6749267578125, 8.85308837890625, 9.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 12.0, 25.0, 42.0, 61.0, 110.0, 235.0, 465.0, 888.0, 1053.0, 560.0, 293.0, 134.0, 73.0, 41.0, 34.0, 13.0, 6.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.54296875, -2.474456787109375, -2.40594482421875, -2.337432861328125, -2.2689208984375, -2.200408935546875, -2.13189697265625, -2.063385009765625, -1.994873046875, -1.926361083984375, -1.85784912109375, -1.789337158203125, -1.7208251953125, -1.652313232421875, -1.58380126953125, -1.515289306640625, -1.44677734375, -1.378265380859375, -1.30975341796875, -1.241241455078125, -1.1727294921875, -1.104217529296875, -1.03570556640625, -0.967193603515625, -0.898681640625, -0.830169677734375, -0.76165771484375, -0.693145751953125, -0.6246337890625, -0.556121826171875, -0.48760986328125, -0.419097900390625, -0.3505859375, -0.282073974609375, -0.21356201171875, -0.145050048828125, -0.0765380859375, -0.008026123046875, 0.06048583984375, 0.128997802734375, 0.197509765625, 0.266021728515625, 0.33453369140625, 0.403045654296875, 0.4715576171875, 0.540069580078125, 0.60858154296875, 0.677093505859375, 0.74560546875, 0.814117431640625, 0.88262939453125, 0.951141357421875, 1.0196533203125, 1.088165283203125, 1.15667724609375, 1.225189208984375, 1.293701171875, 1.362213134765625, 1.43072509765625, 1.499237060546875, 1.5677490234375, 1.636260986328125, 1.70477294921875, 1.773284912109375, 1.841796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 19.0, 55.0, 148.0, 262.0, 275.0, 116.0, 62.0, 22.0, 13.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.362067222595215, -12.566646575927734, -11.771224975585938, -10.975804328918457, -10.18038272857666, -9.38496208190918, -8.589540481567383, -7.794119834899902, -6.998698711395264, -6.203277587890625, -5.407856464385986, -4.612435340881348, -3.817014455795288, -3.0215933322906494, -2.22617244720459, -1.4307513236999512, -0.6353302001953125, 0.1600908637046814, 0.9555119276046753, 1.7509329319000244, 2.546354055404663, 3.3417751789093018, 4.137196063995361, 4.9326171875, 5.728038311004639, 6.523459434509277, 7.318880558013916, 8.114301681518555, 8.909722328186035, 9.705143928527832, 10.500564575195312, 11.29598617553711, 12.091405868530273, 12.886826515197754, 13.68224811553955, 14.477668762207031, 15.273090362548828, 16.068511962890625, 16.86393165588379, 17.659353256225586, 18.454774856567383, 19.25019645690918, 20.045616149902344, 20.84103775024414, 21.636459350585938, 22.431880950927734, 23.2273006439209, 24.022722244262695, 24.81814193725586, 25.613563537597656, 26.40898323059082, 27.204404830932617, 27.999826431274414, 28.79524803161621, 29.590667724609375, 30.386089324951172, 31.18151092529297, 31.976932525634766, 32.77235412597656, 33.56777572631836, 34.36319351196289, 35.15861511230469, 35.954036712646484, 36.74945831298828, 37.54487991333008]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 12.0, 10.0, 11.0, 7.0, 7.0, 21.0, 12.0, 17.0, 13.0, 25.0, 24.0, 37.0, 30.0, 39.0, 36.0, 39.0, 47.0, 34.0, 44.0, 47.0, 37.0, 36.0, 34.0, 34.0, 39.0, 34.0, 29.0, 27.0, 23.0, 30.0, 27.0, 11.0, 17.0, 16.0, 17.0, 14.0, 17.0, 4.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.2947845458984375, -6.113229274749756, -5.931674003601074, -5.750118732452393, -5.568563461303711, -5.387008190155029, -5.205452919006348, -5.023897171020508, -4.842342376708984, -4.660787105560303, -4.479231834411621, -4.2976765632629395, -4.116121292114258, -3.934566020965576, -3.7530105113983154, -3.571455240249634, -3.389899730682373, -3.2083444595336914, -3.0267891883850098, -2.845233917236328, -2.6636786460876465, -2.482123374938965, -2.300567865371704, -2.1190125942230225, -1.9374573230743408, -1.7559020519256592, -1.5743467807769775, -1.3927913904190063, -1.2112361192703247, -1.029680848121643, -0.8481254577636719, -0.6665701866149902, -0.4850144386291504, -0.30345913767814636, -0.12190383672714233, 0.05965149402618408, 0.24120676517486572, 0.42276203632354736, 0.6043174266815186, 0.7858726978302002, 0.9674279689788818, 1.1489832401275635, 1.3305385112762451, 1.5120939016342163, 1.693649172782898, 1.8752044439315796, 2.056759834289551, 2.2383151054382324, 2.419870376586914, 2.6014256477355957, 2.7829809188842773, 2.964536190032959, 3.1460914611816406, 3.3276467323303223, 3.509202241897583, 3.6907575130462646, 3.8723127841949463, 4.053868293762207, 4.235423564910889, 4.41697883605957, 4.598534107208252, 4.780089378356934, 4.961644649505615, 5.143199920654297, 5.3247551918029785]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 12.0, 13.0, 30.0, 65.0, 140.0, 328.0, 799.0, 2345.0, 7815.0, 35588.0, 261034.0, 617834.0, 98973.0, 16987.0, 4287.0, 1339.0, 536.0, 206.0, 112.0, 50.0, 26.0, 9.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3029327392578125, -1.251373291015625, -1.1998138427734375, -1.14825439453125, -1.0966949462890625, -1.045135498046875, -0.9935760498046875, -0.9420166015625, -0.8904571533203125, -0.838897705078125, -0.7873382568359375, -0.73577880859375, -0.6842193603515625, -0.632659912109375, -0.5811004638671875, -0.529541015625, -0.4779815673828125, -0.426422119140625, -0.3748626708984375, -0.32330322265625, -0.2717437744140625, -0.220184326171875, -0.1686248779296875, -0.1170654296875, -0.0655059814453125, -0.013946533203125, 0.0376129150390625, 0.08917236328125, 0.1407318115234375, 0.192291259765625, 0.2438507080078125, 0.29541015625, 0.3469696044921875, 0.398529052734375, 0.4500885009765625, 0.50164794921875, 0.5532073974609375, 0.604766845703125, 0.6563262939453125, 0.7078857421875, 0.7594451904296875, 0.811004638671875, 0.8625640869140625, 0.91412353515625, 0.9656829833984375, 1.017242431640625, 1.0688018798828125, 1.120361328125, 1.1719207763671875, 1.223480224609375, 1.2750396728515625, 1.32659912109375, 1.3781585693359375, 1.429718017578125, 1.4812774658203125, 1.5328369140625, 1.5843963623046875, 1.635955810546875, 1.6875152587890625, 1.73907470703125, 1.7906341552734375, 1.842193603515625, 1.8937530517578125, 1.9453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 7.0, 6.0, 6.0, 8.0, 7.0, 12.0, 16.0, 26.0, 13.0, 20.0, 20.0, 25.0, 44.0, 35.0, 30.0, 39.0, 52.0, 39.0, 51.0, 51.0, 44.0, 47.0, 44.0, 46.0, 44.0, 34.0, 34.0, 37.0, 32.0, 24.0, 25.0, 20.0, 14.0, 15.0, 11.0, 2.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6591796875, -0.6370849609375, -0.614990234375, -0.5928955078125, -0.57080078125, -0.5487060546875, -0.526611328125, -0.5045166015625, -0.482421875, -0.4603271484375, -0.438232421875, -0.4161376953125, -0.39404296875, -0.3719482421875, -0.349853515625, -0.3277587890625, -0.3056640625, -0.2835693359375, -0.261474609375, -0.2393798828125, -0.21728515625, -0.1951904296875, -0.173095703125, -0.1510009765625, -0.12890625, -0.1068115234375, -0.084716796875, -0.0626220703125, -0.04052734375, -0.0184326171875, 0.003662109375, 0.0257568359375, 0.0478515625, 0.0699462890625, 0.092041015625, 0.1141357421875, 0.13623046875, 0.1583251953125, 0.180419921875, 0.2025146484375, 0.224609375, 0.2467041015625, 0.268798828125, 0.2908935546875, 0.31298828125, 0.3350830078125, 0.357177734375, 0.3792724609375, 0.4013671875, 0.4234619140625, 0.445556640625, 0.4676513671875, 0.48974609375, 0.5118408203125, 0.533935546875, 0.5560302734375, 0.578125, 0.6002197265625, 0.622314453125, 0.6444091796875, 0.66650390625, 0.6885986328125, 0.710693359375, 0.7327880859375, 0.7548828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 12.0, 17.0, 32.0, 39.0, 56.0, 100.0, 117.0, 182.0, 319.0, 626.0, 1208.0, 3216.0, 13152.0, 99542.0, 821703.0, 89906.0, 12315.0, 3258.0, 1225.0, 591.0, 331.0, 215.0, 106.0, 88.0, 58.0, 39.0, 31.0, 15.0, 17.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.0899200439453125, -2.027496337890625, -1.9650726318359375, -1.90264892578125, -1.8402252197265625, -1.777801513671875, -1.7153778076171875, -1.6529541015625, -1.5905303955078125, -1.528106689453125, -1.4656829833984375, -1.40325927734375, -1.3408355712890625, -1.278411865234375, -1.2159881591796875, -1.153564453125, -1.0911407470703125, -1.028717041015625, -0.9662933349609375, -0.90386962890625, -0.8414459228515625, -0.779022216796875, -0.7165985107421875, -0.6541748046875, -0.5917510986328125, -0.529327392578125, -0.4669036865234375, -0.40447998046875, -0.3420562744140625, -0.279632568359375, -0.2172088623046875, -0.15478515625, -0.0923614501953125, -0.029937744140625, 0.0324859619140625, 0.09490966796875, 0.1573333740234375, 0.219757080078125, 0.2821807861328125, 0.3446044921875, 0.4070281982421875, 0.469451904296875, 0.5318756103515625, 0.59429931640625, 0.6567230224609375, 0.719146728515625, 0.7815704345703125, 0.843994140625, 0.9064178466796875, 0.968841552734375, 1.0312652587890625, 1.09368896484375, 1.1561126708984375, 1.218536376953125, 1.2809600830078125, 1.3433837890625, 1.4058074951171875, 1.468231201171875, 1.5306549072265625, 1.59307861328125, 1.6555023193359375, 1.717926025390625, 1.7803497314453125, 1.8427734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 2.0, 7.0, 7.0, 8.0, 12.0, 15.0, 20.0, 22.0, 30.0, 22.0, 24.0, 34.0, 48.0, 49.0, 47.0, 55.0, 43.0, 78.0, 58.0, 51.0, 47.0, 44.0, 42.0, 31.0, 22.0, 31.0, 27.0, 18.0, 21.0, 9.0, 16.0, 5.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.67578125, -2.590850830078125, -2.50592041015625, -2.420989990234375, -2.3360595703125, -2.251129150390625, -2.16619873046875, -2.081268310546875, -1.996337890625, -1.911407470703125, -1.82647705078125, -1.741546630859375, -1.6566162109375, -1.571685791015625, -1.48675537109375, -1.401824951171875, -1.31689453125, -1.231964111328125, -1.14703369140625, -1.062103271484375, -0.9771728515625, -0.892242431640625, -0.80731201171875, -0.722381591796875, -0.637451171875, -0.552520751953125, -0.46759033203125, -0.382659912109375, -0.2977294921875, -0.212799072265625, -0.12786865234375, -0.042938232421875, 0.0419921875, 0.126922607421875, 0.21185302734375, 0.296783447265625, 0.3817138671875, 0.466644287109375, 0.55157470703125, 0.636505126953125, 0.721435546875, 0.806365966796875, 0.89129638671875, 0.976226806640625, 1.0611572265625, 1.146087646484375, 1.23101806640625, 1.315948486328125, 1.40087890625, 1.485809326171875, 1.57073974609375, 1.655670166015625, 1.7406005859375, 1.825531005859375, 1.91046142578125, 1.995391845703125, 2.080322265625, 2.165252685546875, 2.25018310546875, 2.335113525390625, 2.4200439453125, 2.504974365234375, 2.58990478515625, 2.674835205078125, 2.759765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 5.0, 21.0, 24.0, 36.0, 62.0, 106.0, 161.0, 358.0, 727.0, 2091.0, 7767.0, 43009.0, 728428.0, 231814.0, 25640.0, 5351.0, 1621.0, 625.0, 286.0, 145.0, 92.0, 57.0, 32.0, 28.0, 16.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5597305297851562, -0.5388946533203125, -0.5180587768554688, -0.497222900390625, -0.47638702392578125, -0.4555511474609375, -0.43471527099609375, -0.41387939453125, -0.39304351806640625, -0.3722076416015625, -0.35137176513671875, -0.330535888671875, -0.30970001220703125, -0.2888641357421875, -0.26802825927734375, -0.2471923828125, -0.22635650634765625, -0.2055206298828125, -0.18468475341796875, -0.163848876953125, -0.14301300048828125, -0.1221771240234375, -0.10134124755859375, -0.08050537109375, -0.05966949462890625, -0.0388336181640625, -0.01799774169921875, 0.002838134765625, 0.02367401123046875, 0.0445098876953125, 0.06534576416015625, 0.086181640625, 0.10701751708984375, 0.1278533935546875, 0.14868927001953125, 0.169525146484375, 0.19036102294921875, 0.2111968994140625, 0.23203277587890625, 0.25286865234375, 0.27370452880859375, 0.2945404052734375, 0.31537628173828125, 0.336212158203125, 0.35704803466796875, 0.3778839111328125, 0.39871978759765625, 0.4195556640625, 0.44039154052734375, 0.4612274169921875, 0.48206329345703125, 0.502899169921875, 0.5237350463867188, 0.5445709228515625, 0.5654067993164062, 0.58624267578125, 0.6070785522460938, 0.6279144287109375, 0.6487503051757812, 0.669586181640625, 0.6904220581054688, 0.7112579345703125, 0.7320938110351562, 0.7529296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 5.0, 4.0, 3.0, 11.0, 5.0, 13.0, 25.0, 42.0, 63.0, 137.0, 208.0, 196.0, 104.0, 70.0, 42.0, 19.0, 17.0, 15.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025391578674316406, -0.00024643726646900177, -0.00023895874619483948, -0.00023148022592067719, -0.0002240017056465149, -0.0002165231853723526, -0.0002090446650981903, -0.00020156614482402802, -0.00019408762454986572, -0.00018660910427570343, -0.00017913058400154114, -0.00017165206372737885, -0.00016417354345321655, -0.00015669502317905426, -0.00014921650290489197, -0.00014173798263072968, -0.00013425946235656738, -0.0001267809420824051, -0.0001193024218082428, -0.0001118239015340805, -0.00010434538125991821, -9.686686098575592e-05, -8.938834071159363e-05, -8.190982043743134e-05, -7.443130016326904e-05, -6.695277988910675e-05, -5.947425961494446e-05, -5.1995739340782166e-05, -4.451721906661987e-05, -3.703869879245758e-05, -2.9560178518295288e-05, -2.2081658244132996e-05, -1.4603137969970703e-05, -7.124617695808411e-06, 3.5390257835388184e-07, 7.832422852516174e-06, 1.5310943126678467e-05, 2.278946340084076e-05, 3.0267983675003052e-05, 3.7746503949165344e-05, 4.522502422332764e-05, 5.270354449748993e-05, 6.018206477165222e-05, 6.766058504581451e-05, 7.51391053199768e-05, 8.26176255941391e-05, 9.009614586830139e-05, 9.757466614246368e-05, 0.00010505318641662598, 0.00011253170669078827, 0.00012001022696495056, 0.00012748874723911285, 0.00013496726751327515, 0.00014244578778743744, 0.00014992430806159973, 0.00015740282833576202, 0.00016488134860992432, 0.0001723598688840866, 0.0001798383891582489, 0.0001873169094324112, 0.00019479542970657349, 0.00020227394998073578, 0.00020975247025489807, 0.00021723099052906036, 0.00022470951080322266]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 12.0, 18.0, 25.0, 33.0, 46.0, 74.0, 136.0, 287.0, 410.0, 868.0, 1908.0, 4938.0, 15973.0, 67315.0, 641290.0, 250613.0, 45740.0, 11687.0, 3825.0, 1611.0, 751.0, 396.0, 218.0, 134.0, 71.0, 55.0, 34.0, 25.0, 9.0, 11.0, 9.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.53369140625, -0.5179367065429688, -0.5021820068359375, -0.48642730712890625, -0.470672607421875, -0.45491790771484375, -0.4391632080078125, -0.42340850830078125, -0.40765380859375, -0.39189910888671875, -0.3761444091796875, -0.36038970947265625, -0.344635009765625, -0.32888031005859375, -0.3131256103515625, -0.29737091064453125, -0.2816162109375, -0.26586151123046875, -0.2501068115234375, -0.23435211181640625, -0.218597412109375, -0.20284271240234375, -0.1870880126953125, -0.17133331298828125, -0.15557861328125, -0.13982391357421875, -0.1240692138671875, -0.10831451416015625, -0.092559814453125, -0.07680511474609375, -0.0610504150390625, -0.04529571533203125, -0.029541015625, -0.01378631591796875, 0.0019683837890625, 0.01772308349609375, 0.033477783203125, 0.04923248291015625, 0.0649871826171875, 0.08074188232421875, 0.09649658203125, 0.11225128173828125, 0.1280059814453125, 0.14376068115234375, 0.159515380859375, 0.17527008056640625, 0.1910247802734375, 0.20677947998046875, 0.2225341796875, 0.23828887939453125, 0.2540435791015625, 0.26979827880859375, 0.285552978515625, 0.30130767822265625, 0.3170623779296875, 0.33281707763671875, 0.34857177734375, 0.36432647705078125, 0.3800811767578125, 0.39583587646484375, 0.411590576171875, 0.42734527587890625, 0.4430999755859375, 0.45885467529296875, 0.474609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 6.0, 8.0, 13.0, 11.0, 20.0, 22.0, 41.0, 53.0, 62.0, 98.0, 135.0, 116.0, 101.0, 69.0, 66.0, 44.0, 32.0, 22.0, 18.0, 17.0, 14.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5780181884765625, -0.558868408203125, -0.5397186279296875, -0.52056884765625, -0.5014190673828125, -0.482269287109375, -0.4631195068359375, -0.4439697265625, -0.4248199462890625, -0.405670166015625, -0.3865203857421875, -0.36737060546875, -0.3482208251953125, -0.329071044921875, -0.3099212646484375, -0.290771484375, -0.2716217041015625, -0.252471923828125, -0.2333221435546875, -0.21417236328125, -0.1950225830078125, -0.175872802734375, -0.1567230224609375, -0.1375732421875, -0.1184234619140625, -0.099273681640625, -0.0801239013671875, -0.06097412109375, -0.0418243408203125, -0.022674560546875, -0.0035247802734375, 0.015625, 0.0347747802734375, 0.053924560546875, 0.0730743408203125, 0.09222412109375, 0.1113739013671875, 0.130523681640625, 0.1496734619140625, 0.1688232421875, 0.1879730224609375, 0.207122802734375, 0.2262725830078125, 0.24542236328125, 0.2645721435546875, 0.283721923828125, 0.3028717041015625, 0.322021484375, 0.3411712646484375, 0.360321044921875, 0.3794708251953125, 0.39862060546875, 0.4177703857421875, 0.436920166015625, 0.4560699462890625, 0.4752197265625, 0.4943695068359375, 0.513519287109375, 0.5326690673828125, 0.55181884765625, 0.5709686279296875, 0.590118408203125, 0.6092681884765625, 0.62841796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 19.0, 45.0, 83.0, 153.0, 312.0, 162.0, 80.0, 47.0, 34.0, 16.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.572731018066406, -18.11406135559082, -17.6553897857666, -17.196720123291016, -16.738048553466797, -16.27937889099121, -15.820708274841309, -15.362037658691406, -14.90336799621582, -14.444697380065918, -13.986026763916016, -13.52735710144043, -13.068686485290527, -12.610015869140625, -12.151345252990723, -11.69267463684082, -11.234004020690918, -10.775333404541016, -10.316662788391113, -9.857992172241211, -9.399322509765625, -8.940651893615723, -8.48198127746582, -8.023310661315918, -7.564640522003174, -7.1059699058532715, -6.647299766540527, -6.188629150390625, -5.729958534240723, -5.2712883949279785, -4.812617778778076, -4.353947639465332, -3.895277976989746, -3.436607599258423, -2.9779372215270996, -2.5192666053771973, -2.060596227645874, -1.6019258499145508, -1.1432552337646484, -0.6845848560333252, -0.22591447830200195, 0.23275595903396606, 0.6914263963699341, 1.1500968933105469, 1.6087672710418701, 2.0674376487731934, 2.5261082649230957, 2.984778642654419, 3.443449020385742, 3.9021193981170654, 4.360789775848389, 4.819460391998291, 5.278130531311035, 5.7368011474609375, 6.19547176361084, 6.654142379760742, 7.112812519073486, 7.571483135223389, 8.030153274536133, 8.488823890686035, 8.947494506835938, 9.406164169311523, 9.864835739135742, 10.323505401611328, 10.78217601776123]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 6.0, 6.0, 16.0, 10.0, 12.0, 15.0, 19.0, 18.0, 25.0, 33.0, 21.0, 24.0, 27.0, 28.0, 53.0, 66.0, 119.0, 96.0, 74.0, 55.0, 40.0, 40.0, 34.0, 23.0, 21.0, 28.0, 14.0, 14.0, 8.0, 10.0, 10.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.744438171386719, -9.383305549621582, -9.022173881530762, -8.661041259765625, -8.299908638000488, -7.93877649307251, -7.577644348144531, -7.2165117263793945, -6.855379581451416, -6.4942474365234375, -6.133114814758301, -5.771982669830322, -5.410850524902344, -5.049717903137207, -4.6885857582092285, -4.32745361328125, -3.9663209915161133, -3.6051886081695557, -3.244056224822998, -2.8829240798950195, -2.521791696548462, -2.1606593132019043, -1.7995271682739258, -1.4383947849273682, -1.0772624015808105, -0.7161300778388977, -0.35499775409698486, 0.006134510040283203, 0.3672668933868408, 0.7283992767333984, 1.089531421661377, 1.4506638050079346, 1.8117952346801758, 2.1729276180267334, 2.534060001373291, 2.8951921463012695, 3.256324529647827, 3.6174569129943848, 3.9785890579223633, 4.3397216796875, 4.7008538246154785, 5.061985969543457, 5.423118591308594, 5.784250736236572, 6.145382881164551, 6.5065155029296875, 6.867647647857666, 7.2287797927856445, 7.589912414550781, 7.95104455947876, 8.312176704406738, 8.673309326171875, 9.034441947937012, 9.395574569702148, 9.756706237792969, 10.117838859558105, 10.478971481323242, 10.840104103088379, 11.2012357711792, 11.562368392944336, 11.923501014709473, 12.28463363647461, 12.64576530456543, 13.006897926330566, 13.368029594421387]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 13.0, 15.0, 20.0, 27.0, 57.0, 124.0, 327.0, 898.0, 3505.0, 19997.0, 255886.0, 3369917.0, 507776.0, 29153.0, 4679.0, 1125.0, 382.0, 179.0, 90.0, 38.0, 25.0, 17.0, 10.0, 10.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.60345458984375, -2.5155029296875, -2.42755126953125, -2.339599609375, -2.25164794921875, -2.1636962890625, -2.07574462890625, -1.98779296875, -1.89984130859375, -1.8118896484375, -1.72393798828125, -1.635986328125, -1.54803466796875, -1.4600830078125, -1.37213134765625, -1.2841796875, -1.19622802734375, -1.1082763671875, -1.02032470703125, -0.932373046875, -0.84442138671875, -0.7564697265625, -0.66851806640625, -0.58056640625, -0.49261474609375, -0.4046630859375, -0.31671142578125, -0.228759765625, -0.14080810546875, -0.0528564453125, 0.03509521484375, 0.123046875, 0.21099853515625, 0.2989501953125, 0.38690185546875, 0.474853515625, 0.56280517578125, 0.6507568359375, 0.73870849609375, 0.82666015625, 0.91461181640625, 1.0025634765625, 1.09051513671875, 1.178466796875, 1.26641845703125, 1.3543701171875, 1.44232177734375, 1.5302734375, 1.61822509765625, 1.7061767578125, 1.79412841796875, 1.882080078125, 1.97003173828125, 2.0579833984375, 2.14593505859375, 2.23388671875, 2.32183837890625, 2.4097900390625, 2.49774169921875, 2.585693359375, 2.67364501953125, 2.7615966796875, 2.84954833984375, 2.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 9.0, 3.0, 8.0, 8.0, 11.0, 18.0, 18.0, 23.0, 31.0, 34.0, 50.0, 50.0, 57.0, 53.0, 61.0, 48.0, 61.0, 49.0, 57.0, 47.0, 37.0, 48.0, 50.0, 35.0, 29.0, 31.0, 14.0, 21.0, 7.0, 5.0, 11.0, 3.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8052520751953125, -0.780426025390625, -0.7555999755859375, -0.73077392578125, -0.7059478759765625, -0.681121826171875, -0.6562957763671875, -0.6314697265625, -0.6066436767578125, -0.581817626953125, -0.5569915771484375, -0.53216552734375, -0.5073394775390625, -0.482513427734375, -0.4576873779296875, -0.432861328125, -0.4080352783203125, -0.383209228515625, -0.3583831787109375, -0.33355712890625, -0.3087310791015625, -0.283905029296875, -0.2590789794921875, -0.2342529296875, -0.2094268798828125, -0.184600830078125, -0.1597747802734375, -0.13494873046875, -0.1101226806640625, -0.085296630859375, -0.0604705810546875, -0.03564453125, -0.0108184814453125, 0.014007568359375, 0.0388336181640625, 0.06365966796875, 0.0884857177734375, 0.113311767578125, 0.1381378173828125, 0.1629638671875, 0.1877899169921875, 0.212615966796875, 0.2374420166015625, 0.26226806640625, 0.2870941162109375, 0.311920166015625, 0.3367462158203125, 0.361572265625, 0.3863983154296875, 0.411224365234375, 0.4360504150390625, 0.46087646484375, 0.4857025146484375, 0.510528564453125, 0.5353546142578125, 0.5601806640625, 0.5850067138671875, 0.609832763671875, 0.6346588134765625, 0.65948486328125, 0.6843109130859375, 0.709136962890625, 0.7339630126953125, 0.7587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 6.0, 16.0, 33.0, 58.0, 83.0, 196.0, 520.0, 2114.0, 39798.0, 4138017.0, 11215.0, 1400.0, 452.0, 171.0, 92.0, 38.0, 19.0, 11.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.59375, -11.22412109375, -10.8544921875, -10.48486328125, -10.115234375, -9.74560546875, -9.3759765625, -9.00634765625, -8.63671875, -8.26708984375, -7.8974609375, -7.52783203125, -7.158203125, -6.78857421875, -6.4189453125, -6.04931640625, -5.6796875, -5.31005859375, -4.9404296875, -4.57080078125, -4.201171875, -3.83154296875, -3.4619140625, -3.09228515625, -2.72265625, -2.35302734375, -1.9833984375, -1.61376953125, -1.244140625, -0.87451171875, -0.5048828125, -0.13525390625, 0.234375, 0.60400390625, 0.9736328125, 1.34326171875, 1.712890625, 2.08251953125, 2.4521484375, 2.82177734375, 3.19140625, 3.56103515625, 3.9306640625, 4.30029296875, 4.669921875, 5.03955078125, 5.4091796875, 5.77880859375, 6.1484375, 6.51806640625, 6.8876953125, 7.25732421875, 7.626953125, 7.99658203125, 8.3662109375, 8.73583984375, 9.10546875, 9.47509765625, 9.8447265625, 10.21435546875, 10.583984375, 10.95361328125, 11.3232421875, 11.69287109375, 12.0625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 16.0, 22.0, 38.0, 51.0, 98.0, 125.0, 232.0, 389.0, 664.0, 993.0, 648.0, 343.0, 157.0, 112.0, 64.0, 48.0, 29.0, 17.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.74114990234375, -2.6190185546875, -2.49688720703125, -2.374755859375, -2.25262451171875, -2.1304931640625, -2.00836181640625, -1.88623046875, -1.76409912109375, -1.6419677734375, -1.51983642578125, -1.397705078125, -1.27557373046875, -1.1534423828125, -1.03131103515625, -0.9091796875, -0.78704833984375, -0.6649169921875, -0.54278564453125, -0.420654296875, -0.29852294921875, -0.1763916015625, -0.05426025390625, 0.06787109375, 0.19000244140625, 0.3121337890625, 0.43426513671875, 0.556396484375, 0.67852783203125, 0.8006591796875, 0.92279052734375, 1.044921875, 1.16705322265625, 1.2891845703125, 1.41131591796875, 1.533447265625, 1.65557861328125, 1.7777099609375, 1.89984130859375, 2.02197265625, 2.14410400390625, 2.2662353515625, 2.38836669921875, 2.510498046875, 2.63262939453125, 2.7547607421875, 2.87689208984375, 2.9990234375, 3.12115478515625, 3.2432861328125, 3.36541748046875, 3.487548828125, 3.60968017578125, 3.7318115234375, 3.85394287109375, 3.97607421875, 4.09820556640625, 4.2203369140625, 4.34246826171875, 4.464599609375, 4.58673095703125, 4.7088623046875, 4.83099365234375, 4.953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 13.0, 47.0, 267.0, 518.0, 111.0, 33.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-182.2290802001953, -178.86874389648438, -175.5084228515625, -172.14808654785156, -168.78775024414062, -165.4274139404297, -162.06707763671875, -158.70675659179688, -155.34642028808594, -151.986083984375, -148.62576293945312, -145.2654266357422, -141.90509033203125, -138.5447540283203, -135.18441772460938, -131.8240966796875, -128.46376037597656, -125.10342407226562, -121.74309539794922, -118.38276672363281, -115.02243041992188, -111.66209411621094, -108.30176544189453, -104.94143676757812, -101.58110046386719, -98.22076416015625, -94.86043548583984, -91.50010681152344, -88.1397705078125, -84.77943420410156, -81.41910552978516, -78.05877685546875, -74.69844055175781, -71.33810424804688, -67.97777557373047, -64.61744689941406, -61.257110595703125, -57.89677810668945, -54.53644561767578, -51.17611312866211, -47.81578063964844, -44.455448150634766, -41.095115661621094, -37.73478317260742, -34.37445068359375, -31.014118194580078, -27.653785705566406, -24.293453216552734, -20.933120727539062, -17.57278823852539, -14.212455749511719, -10.852123260498047, -7.491790771484375, -4.131458282470703, -0.7711257934570312, 2.5892066955566406, 5.9495391845703125, 9.309871673583984, 12.670204162597656, 16.030536651611328, 19.390869140625, 22.751201629638672, 26.111534118652344, 29.471866607666016, 32.83219909667969]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 9.0, 11.0, 20.0, 21.0, 21.0, 27.0, 47.0, 49.0, 67.0, 79.0, 60.0, 87.0, 82.0, 65.0, 50.0, 61.0, 38.0, 42.0, 28.0, 28.0, 16.0, 13.0, 13.0, 13.0, 9.0, 8.0, 2.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.76395034790039, -25.14447021484375, -24.524991989135742, -23.9055118560791, -23.286033630371094, -22.666553497314453, -22.047075271606445, -21.427595138549805, -20.808116912841797, -20.188636779785156, -19.56915855407715, -18.949678421020508, -18.3302001953125, -17.71072006225586, -17.09124183654785, -16.47176170349121, -15.85228157043457, -15.232802391052246, -14.613323211669922, -13.993844032287598, -13.374364852905273, -12.754884719848633, -12.135405540466309, -11.515926361083984, -10.89644718170166, -10.276968002319336, -9.657488822937012, -9.038009643554688, -8.418529510498047, -7.799050807952881, -7.179571151733398, -6.560091972351074, -5.940613746643066, -5.321134567260742, -4.701655387878418, -4.0821757316589355, -3.4626965522766113, -2.843217372894287, -2.223737955093384, -1.6042585372924805, -0.9847793579101562, -0.3653000593185425, 0.2541792392730713, 0.8736585378646851, 1.4931378364562988, 2.112617015838623, 2.7320964336395264, 3.3515758514404297, 3.971055030822754, 4.590534210205078, 5.210013389587402, 5.829493045806885, 6.448972225189209, 7.068451404571533, 7.687931060791016, 8.30741024017334, 8.926889419555664, 9.546368598937988, 10.165847778320312, 10.785326957702637, 11.404806137084961, 12.024286270141602, 12.643765449523926, 13.26324462890625, 13.882723808288574]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 13.0, 19.0, 35.0, 38.0, 56.0, 92.0, 166.0, 256.0, 542.0, 1090.0, 2832.0, 8337.0, 32587.0, 198274.0, 681878.0, 94253.0, 18877.0, 5417.0, 2005.0, 828.0, 411.0, 200.0, 122.0, 67.0, 33.0, 31.0, 19.0, 21.0, 10.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.678985595703125, -1.61968994140625, -1.560394287109375, -1.5010986328125, -1.441802978515625, -1.38250732421875, -1.323211669921875, -1.263916015625, -1.204620361328125, -1.14532470703125, -1.086029052734375, -1.0267333984375, -0.967437744140625, -0.90814208984375, -0.848846435546875, -0.78955078125, -0.730255126953125, -0.67095947265625, -0.611663818359375, -0.5523681640625, -0.493072509765625, -0.43377685546875, -0.374481201171875, -0.315185546875, -0.255889892578125, -0.19659423828125, -0.137298583984375, -0.0780029296875, -0.018707275390625, 0.04058837890625, 0.099884033203125, 0.1591796875, 0.218475341796875, 0.27777099609375, 0.337066650390625, 0.3963623046875, 0.455657958984375, 0.51495361328125, 0.574249267578125, 0.633544921875, 0.692840576171875, 0.75213623046875, 0.811431884765625, 0.8707275390625, 0.930023193359375, 0.98931884765625, 1.048614501953125, 1.10791015625, 1.167205810546875, 1.22650146484375, 1.285797119140625, 1.3450927734375, 1.404388427734375, 1.46368408203125, 1.522979736328125, 1.582275390625, 1.641571044921875, 1.70086669921875, 1.760162353515625, 1.8194580078125, 1.878753662109375, 1.93804931640625, 1.997344970703125, 2.056640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 15.0, 14.0, 14.0, 34.0, 20.0, 40.0, 56.0, 57.0, 66.0, 77.0, 55.0, 63.0, 75.0, 75.0, 59.0, 64.0, 46.0, 38.0, 28.0, 32.0, 18.0, 17.0, 10.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.650970458984375, -1.60174560546875, -1.552520751953125, -1.5032958984375, -1.454071044921875, -1.40484619140625, -1.355621337890625, -1.306396484375, -1.257171630859375, -1.20794677734375, -1.158721923828125, -1.1094970703125, -1.060272216796875, -1.01104736328125, -0.961822509765625, -0.91259765625, -0.863372802734375, -0.81414794921875, -0.764923095703125, -0.7156982421875, -0.666473388671875, -0.61724853515625, -0.568023681640625, -0.518798828125, -0.469573974609375, -0.42034912109375, -0.371124267578125, -0.3218994140625, -0.272674560546875, -0.22344970703125, -0.174224853515625, -0.125, -0.075775146484375, -0.02655029296875, 0.022674560546875, 0.0718994140625, 0.121124267578125, 0.17034912109375, 0.219573974609375, 0.268798828125, 0.318023681640625, 0.36724853515625, 0.416473388671875, 0.4656982421875, 0.514923095703125, 0.56414794921875, 0.613372802734375, 0.66259765625, 0.711822509765625, 0.76104736328125, 0.810272216796875, 0.8594970703125, 0.908721923828125, 0.95794677734375, 1.007171630859375, 1.056396484375, 1.105621337890625, 1.15484619140625, 1.204071044921875, 1.2532958984375, 1.302520751953125, 1.35174560546875, 1.400970458984375, 1.4501953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 10.0, 7.0, 12.0, 17.0, 21.0, 28.0, 20.0, 29.0, 64.0, 58.0, 94.0, 167.0, 252.0, 458.0, 904.0, 2290.0, 8367.0, 47046.0, 875350.0, 95206.0, 12592.0, 3076.0, 1083.0, 546.0, 281.0, 194.0, 119.0, 85.0, 45.0, 36.0, 15.0, 14.0, 12.0, 17.0, 8.0, 8.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.05029296875, -1.9833984375, -1.91650390625, -1.849609375, -1.78271484375, -1.7158203125, -1.64892578125, -1.58203125, -1.51513671875, -1.4482421875, -1.38134765625, -1.314453125, -1.24755859375, -1.1806640625, -1.11376953125, -1.046875, -0.97998046875, -0.9130859375, -0.84619140625, -0.779296875, -0.71240234375, -0.6455078125, -0.57861328125, -0.51171875, -0.44482421875, -0.3779296875, -0.31103515625, -0.244140625, -0.17724609375, -0.1103515625, -0.04345703125, 0.0234375, 0.09033203125, 0.1572265625, 0.22412109375, 0.291015625, 0.35791015625, 0.4248046875, 0.49169921875, 0.55859375, 0.62548828125, 0.6923828125, 0.75927734375, 0.826171875, 0.89306640625, 0.9599609375, 1.02685546875, 1.09375, 1.16064453125, 1.2275390625, 1.29443359375, 1.361328125, 1.42822265625, 1.4951171875, 1.56201171875, 1.62890625, 1.69580078125, 1.7626953125, 1.82958984375, 1.896484375, 1.96337890625, 2.0302734375, 2.09716796875, 2.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 12.0, 10.0, 4.0, 15.0, 17.0, 16.0, 20.0, 14.0, 37.0, 32.0, 38.0, 39.0, 54.0, 60.0, 62.0, 86.0, 83.0, 71.0, 40.0, 41.0, 52.0, 22.0, 33.0, 18.0, 20.0, 16.0, 19.0, 14.0, 10.0, 6.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.08319091796875, -3.9437255859375, -3.80426025390625, -3.664794921875, -3.52532958984375, -3.3858642578125, -3.24639892578125, -3.10693359375, -2.96746826171875, -2.8280029296875, -2.68853759765625, -2.549072265625, -2.40960693359375, -2.2701416015625, -2.13067626953125, -1.9912109375, -1.85174560546875, -1.7122802734375, -1.57281494140625, -1.433349609375, -1.29388427734375, -1.1544189453125, -1.01495361328125, -0.87548828125, -0.73602294921875, -0.5965576171875, -0.45709228515625, -0.317626953125, -0.17816162109375, -0.0386962890625, 0.10076904296875, 0.240234375, 0.37969970703125, 0.5191650390625, 0.65863037109375, 0.798095703125, 0.93756103515625, 1.0770263671875, 1.21649169921875, 1.35595703125, 1.49542236328125, 1.6348876953125, 1.77435302734375, 1.913818359375, 2.05328369140625, 2.1927490234375, 2.33221435546875, 2.4716796875, 2.61114501953125, 2.7506103515625, 2.89007568359375, 3.029541015625, 3.16900634765625, 3.3084716796875, 3.44793701171875, 3.58740234375, 3.72686767578125, 3.8663330078125, 4.00579833984375, 4.145263671875, 4.28472900390625, 4.4241943359375, 4.56365966796875, 4.703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 20.0, 28.0, 36.0, 58.0, 117.0, 201.0, 484.0, 1081.0, 2852.0, 11957.0, 123865.0, 873987.0, 25880.0, 4924.0, 1552.0, 681.0, 342.0, 186.0, 93.0, 62.0, 33.0, 29.0, 10.0, 6.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5861968994140625, -0.567413330078125, -0.5486297607421875, -0.52984619140625, -0.5110626220703125, -0.492279052734375, -0.4734954833984375, -0.4547119140625, -0.4359283447265625, -0.417144775390625, -0.3983612060546875, -0.37957763671875, -0.3607940673828125, -0.342010498046875, -0.3232269287109375, -0.304443359375, -0.2856597900390625, -0.266876220703125, -0.2480926513671875, -0.22930908203125, -0.2105255126953125, -0.191741943359375, -0.1729583740234375, -0.1541748046875, -0.1353912353515625, -0.116607666015625, -0.0978240966796875, -0.07904052734375, -0.0602569580078125, -0.041473388671875, -0.0226898193359375, -0.00390625, 0.0148773193359375, 0.033660888671875, 0.0524444580078125, 0.07122802734375, 0.0900115966796875, 0.108795166015625, 0.1275787353515625, 0.1463623046875, 0.1651458740234375, 0.183929443359375, 0.2027130126953125, 0.22149658203125, 0.2402801513671875, 0.259063720703125, 0.2778472900390625, 0.296630859375, 0.3154144287109375, 0.334197998046875, 0.3529815673828125, 0.37176513671875, 0.3905487060546875, 0.409332275390625, 0.4281158447265625, 0.4468994140625, 0.4656829833984375, 0.484466552734375, 0.5032501220703125, 0.52203369140625, 0.5408172607421875, 0.559600830078125, 0.5783843994140625, 0.59716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 14.0, 16.0, 18.0, 30.0, 65.0, 87.0, 163.0, 212.0, 130.0, 72.0, 42.0, 23.0, 16.0, 17.0, 4.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015616416931152344, -0.00015132129192352295, -0.00014647841453552246, -0.00014163553714752197, -0.00013679265975952148, -0.000131949782371521, -0.0001271069049835205, -0.00012226402759552002, -0.00011742115020751953, -0.00011257827281951904, -0.00010773539543151855, -0.00010289251804351807, -9.804964065551758e-05, -9.320676326751709e-05, -8.83638858795166e-05, -8.352100849151611e-05, -7.867813110351562e-05, -7.383525371551514e-05, -6.899237632751465e-05, -6.414949893951416e-05, -5.930662155151367e-05, -5.4463744163513184e-05, -4.9620866775512695e-05, -4.477798938751221e-05, -3.993511199951172e-05, -3.509223461151123e-05, -3.0249357223510742e-05, -2.5406479835510254e-05, -2.0563602447509766e-05, -1.5720725059509277e-05, -1.0877847671508789e-05, -6.034970283508301e-06, -1.1920928955078125e-06, 3.6507844924926758e-06, 8.493661880493164e-06, 1.3336539268493652e-05, 1.817941665649414e-05, 2.302229404449463e-05, 2.7865171432495117e-05, 3.2708048820495605e-05, 3.7550926208496094e-05, 4.239380359649658e-05, 4.723668098449707e-05, 5.207955837249756e-05, 5.692243576049805e-05, 6.176531314849854e-05, 6.660819053649902e-05, 7.145106792449951e-05, 7.62939453125e-05, 8.113682270050049e-05, 8.597970008850098e-05, 9.082257747650146e-05, 9.566545486450195e-05, 0.00010050833225250244, 0.00010535120964050293, 0.00011019408702850342, 0.0001150369644165039, 0.0001198798418045044, 0.00012472271919250488, 0.00012956559658050537, 0.00013440847396850586, 0.00013925135135650635, 0.00014409422874450684, 0.00014893710613250732, 0.0001537799835205078]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 6.0, 11.0, 10.0, 12.0, 24.0, 27.0, 42.0, 61.0, 73.0, 118.0, 231.0, 398.0, 857.0, 1994.0, 5891.0, 22246.0, 204285.0, 770120.0, 30130.0, 7267.0, 2477.0, 1041.0, 511.0, 226.0, 142.0, 98.0, 66.0, 41.0, 37.0, 19.0, 12.0, 8.0, 8.0, 9.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.59326171875, -0.5758590698242188, -0.5584564208984375, -0.5410537719726562, -0.523651123046875, -0.5062484741210938, -0.4888458251953125, -0.47144317626953125, -0.45404052734375, -0.43663787841796875, -0.4192352294921875, -0.40183258056640625, -0.384429931640625, -0.36702728271484375, -0.3496246337890625, -0.33222198486328125, -0.3148193359375, -0.29741668701171875, -0.2800140380859375, -0.26261138916015625, -0.245208740234375, -0.22780609130859375, -0.2104034423828125, -0.19300079345703125, -0.17559814453125, -0.15819549560546875, -0.1407928466796875, -0.12339019775390625, -0.105987548828125, -0.08858489990234375, -0.0711822509765625, -0.05377960205078125, -0.036376953125, -0.01897430419921875, -0.0015716552734375, 0.01583099365234375, 0.033233642578125, 0.05063629150390625, 0.0680389404296875, 0.08544158935546875, 0.10284423828125, 0.12024688720703125, 0.1376495361328125, 0.15505218505859375, 0.172454833984375, 0.18985748291015625, 0.2072601318359375, 0.22466278076171875, 0.2420654296875, 0.25946807861328125, 0.2768707275390625, 0.29427337646484375, 0.311676025390625, 0.32907867431640625, 0.3464813232421875, 0.36388397216796875, 0.38128662109375, 0.39868927001953125, 0.4160919189453125, 0.43349456787109375, 0.450897216796875, 0.46829986572265625, 0.4857025146484375, 0.5031051635742188, 0.5205078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 11.0, 11.0, 14.0, 29.0, 22.0, 34.0, 65.0, 91.0, 136.0, 148.0, 138.0, 91.0, 52.0, 41.0, 23.0, 18.0, 15.0, 13.0, 6.0, 7.0, 8.0, 6.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.787109375, -0.7660140991210938, -0.7449188232421875, -0.7238235473632812, -0.702728271484375, -0.6816329956054688, -0.6605377197265625, -0.6394424438476562, -0.61834716796875, -0.5972518920898438, -0.5761566162109375, -0.5550613403320312, -0.533966064453125, -0.5128707885742188, -0.4917755126953125, -0.47068023681640625, -0.4495849609375, -0.42848968505859375, -0.4073944091796875, -0.38629913330078125, -0.365203857421875, -0.34410858154296875, -0.3230133056640625, -0.30191802978515625, -0.28082275390625, -0.25972747802734375, -0.2386322021484375, -0.21753692626953125, -0.196441650390625, -0.17534637451171875, -0.1542510986328125, -0.13315582275390625, -0.112060546875, -0.09096527099609375, -0.0698699951171875, -0.04877471923828125, -0.027679443359375, -0.00658416748046875, 0.0145111083984375, 0.03560638427734375, 0.05670166015625, 0.07779693603515625, 0.0988922119140625, 0.11998748779296875, 0.141082763671875, 0.16217803955078125, 0.1832733154296875, 0.20436859130859375, 0.2254638671875, 0.24655914306640625, 0.2676544189453125, 0.28874969482421875, 0.309844970703125, 0.33094024658203125, 0.3520355224609375, 0.37313079833984375, 0.39422607421875, 0.41532135009765625, 0.4364166259765625, 0.45751190185546875, 0.478607177734375, 0.49970245361328125, 0.5207977294921875, 0.5418930053710938, 0.56298828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 10.0, 37.0, 102.0, 646.0, 159.0, 31.0, 13.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.45219421386719, -54.08751678466797, -52.72283935546875, -51.35816192626953, -49.99348449707031, -48.62881088256836, -47.26413345336914, -45.89945602416992, -44.5347785949707, -43.170101165771484, -41.805423736572266, -40.44074630737305, -39.076072692871094, -37.711395263671875, -36.346717834472656, -34.98204040527344, -33.61736297607422, -32.252685546875, -30.88800811767578, -29.523332595825195, -28.158655166625977, -26.793977737426758, -25.429302215576172, -24.064624786376953, -22.699947357177734, -21.335269927978516, -19.970592498779297, -18.60591697692871, -17.241239547729492, -15.876562118530273, -14.511885643005371, -13.147209167480469, -11.78253173828125, -10.417854309082031, -9.053177833557129, -7.688500881195068, -6.323823928833008, -4.959146976470947, -3.5944700241088867, -2.2297935485839844, -0.8651161193847656, 0.4995608329772949, 1.8642377853393555, 3.228914737701416, 4.593591690063477, 5.958268642425537, 7.322945594787598, 8.6876220703125, 10.052299499511719, 11.416976928710938, 12.78165340423584, 14.146329879760742, 15.511007308959961, 16.87568473815918, 18.240360260009766, 19.605037689208984, 20.969715118408203, 22.334392547607422, 23.69906997680664, 25.063745498657227, 26.428422927856445, 27.793100357055664, 29.15777587890625, 30.52245330810547, 31.887130737304688]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 5.0, 11.0, 8.0, 15.0, 14.0, 17.0, 21.0, 30.0, 28.0, 42.0, 44.0, 91.0, 160.0, 142.0, 110.0, 57.0, 28.0, 21.0, 21.0, 18.0, 21.0, 14.0, 17.0, 7.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.148698806762695, -11.71694564819336, -11.285191535949707, -10.853438377380371, -10.421685218811035, -9.989931106567383, -9.558177947998047, -9.126424789428711, -8.694670677185059, -8.262917518615723, -7.8311638832092285, -7.399410247802734, -6.96765661239624, -6.535902976989746, -6.10414981842041, -5.672396183013916, -5.24064302444458, -4.808889389038086, -4.37713623046875, -3.945382595062256, -3.5136289596557617, -3.0818755626678467, -2.6501221656799316, -2.2183685302734375, -1.7866151332855225, -1.3548616170883179, -0.9231081604957581, -0.49135470390319824, -0.05960118770599365, 0.37215232849121094, 0.803905725479126, 1.2356593608856201, 1.6674127578735352, 2.09916615486145, 2.5309197902679443, 2.9626731872558594, 3.3944268226623535, 3.8261802196502686, 4.257933616638184, 4.689687252044678, 5.121440887451172, 5.553194522857666, 5.984947681427002, 6.416701316833496, 6.84845495223999, 7.280208587646484, 7.71196174621582, 8.143714904785156, 8.575468063354492, 9.007221221923828, 9.43897533416748, 9.870728492736816, 10.302481651306152, 10.734235763549805, 11.16598892211914, 11.597742080688477, 12.029496192932129, 12.461249351501465, 12.893003463745117, 13.324756622314453, 13.756509780883789, 14.188263893127441, 14.620017051696777, 15.05177116394043, 15.483524322509766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 10.0, 10.0, 12.0, 18.0, 10.0, 20.0, 32.0, 37.0, 32.0, 41.0, 37.0, 76.0, 112.0, 168.0, 90.0, 41.0, 37.0, 35.0, 29.0, 31.0, 15.0, 16.0, 19.0, 11.0, 12.0, 6.0, 4.0, 3.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3515625, -1.315277099609375, -1.27899169921875, -1.242706298828125, -1.2064208984375, -1.170135498046875, -1.13385009765625, -1.097564697265625, -1.061279296875, -1.024993896484375, -0.98870849609375, -0.952423095703125, -0.9161376953125, -0.879852294921875, -0.84356689453125, -0.807281494140625, -0.77099609375, -0.734710693359375, -0.69842529296875, -0.662139892578125, -0.6258544921875, -0.589569091796875, -0.55328369140625, -0.516998291015625, -0.480712890625, -0.444427490234375, -0.40814208984375, -0.371856689453125, -0.3355712890625, -0.299285888671875, -0.26300048828125, -0.226715087890625, -0.1904296875, -0.154144287109375, -0.11785888671875, -0.081573486328125, -0.0452880859375, -0.009002685546875, 0.02728271484375, 0.063568115234375, 0.099853515625, 0.136138916015625, 0.17242431640625, 0.208709716796875, 0.2449951171875, 0.281280517578125, 0.31756591796875, 0.353851318359375, 0.39013671875, 0.426422119140625, 0.46270751953125, 0.498992919921875, 0.5352783203125, 0.571563720703125, 0.60784912109375, 0.644134521484375, 0.680419921875, 0.716705322265625, 0.75299072265625, 0.789276123046875, 0.8255615234375, 0.861846923828125, 0.89813232421875, 0.934417724609375, 0.970703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 10.0, 24.0, 15.0, 30.0, 52.0, 83.0, 182.0, 581.0, 2712.0, 86225.0, 8292955.0, 4342.0, 812.0, 250.0, 99.0, 54.0, 42.0, 21.0, 9.0, 13.0, 13.0, 7.0, 7.0, 9.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.000646591186523, -11.573607444763184, -11.14656925201416, -10.71953010559082, -10.29249095916748, -9.86545181274414, -9.438413619995117, -9.011374473571777, -8.584335327148438, -8.157296180725098, -7.730257511138916, -7.303218841552734, -6.8761796951293945, -6.449141025543213, -6.022102355957031, -5.595063209533691, -5.168025016784668, -4.740986347198486, -4.3139472007751465, -3.886908531188965, -3.459869623184204, -3.0328307151794434, -2.6057920455932617, -2.178753137588501, -1.7517142295837402, -1.3246753215789795, -0.8976365327835083, -0.4705977439880371, -0.04355883598327637, 0.3834800720214844, 0.810518741607666, 1.2375576496124268, 1.664597511291504, 2.0916364192962646, 2.5186753273010254, 2.945713996887207, 3.3727529048919678, 3.7997918128967285, 4.22683048248291, 4.65386962890625, 5.080908298492432, 5.507946968078613, 5.934986114501953, 6.362024784088135, 6.789063453674316, 7.216102600097656, 7.643141269683838, 8.07017993927002, 8.49721908569336, 8.9242582321167, 9.351296424865723, 9.778335571289062, 10.205374717712402, 10.632413864135742, 11.059452056884766, 11.486491203308105, 11.913530349731445, 12.340569496154785, 12.767607688903809, 13.194646835327148, 13.621685981750488, 14.048725128173828, 14.475763320922852, 14.902802467346191, 15.329840660095215]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 3.0, 8.0, 3.0, 0.0, 6.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.251260757446289, -10.830163955688477, -10.409067153930664, -9.987969398498535, -9.566872596740723, -9.14577579498291, -8.724678039550781, -8.303581237792969, -7.882484436035156, -7.461387634277344, -7.040290355682373, -6.619193077087402, -6.19809627532959, -5.776999473571777, -5.355902194976807, -4.934804916381836, -4.513708114624023, -4.092611312866211, -3.6715140342712402, -3.2504169940948486, -2.829319953918457, -2.4082229137420654, -1.9871258735656738, -1.5660288333892822, -1.1449317932128906, -0.723834753036499, -0.3027377128601074, 0.11835932731628418, 0.5394563674926758, 0.9605534076690674, 1.381650447845459, 1.8027474880218506, 2.223844528198242, 2.644941568374634, 3.0660386085510254, 3.487135648727417, 3.9082326889038086, 4.329329490661621, 4.750426769256592, 5.1715240478515625, 5.592620849609375, 6.0137176513671875, 6.434814929962158, 6.855912208557129, 7.277009010314941, 7.698105812072754, 8.119203567504883, 8.540300369262695, 8.961397171020508, 9.38249397277832, 9.803590774536133, 10.224688529968262, 10.645785331726074, 11.066882133483887, 11.487979888916016, 11.909076690673828, 12.33017349243164, 12.751270294189453, 13.172367095947266, 13.593464851379395, 14.014561653137207, 14.43565845489502, 14.856756210327148, 15.277853012084961, 15.698949813842773]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 20.0, 21.0, 22.0, 31.0, 53.0, 43.0, 55.0, 64.0, 81.0, 69.0, 78.0, 74.0, 67.0, 62.0, 41.0, 36.0, 32.0, 22.0, 25.0, 15.0, 15.0, 13.0, 11.0, 11.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.840667724609375, -0.81024169921875, -0.779815673828125, -0.7493896484375, -0.718963623046875, -0.68853759765625, -0.658111572265625, -0.627685546875, -0.597259521484375, -0.56683349609375, -0.536407470703125, -0.5059814453125, -0.475555419921875, -0.44512939453125, -0.414703369140625, -0.38427734375, -0.353851318359375, -0.32342529296875, -0.292999267578125, -0.2625732421875, -0.232147216796875, -0.20172119140625, -0.171295166015625, -0.140869140625, -0.110443115234375, -0.08001708984375, -0.049591064453125, -0.0191650390625, 0.011260986328125, 0.04168701171875, 0.072113037109375, 0.1025390625, 0.132965087890625, 0.16339111328125, 0.193817138671875, 0.2242431640625, 0.254669189453125, 0.28509521484375, 0.315521240234375, 0.345947265625, 0.376373291015625, 0.40679931640625, 0.437225341796875, 0.4676513671875, 0.498077392578125, 0.52850341796875, 0.558929443359375, 0.58935546875, 0.619781494140625, 0.65020751953125, 0.680633544921875, 0.7110595703125, 0.741485595703125, 0.77191162109375, 0.802337646484375, 0.832763671875, 0.863189697265625, 0.89361572265625, 0.924041748046875, 0.9544677734375, 0.984893798828125, 1.01531982421875, 1.045745849609375, 1.076171875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 14.0, 9.0, 20.0, 27.0, 52.0, 55.0, 89.0, 167.0, 302.0, 574.0, 1114.0, 2620.0, 6403.0, 17783.0, 53107.0, 150798.0, 179664.0, 70505.0, 24606.0, 9225.0, 3748.0, 1676.0, 761.0, 392.0, 245.0, 120.0, 68.0, 46.0, 24.0, 14.0, 9.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.89666748046875, -7.6839599609375, -7.47125244140625, -7.258544921875, -7.04583740234375, -6.8331298828125, -6.62042236328125, -6.40771484375, -6.19500732421875, -5.9822998046875, -5.76959228515625, -5.556884765625, -5.34417724609375, -5.1314697265625, -4.91876220703125, -4.7060546875, -4.49334716796875, -4.2806396484375, -4.06793212890625, -3.855224609375, -3.64251708984375, -3.4298095703125, -3.21710205078125, -3.00439453125, -2.79168701171875, -2.5789794921875, -2.36627197265625, -2.153564453125, -1.94085693359375, -1.7281494140625, -1.51544189453125, -1.302734375, -1.09002685546875, -0.8773193359375, -0.66461181640625, -0.451904296875, -0.23919677734375, -0.0264892578125, 0.18621826171875, 0.39892578125, 0.61163330078125, 0.8243408203125, 1.03704833984375, 1.249755859375, 1.46246337890625, 1.6751708984375, 1.88787841796875, 2.1005859375, 2.31329345703125, 2.5260009765625, 2.73870849609375, 2.951416015625, 3.16412353515625, 3.3768310546875, 3.58953857421875, 3.80224609375, 4.01495361328125, 4.2276611328125, 4.44036865234375, 4.653076171875, 4.86578369140625, 5.0784912109375, 5.29119873046875, 5.50390625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 6.0, 5.0, 9.0, 9.0, 10.0, 19.0, 21.0, 37.0, 37.0, 26.0, 41.0, 44.0, 62.0, 57.0, 81.0, 63.0, 69.0, 61.0, 53.0, 42.0, 39.0, 42.0, 28.0, 28.0, 20.0, 17.0, 17.0, 5.0, 10.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1376953125, -1.10296630859375, -1.0682373046875, -1.03350830078125, -0.998779296875, -0.96405029296875, -0.9293212890625, -0.89459228515625, -0.85986328125, -0.82513427734375, -0.7904052734375, -0.75567626953125, -0.720947265625, -0.68621826171875, -0.6514892578125, -0.61676025390625, -0.58203125, -0.54730224609375, -0.5125732421875, -0.47784423828125, -0.443115234375, -0.40838623046875, -0.3736572265625, -0.33892822265625, -0.30419921875, -0.26947021484375, -0.2347412109375, -0.20001220703125, -0.165283203125, -0.13055419921875, -0.0958251953125, -0.06109619140625, -0.0263671875, 0.00836181640625, 0.0430908203125, 0.07781982421875, 0.112548828125, 0.14727783203125, 0.1820068359375, 0.21673583984375, 0.25146484375, 0.28619384765625, 0.3209228515625, 0.35565185546875, 0.390380859375, 0.42510986328125, 0.4598388671875, 0.49456787109375, 0.529296875, 0.56402587890625, 0.5987548828125, 0.63348388671875, 0.668212890625, 0.70294189453125, 0.7376708984375, 0.77239990234375, 0.80712890625, 0.84185791015625, 0.8765869140625, 0.91131591796875, 0.946044921875, 0.98077392578125, 1.0155029296875, 1.05023193359375, 1.0849609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 6.0, 4.0, 4.0, 9.0, 15.0, 15.0, 37.0, 21.0, 40.0, 52.0, 56.0, 66.0, 40.0, 28.0, 20.0, 18.0, 12.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.822357177734375, -7.621732711791992, -7.421108245849609, -7.220483303070068, -7.0198588371276855, -6.819234371185303, -6.61860990524292, -6.417984962463379, -6.217360496520996, -6.016736030578613, -5.8161115646362305, -5.6154866218566895, -5.414862155914307, -5.214237689971924, -5.013613224029541, -4.81298828125, -4.612363815307617, -4.411739349365234, -4.211114883422852, -4.0104899406433105, -3.8098654747009277, -3.609241008758545, -3.408616542816162, -3.2079918384552, -3.0073676109313965, -2.8067431449890137, -2.6061184406280518, -2.405493974685669, -2.204869270324707, -2.004244804382324, -1.8036202192306519, -1.6029956340789795, -1.4023709297180176, -1.2017463445663452, -1.0011217594146729, -0.8004972338676453, -0.5998726487159729, -0.3992481231689453, -0.19862353801727295, 0.002001047134399414, 0.20262563228607178, 0.40325021743774414, 0.6038748025894165, 0.8044993281364441, 1.0051238536834717, 1.205748438835144, 1.4063730239868164, 1.6069976091384888, 1.8076221942901611, 2.008246660232544, 2.208871364593506, 2.4094958305358887, 2.6101205348968506, 2.8107450008392334, 3.0113697052001953, 3.211994171142578, 3.412618637084961, 3.6132431030273438, 3.8138678073883057, 4.014492511749268, 4.21511697769165, 4.415741443634033, 4.616365909576416, 4.816990852355957, 5.01761531829834]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 15.0, 5.0, 8.0, 17.0, 21.0, 32.0, 45.0, 74.0, 70.0, 62.0, 41.0, 21.0, 16.0, 11.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.803354263305664, -11.522051811218262, -11.24074935913086, -10.959447860717773, -10.678145408630371, -10.396842956542969, -10.115540504455566, -9.834238052368164, -9.552936553955078, -9.271634101867676, -8.990331649780273, -8.709030151367188, -8.427727699279785, -8.146425247192383, -7.8651227951049805, -7.583820819854736, -7.302518367767334, -7.021215915679932, -6.7399139404296875, -6.458611488342285, -6.177309513092041, -5.896007061004639, -5.6147050857543945, -5.333402633666992, -5.05210018157959, -4.7707977294921875, -4.489495754241943, -4.208193302154541, -3.926891326904297, -3.6455888748168945, -3.3642866611480713, -3.082984447479248, -2.801682472229004, -2.5203802585601807, -2.2390780448913574, -1.9577757120132446, -1.6764734983444214, -1.3951712846755981, -1.1138689517974854, -0.8325667381286621, -0.5512645244598389, -0.26996228098869324, 0.011339962482452393, 0.2926422357559204, 0.5739444494247437, 0.8552466630935669, 1.1365489959716797, 1.417851209640503, 1.6991534233093262, 1.9804556369781494, 2.2617578506469727, 2.543060302734375, 2.824362277984619, 3.1056647300720215, 3.3869669437408447, 3.668269157409668, 3.949571371078491, 4.2308735847473145, 4.512176036834717, 4.793478012084961, 5.074780464172363, 5.356082439422607, 5.63738489151001, 5.918686866760254, 6.199989318847656]}, "eval/loss": 1.7438108921051025, "eval/wer": 1.471360571201904, "eval/runtime": 1557.2283, "eval/samples_per_second": 1.697, "eval/steps_per_second": 0.213, "train/train_runtime": 115954.4449, "train/train_samples_per_second": 4.922, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 1.0593869240786682} \ No newline at end of file